{"0": {"caption": "a photo of a black cat and a white cat ", "segment": [{"bbox": [0.127859375, 0.466743648960739, 0.691125, 0.7394688221709007], "label": "a black cat"}, {"bbox": [0.542578125, 0.5063741339491916, 0.8065468750000001, 0.7475750577367205], "label": "a white cat"}], "image_id": "500084"}, "1": {"caption": "a photo of a red bird and a red bird ", "segment": [{"bbox": [0.46834375, 0.4154583333333333, 0.7821875, 0.6729583333333333], "label": "a red bird"}, {"bbox": [0.148390625, 0.26237499999999997, 0.42096874999999995, 0.47312499999999996], "label": "a red bird"}], "image_id": "74711"}, "2": {"caption": "a photo of a brown apple and a blue banana and a yellow banana and a blue banana and a yellow banana and a black banana ", "segment": [{"bbox": [0.12285416666666667, 0.52546875, 1.0, 0.9838906250000001], "label": "a brown apple"}, {"bbox": [0.4005, 0.014359374999999999, 0.6088958333333333, 0.230265625], "label": "a blue banana"}, {"bbox": [0.14681249999999998, 0.02471875, 0.38052083333333336, 0.2], "label": "a yellow banana"}, {"bbox": [0.0039791666666666664, 0.034765625, 0.1595625, 0.211375], "label": "a blue banana"}, {"bbox": [0.2485, 0.318921875, 0.40875, 0.484125], "label": "a yellow banana"}, {"bbox": [0.5778125000000001, 0.301125, 0.7125625000000001, 0.454484375], "label": "a black banana"}], "image_id": "329533"}, "3": {"caption": "a photo of a black knife and a brown pizza and a black bowl and a brown bowl and a yellow dining table ", "segment": [{"bbox": [0.701609375, 0.6870083102493074, 0.92621875, 0.9937119113573407], "label": "a black knife"}, {"bbox": [0.241921875, 0.022022160664819945, 0.845453125, 0.7737119113573407], "label": "a brown pizza"}, {"bbox": [0.31403125, 0.6451246537396121, 0.522390625, 0.9459002770083101], "label": "a black bowl"}, {"bbox": [0.141890625, 0.5285318559556788, 0.354984375, 0.8153462603878118], "label": "a brown bowl"}, {"bbox": [0.004390625, 0.002880886426592798, 1.0, 0.9899445983379501], "label": "a yellow dining table"}], "image_id": "170038"}, "4": {"caption": "a photo of a red backpack and a brown suitcase and a yellow suitcase and a yellow suitcase ", "segment": [{"bbox": [0.559921875, 0.19249307479224376, 0.759859375, 0.582409972299169], "label": "a red backpack"}, {"bbox": [0.455046875, 0.6112465373961219, 0.675609375, 0.9887534626038781], "label": "a brown suitcase"}, {"bbox": [0.553921875, 0.4760387811634349, 0.7035, 0.8265927977839335], "label": "a yellow suitcase"}, {"bbox": [0.69871875, 0.09908587257617729, 0.8245000000000001, 0.4504432132963989], "label": "a yellow suitcase"}], "image_id": "206112"}, "5": {"caption": "a photo of a brown sheep and a yellow chair and a brown chair ", "segment": [{"bbox": [0.11604215456674473, 0.511828125, 0.9347540983606557, 0.82365625], "label": "a brown sheep"}, {"bbox": [0.10929742388758783, 0.744796875, 0.9562763466042156, 0.984375], "label": "a yellow chair"}, {"bbox": [0.19081967213114756, 0.43020312499999996, 0.8707494145199063, 0.619328125], "label": "a brown chair"}], "image_id": "504256"}, "6": {"caption": "a photo of a red bed and a brown potted plant and a yellow potted plant ", "segment": [{"bbox": [0.12, 0.40089184060721067, 0.860359375, 1.0], "label": "a red bed"}, {"bbox": [0.8041874999999999, 0.7792220113851992, 1.0, 0.9740227703984818], "label": "a brown potted plant"}, {"bbox": [0.0, 0.0, 0.392078125, 1.0], "label": "a yellow potted plant"}], "image_id": "380597"}, "7": {"caption": "a photo of a white oven and a white bowl ", "segment": [{"bbox": [0.5124375, 0.2016388888888889, 0.648125, 0.47330555555555553], "label": "a white oven"}, {"bbox": [0.6543593750000001, 0.5684444444444444, 0.795296875, 0.73175], "label": "a white bowl"}], "image_id": "425569"}, "8": {"caption": "a photo of a black chair and a green chair and a white couch and a white dining table and a black bench and a brown book ", "segment": [{"bbox": [0.094875, 0.6113451776649746, 0.26487499999999997, 1.0], "label": "a black chair"}, {"bbox": [0.87078125, 0.6038071065989847, 1.0, 0.8277664974619289], "label": "a green chair"}, {"bbox": [0.668203125, 0.4482233502538071, 0.9546093750000001, 0.621015228426396], "label": "a white couch"}, {"bbox": [0.072421875, 0.48000000000000004, 0.38965625, 0.7058883248730965], "label": "a white dining table"}, {"bbox": [0.27390625, 0.5378172588832487, 0.45148437500000005, 0.8558375634517766], "label": "a black bench"}, {"bbox": [0.040625, 0.13959390862944163, 0.2171875, 0.7208121827411168], "label": "a brown book"}], "image_id": "340175"}, "9": {"caption": "a photo of a green umbrella and a green chair and a brown chair and a blue chair and a yellow chair and a blue umbrella ", "segment": [{"bbox": [0.07415625, 0.009145833333333332, 0.9, 0.3574583333333333], "label": "a green umbrella"}, {"bbox": [0.302203125, 0.54825, 0.5666718749999999, 0.9411458333333333], "label": "a green chair"}, {"bbox": [0.094125, 0.5570833333333333, 0.254640625, 0.8197916666666667], "label": "a brown chair"}, {"bbox": [0.27478125000000003, 0.5605416666666667, 0.43165624999999996, 0.808125], "label": "a blue chair"}, {"bbox": [0.0, 0.7011875, 0.150984375, 0.9566874999999999], "label": "a yellow chair"}, {"bbox": [0.0016875000000000002, 0.23108333333333334, 0.143265625, 0.38614583333333335], "label": "a blue umbrella"}], "image_id": "328403"}, "10": {"caption": "a photo of a red cat and a yellow chair and a white bicycle ", "segment": [{"bbox": [0.33475, 0.3480416666666667, 0.6797500000000001, 0.6467708333333333], "label": "a red cat"}, {"bbox": [0.732328125, 0.0, 0.998921875, 0.4971041666666667], "label": "a yellow chair"}, {"bbox": [0.004, 0.0010416666666666667, 0.961921875, 0.6948124999999999], "label": "a white bicycle"}], "image_id": "458119"}, "11": {"caption": "a photo of a red motorcycle and a brown motorcycle and a blue motorcycle ", "segment": [{"bbox": [0.5143541666666667, 0.22040625, 0.8599583333333333, 0.614671875], "label": "a red motorcycle"}, {"bbox": [0.4234375, 0.222171875, 0.6568958333333333, 0.5005625], "label": "a brown motorcycle"}, {"bbox": [0.7114999999999999, 0.136765625, 1.0, 0.825109375], "label": "a blue motorcycle"}], "image_id": "421952"}, "12": {"caption": "a photo of a white boat and a red boat ", "segment": [{"bbox": [0.05421875, 0.4264814814814815, 0.45354687499999996, 0.8404398148148149], "label": "a white boat"}, {"bbox": [0.44340624999999995, 0.4285185185185185, 1.0, 0.9154166666666668], "label": "a red boat"}], "image_id": "199125"}, "13": {"caption": "a photo of a white donut and a white bowl ", "segment": [{"bbox": [0.1824375, 0.17454166666666668, 0.8800625, 0.8862708333333332], "label": "a white donut"}, {"bbox": [0.292203125, 0.0026041666666666665, 0.6915625000000001, 0.15843749999999998], "label": "a white bowl"}], "image_id": "310200"}, "14": {"caption": "a photo of a green couch and a black bed ", "segment": [{"bbox": [0.0008437500000000001, 0.4813958333333333, 0.57815625, 1.0], "label": "a green couch"}, {"bbox": [0.593609375, 0.3318333333333333, 1.0, 0.7331875], "label": "a black bed"}], "image_id": "434417"}, "15": {"caption": "a photo of a black spoon and a brown broccoli and a red broccoli and a red bowl and a yellow oven ", "segment": [{"bbox": [0.792796875, 0.060140515222482434, 0.999609375, 0.37290398126463703], "label": "a black spoon"}, {"bbox": [0.292, 0.4, 0.45996875, 0.5788290398126464], "label": "a brown broccoli"}, {"bbox": [0.363, 0.809976580796253, 0.49684375000000003, 0.9801873536299767], "label": "a red broccoli"}, {"bbox": [0.1454375, 0.020234192037470726, 0.9580468750000002, 0.9887587822014051], "label": "a red bowl"}, {"bbox": [0.007484375, 0.0021311475409836068, 0.42784374999999997, 0.5693911007025761], "label": "a yellow oven"}], "image_id": "550643"}, "16": {"caption": "a photo of a white cat and a white bed ", "segment": [{"bbox": [0.377359375, 0.1295784543325527, 0.9512812499999999, 0.617751756440281], "label": "a white cat"}, {"bbox": [0.0, 0.0, 1.0, 1.0], "label": "a white bed"}], "image_id": "262626"}, "17": {"caption": "a photo of a yellow vase and a red vase and a brown bench ", "segment": [{"bbox": [0.277609375, 0.26448577680525165, 0.5070625, 0.9296498905908097], "label": "a yellow vase"}, {"bbox": [0.6354375, 0.12065645514223194, 0.8985937500000001, 0.9296498905908096], "label": "a red vase"}, {"bbox": [0.0, 0.0, 1.0, 1.0], "label": "a brown bench"}], "image_id": "319687"}, "18": {"caption": "a photo of a black chair and a yellow laptop ", "segment": [{"bbox": [0.5505416666666666, 0.537640625, 1.0, 0.9892499999999999], "label": "a black chair"}, {"bbox": [0.40206250000000004, 0.404203125, 0.6577500000000001, 0.565921875], "label": "a yellow laptop"}], "image_id": "377183"}, "19": {"caption": "a photo of a brown train and a blue train ", "segment": [{"bbox": [0.55640625, 0.2796388888888889, 0.7593593750000001, 0.6371388888888889], "label": "a brown train"}, {"bbox": [0.392859375, 0.31369444444444444, 0.56121875, 0.6220833333333333], "label": "a blue train"}], "image_id": "90560"}, "20": {"caption": "a photo of a green suitcase and a red suitcase and a white suitcase and a blue suitcase ", "segment": [{"bbox": [0.13621900826446282, 0.5175156249999999, 0.8778719008264463, 0.7344687499999999], "label": "a green suitcase"}, {"bbox": [0.11047520661157025, 0.3764375, 0.927293388429752, 0.639734375], "label": "a red suitcase"}, {"bbox": [0.05361570247933884, 0.12162500000000001, 0.9530165289256198, 0.40765624999999994], "label": "a white suitcase"}, {"bbox": [0.02080578512396694, 0.568171875, 0.9746487603305786, 0.9838906250000001], "label": "a blue suitcase"}], "image_id": "411821"}, "21": {"caption": "a photo of a white bird and a white giraffe and a red giraffe ", "segment": [{"bbox": [0.13553125, 0.6815222482435597, 0.333453125, 0.9650351288056206], "label": "a white bird"}, {"bbox": [0.26237499999999997, 0.08088992974238876, 0.953546875, 0.9842622950819673], "label": "a white giraffe"}, {"bbox": [0.0388125, 0.06285714285714286, 0.683609375, 1.0], "label": "a red giraffe"}], "image_id": "424219"}, "22": {"caption": "a photo of a white bowl and a blue broccoli and a red broccoli and a red broccoli ", "segment": [{"bbox": [0.060281249999999995, 0.022426778242677827, 0.9109843750000002, 0.9327405857740586], "label": "a white bowl"}, {"bbox": [0.44520312500000003, 0.3919037656903766, 0.648015625, 0.6023221757322176], "label": "a blue broccoli"}, {"bbox": [0.409765625, 0.013556485355648537, 0.58640625, 0.15830543933054395], "label": "a red broccoli"}, {"bbox": [0.61653125, 0.20165271966527196, 0.801484375, 0.35730125523012557], "label": "a red broccoli"}], "image_id": "543762"}, "23": {"caption": "a photo of a black dining table and a green chair and a red teddy bear and a red teddy bear and a white teddy bear and a yellow teddy bear ", "segment": [{"bbox": [0.006945606694560669, 0.7714218749999999, 0.34081589958159, 0.992203125], "label": "a black dining table"}, {"bbox": [0.2942050209205021, 0.792265625, 0.610857740585774, 1.0], "label": "a green chair"}, {"bbox": [0.512489539748954, 0.146328125, 0.7252719665271967, 0.34990625], "label": "a red teddy bear"}, {"bbox": [0.36299163179916316, 0.673015625, 0.505, 0.812109375], "label": "a red teddy bear"}, {"bbox": [0.26836820083682006, 0.49734375000000003, 0.42148535564853556, 0.625578125], "label": "a white teddy bear"}, {"bbox": [0.38284518828451886, 0.271578125, 0.5087029288702929, 0.41065625], "label": "a yellow teddy bear"}], "image_id": "138573"}, "24": {"caption": "a photo of a yellow cat and a green car ", "segment": [{"bbox": [0.141375, 0.06610416666666667, 1.0, 0.998375], "label": "a yellow cat"}, {"bbox": [0.0035312499999999997, 0.32547916666666665, 1.0, 0.9882083333333334], "label": "a green car"}], "image_id": "38769"}, "25": {"caption": "a photo of a red cat and a black suitcase and a black bed ", "segment": [{"bbox": [0.41600000000000004, 0.4371428571428571, 0.921625, 0.7169086651053864], "label": "a red cat"}, {"bbox": [0.18665625, 0.293559718969555, 0.8576406249999999, 0.9544028103044496], "label": "a black suitcase"}, {"bbox": [0.0693125, 0.025550351288056206, 1.0, 0.9865807962529275], "label": "a black bed"}], "image_id": "324857"}, "26": {"caption": "a photo of a brown cow and a yellow cow and a white motorcycle and a green cow ", "segment": [{"bbox": [0.168625, 0.6309791666666666, 0.37901562499999997, 0.9307708333333333], "label": "a brown cow"}, {"bbox": [0.499140625, 0.6392916666666667, 0.6473437499999999, 0.9879166666666668], "label": "a yellow cow"}, {"bbox": [0.0141875, 0.32077083333333334, 0.14240625, 0.5726875], "label": "a white motorcycle"}, {"bbox": [0.54540625, 0.5636875, 0.71521875, 0.8270625], "label": "a green cow"}], "image_id": "195800"}, "27": {"caption": "a photo of a brown umbrella and a black bench and a yellow bench and a green chair and a red dining table and a black chair ", "segment": [{"bbox": [0.15281045751633987, 0.09818627450980393, 0.946062091503268, 0.4195424836601307], "label": "a brown umbrella"}, {"bbox": [0.03132352941176471, 0.6937254901960784, 0.6845588235294118, 0.9823202614379086], "label": "a black bench"}, {"bbox": [0.03145424836601307, 0.7325816993464052, 0.2269607843137255, 0.9303431372549019], "label": "a yellow bench"}, {"bbox": [0.6489542483660131, 0.7777124183006535, 0.8925000000000001, 0.9635620915032679], "label": "a green chair"}, {"bbox": [0.040326797385620915, 0.7013562091503268, 0.6735620915032681, 0.9672875816993465], "label": "a red dining table"}, {"bbox": [0.031094771241830067, 0.7386437908496732, 0.3290196078431373, 0.9433006535947712], "label": "a black chair"}], "image_id": "121506"}, "28": {"caption": "a photo of a red cat and a blue couch ", "segment": [{"bbox": [0.26124, 0.37751999999999997, 0.8292200000000001, 0.8539200000000001], "label": "a red cat"}, {"bbox": [0.0, 0.0, 1.0, 0.9870399999999999], "label": "a blue couch"}], "image_id": "76522"}, "29": {"caption": "a photo of a yellow laptop and a white bed ", "segment": [{"bbox": [0.22753125000000002, 0.013479166666666665, 1.0, 0.9887708333333334], "label": "a yellow laptop"}, {"bbox": [0.0, 0.0641875, 1.0, 0.9853541666666668], "label": "a white bed"}], "image_id": "477474"}, "30": {"caption": "a photo of a red bus and a green bus ", "segment": [{"bbox": [0.695234375, 0.40499999999999997, 0.8375, 0.6409669811320754], "label": "a red bus"}, {"bbox": [0.41340625, 0.4744575471698113, 0.5449531249999999, 0.6141509433962263], "label": "a green bus"}], "image_id": "15338"}, "31": {"caption": "a photo of a red toilet and a red sink ", "segment": [{"bbox": [0.20720833333333333, 0.6047343749999999, 0.5915833333333332, 0.9358124999999999], "label": "a red toilet"}, {"bbox": [0.5536875, 0.650375, 0.8711249999999999, 0.8393593750000001], "label": "a red sink"}], "image_id": "29449"}, "32": {"caption": "a photo of a yellow cat and a brown chair and a brown backpack ", "segment": [{"bbox": [0.00484375, 0.2144375, 0.863140625, 0.8545208333333334], "label": "a yellow cat"}, {"bbox": [0.8241875000000001, 0.03160416666666667, 1.0, 0.8552500000000001], "label": "a brown chair"}, {"bbox": [0.2839375, 0.0, 0.5355000000000001, 0.25495833333333334], "label": "a brown backpack"}], "image_id": "367468"}, "33": {"caption": "a photo of a black potted plant and a black chair and a green dining table and a white chair ", "segment": [{"bbox": [0.1572083333333333, 0.158734375, 0.36583333333333334, 0.3310625], "label": "a black potted plant"}, {"bbox": [0.6890416666666667, 0.485671875, 1.0, 0.9196718749999999], "label": "a black chair"}, {"bbox": [0.5817708333333333, 0.503390625, 0.7747083333333333, 0.688390625], "label": "a green dining table"}, {"bbox": [0.27770833333333333, 0.43470312499999997, 0.5671458333333333, 0.725625], "label": "a white chair"}], "image_id": "223671"}, "34": {"caption": "a photo of a white book and a white backpack and a white laptop and a blue book ", "segment": [{"bbox": [0.77190625, 0.13764583333333333, 0.9303437499999999, 0.37135416666666665], "label": "a white book"}, {"bbox": [0.003359375, 0.30866666666666664, 0.42545312499999993, 0.9902916666666667], "label": "a white backpack"}, {"bbox": [0.4453125, 0.5742291666666667, 0.76953125, 0.8737083333333333], "label": "a white laptop"}, {"bbox": [0.77834375, 0.5497291666666667, 0.9491093749999999, 0.8635], "label": "a blue book"}], "image_id": "39663"}, "35": {"caption": "a photo of a blue hot dog and a yellow hot dog and a blue dining table ", "segment": [{"bbox": [0.020359375, 0.3435211267605634, 0.911515625, 0.9882394366197184], "label": "a blue hot dog"}, {"bbox": [0.35709375, 0.11779342723004695, 0.914640625, 0.5342723004694836], "label": "a yellow hot dog"}, {"bbox": [0.0, 0.0, 1.0, 1.0], "label": "a blue dining table"}], "image_id": "226130"}, "36": {"caption": "a photo of a black fork and a red knife and a red pizza ", "segment": [{"bbox": [0.097453125, 0.0, 0.339453125, 0.18966666666666668], "label": "a black fork"}, {"bbox": [0.0, 0.10433333333333333, 0.20223437500000002, 0.24804166666666666], "label": "a red knife"}, {"bbox": [0.0471875, 0.0539375, 0.92696875, 0.9865208333333333], "label": "a red pizza"}], "image_id": "357229"}, "37": {"caption": "a photo of a blue horse and a brown horse ", "segment": [{"bbox": [0.47015624999999994, 0.33483588621444205, 0.9980781249999999, 0.9887746170678338], "label": "a blue horse"}, {"bbox": [0.003203125, 0.03527352297592998, 0.48459375, 0.9858205689277899], "label": "a brown horse"}], "image_id": "380142"}, "38": {"caption": "a photo of a black chair and a red dining table and a yellow chair ", "segment": [{"bbox": [0.134625, 0.42526970954356846, 0.34115625, 0.8165975103734441], "label": "a black chair"}, {"bbox": [0.1464375, 0.350103734439834, 0.51534375, 0.7073236514522822], "label": "a red dining table"}, {"bbox": [0.411703125, 0.2731327800829876, 0.607125, 0.5772821576763485], "label": "a yellow chair"}], "image_id": "260974"}, "39": {"caption": "a photo of a black frisbee and a yellow backpack ", "segment": [{"bbox": [0.267125, 0.07602352941176471, 1.0, 0.9884], "label": "a black frisbee"}, {"bbox": [0.0015, 0.006752941176470588, 0.583484375, 0.9887529411764706], "label": "a yellow backpack"}], "image_id": "63399"}, "40": {"caption": "a photo of a red car and a white bus ", "segment": [{"bbox": [0.8547429906542056, 0.443296875, 1.0, 0.628015625], "label": "a red car"}, {"bbox": [0.39988317757009345, 0.37715624999999997, 0.7459813084112149, 0.568171875], "label": "a white bus"}], "image_id": "330408"}, "41": {"caption": "a photo of a green cow and a green cow ", "segment": [{"bbox": [0.259171875, 0.173125, 0.66078125, 0.9344166666666667], "label": "a green cow"}, {"bbox": [0.646765625, 0.3000625, 1.0, 0.8926041666666668], "label": "a green cow"}], "image_id": "509750"}, "42": {"caption": "a photo of a green tv and a black laptop and a black keyboard ", "segment": [{"bbox": [0.32646875, 0.06822916666666666, 0.6441250000000001, 0.44], "label": "a green tv"}, {"bbox": [0.6151718749999999, 0.10525000000000001, 0.958984375, 0.5299583333333334], "label": "a black laptop"}, {"bbox": [0.35729687499999996, 0.6876458333333333, 0.9353906249999999, 0.8584166666666666], "label": "a black keyboard"}], "image_id": "63740"}, "43": {"caption": "a photo of a green oven and a red bowl and a red spoon and a green carrot and a blue carrot and a brown carrot ", "segment": [{"bbox": [0.0, 0.0, 1.0, 1.0], "label": "a green oven"}, {"bbox": [0.1155, 0.0029742388758782204, 0.930453125, 0.9492974238875878], "label": "a red bowl"}, {"bbox": [0.003, 0.5595550351288057, 0.49026562500000004, 0.7820140515222482], "label": "a red spoon"}, {"bbox": [0.60765625, 0.318384074941452, 0.84653125, 0.5931381733021077], "label": "a green carrot"}, {"bbox": [0.518546875, 0.7167447306791569, 0.7397812500000001, 0.9473302107728337], "label": "a blue carrot"}, {"bbox": [0.6797187499999999, 0.5613583138173301, 0.8273906249999999, 0.7621545667447307], "label": "a brown carrot"}], "image_id": "209755"}, "44": {"caption": "a photo of a white bowl and a red bowl and a yellow bowl and a green carrot and a green carrot and a green carrot ", "segment": [{"bbox": [0.014374999999999999, 0.4380616740088106, 0.50646875, 0.9898678414096915], "label": "a white bowl"}, {"bbox": [0.059687500000000004, 0.0017841409691629958, 0.529890625, 0.47004405286343615], "label": "a red bowl"}, {"bbox": [0.547140625, 0.04259911894273128, 0.9908906250000001, 0.5313876651982379], "label": "a yellow bowl"}, {"bbox": [0.545125, 0.6048017621145374, 0.9234375, 0.9984801762114536], "label": "a green carrot"}, {"bbox": [0.714375, 0.7971806167400881, 0.8892187500000001, 1.0], "label": "a green carrot"}, {"bbox": [0.655625, 0.8499779735682819, 0.8141875000000001, 1.0], "label": "a green carrot"}], "image_id": "94103"}, "45": {"caption": "a photo of a white truck and a blue car and a red skateboard and a green car and a brown car and a white car ", "segment": [{"bbox": [0.30422319474835885, 0.402734375, 0.7549890590809627, 0.6288750000000001], "label": "a white truck"}, {"bbox": [0.5310722100656455, 0.433015625, 0.9985995623632385, 0.62246875], "label": "a blue car"}, {"bbox": [0.374507658643326, 0.555625, 0.7269584245076587, 0.76909375], "label": "a red skateboard"}, {"bbox": [0.05652078774617068, 0.46771874999999996, 0.3673741794310722, 0.647078125], "label": "a green car"}, {"bbox": [0.0, 0.520015625, 0.2151203501094092, 0.65165625], "label": "a brown car"}, {"bbox": [0.8633260393873086, 0.466296875, 0.9992560175054706, 0.5982968750000001], "label": "a white car"}], "image_id": "551957"}, "46": {"caption": "a photo of a green vase and a red potted plant and a blue teddy bear ", "segment": [{"bbox": [0.596059405940594, 0.8067343749999999, 0.8043366336633664, 0.9755781249999999], "label": "a green vase"}, {"bbox": [0.4818415841584159, 0.24089062499999997, 0.9966930693069308, 0.9830781249999999], "label": "a red potted plant"}, {"bbox": [0.01316831683168317, 0.02078125, 0.6912673267326732, 0.8233749999999999], "label": "a blue teddy bear"}], "image_id": "565683"}, "47": {"caption": "a photo of a red bowl and a green dining table ", "segment": [{"bbox": [0.037359375, 0.04023529411764706, 0.969109375, 0.9256470588235294], "label": "a red bowl"}, {"bbox": [0.0, 0.0, 1.0, 1.0], "label": "a green dining table"}], "image_id": "412036"}, "48": {"caption": "a photo of a yellow zebra and a green zebra ", "segment": [{"bbox": [0.4715625, 0.0022500000000000003, 1.0, 0.9008999999999999], "label": "a yellow zebra"}, {"bbox": [0.289328125, 0.01085, 0.808984375, 0.903], "label": "a green zebra"}], "image_id": "299654"}, "49": {"caption": "a photo of a brown giraffe and a blue giraffe and a green giraffe ", "segment": [{"bbox": [0.5084857142857143, 0.7279800000000001, 0.7290571428571428, 0.9435399999999999], "label": "a brown giraffe"}, {"bbox": [0.6726571428571428, 0.7195199999999999, 0.8782, 0.9452200000000001], "label": "a blue giraffe"}, {"bbox": [0.24771428571428572, 0.63036, 0.38877142857142855, 0.98232], "label": "a green giraffe"}], "image_id": "80974"}, "50": {"caption": "a photo of a brown car and a yellow bus ", "segment": [{"bbox": [0.206703125, 0.544, 0.359765625, 0.702375], "label": "a brown car"}, {"bbox": [0.316859375, 0.2494375, 0.6960625, 0.7595416666666667], "label": "a yellow bus"}], "image_id": "84170"}, "51": {"caption": "a photo of a red bird and a blue bird ", "segment": [{"bbox": [0.457625, 0.23835294117647057, 0.634625, 0.43430588235294115], "label": "a red bird"}, {"bbox": [0.458859375, 0.663435294117647, 0.63265625, 0.9036235294117646], "label": "a blue bird"}], "image_id": "325688"}, "52": {"caption": "a photo of a green bicycle and a yellow bench ", "segment": [{"bbox": [0.05798, 0.18495548961424332, 0.832, 0.937626112759644], "label": "a green bicycle"}, {"bbox": [0.5801000000000001, 0.368160237388724, 0.9739000000000001, 0.7187240356083086], "label": "a yellow bench"}], "image_id": "251124"}, "53": {"caption": "a photo of a black elephant and a yellow elephant ", "segment": [{"bbox": [0.0, 0.25561032863849764, 0.735765625, 0.9842957746478873], "label": "a black elephant"}, {"bbox": [0.485359375, 0.2877699530516432, 1.0, 0.9856807511737089], "label": "a yellow elephant"}], "image_id": "88250"}, "54": {"caption": "a photo of a red potted plant and a yellow train and a green potted plant and a black potted plant ", "segment": [{"bbox": [0.34778125000000004, 0.5964166666666666, 0.62353125, 0.8610416666666666], "label": "a red potted plant"}, {"bbox": [0.0, 0.03820833333333333, 1.0, 0.5101041666666667], "label": "a yellow train"}, {"bbox": [0.0386875, 0.5941875, 0.32628124999999997, 0.8866041666666666], "label": "a green potted plant"}, {"bbox": [0.637328125, 0.4139375, 0.9183749999999999, 0.8673125], "label": "a black potted plant"}], "image_id": "426175"}, "55": {"caption": "a photo of a yellow refrigerator and a red bottle ", "segment": [{"bbox": [0.0029791666666666664, 0.002234375, 1.0, 1.0], "label": "a yellow refrigerator"}, {"bbox": [0.0625, 0.51875, 0.9979166666666667, 0.9609375], "label": "a red bottle"}], "image_id": "256337"}, "56": {"caption": "a photo of a black cat and a yellow sink and a black bottle ", "segment": [{"bbox": [0.140578125, 0.3231239669421488, 0.761953125, 0.8533057851239669], "label": "a black cat"}, {"bbox": [0.031859375, 0.0022479338842975208, 0.911328125, 0.9775206611570247], "label": "a yellow sink"}, {"bbox": [0.83059375, 0.3700495867768595, 1.0, 0.574694214876033], "label": "a black bottle"}], "image_id": "39828"}, "57": {"caption": "a photo of a brown cup and a blue scissors and a brown book and a black teddy bear and a brown teddy bear ", "segment": [{"bbox": [0.82024, 0.2972368421052632, 1.0, 0.7160526315789474], "label": "a brown cup"}, {"bbox": [0.40134, 0.44494736842105265, 0.8419800000000001, 0.6898947368421053], "label": "a blue scissors"}, {"bbox": [0.26254, 0.056710526315789475, 0.43232000000000004, 0.4047631578947368], "label": "a brown book"}, {"bbox": [0.304, 0.8155789473684211, 0.5172, 0.9584473684210527], "label": "a black teddy bear"}, {"bbox": [0.7219800000000001, 0.854421052631579, 0.8794200000000001, 0.9997368421052631], "label": "a brown teddy bear"}], "image_id": "499957"}, "58": {"caption": "a photo of a green dog and a white sheep ", "segment": [{"bbox": [0.5562968749999999, 0.198734375, 1.0, 0.7935625], "label": "a green dog"}, {"bbox": [0.010734375, 0.0, 0.581546875, 0.7038593750000001], "label": "a white sheep"}], "image_id": "178761"}, "59": {"caption": "a photo of a yellow broccoli and a red broccoli ", "segment": [{"bbox": [0.480375, 0.5733957845433255, 0.62165625, 0.825152224824356], "label": "a yellow broccoli"}, {"bbox": [0.10092187500000001, 0.19348946135831382, 0.951171875, 1.0], "label": "a red broccoli"}], "image_id": "99647"}, "60": {"caption": "a photo of a red horse and a black horse ", "segment": [{"bbox": [0.379984375, 0.5059807073954984, 0.57925, 0.970289389067524], "label": "a red horse"}, {"bbox": [0.34353125, 0.5438263665594855, 0.503328125, 0.9398070739549839], "label": "a black horse"}], "image_id": "398726"}, "61": {"caption": "a photo of a white dog and a black bench ", "segment": [{"bbox": [0.419515625, 0.18145833333333333, 0.87978125, 0.9963541666666667], "label": "a white dog"}, {"bbox": [0.0063437499999999996, 0.0030833333333333333, 1.0, 0.9875416666666668], "label": "a black bench"}], "image_id": "391139"}, "62": {"caption": "a photo of a white train and a brown train ", "segment": [{"bbox": [0.0017500000000000003, 0.35985849056603775, 0.546078125, 0.5515801886792453], "label": "a white train"}, {"bbox": [0.5329843750000001, 0.45617924528301884, 1.0, 0.6202358490566038], "label": "a brown train"}], "image_id": "505933"}, "63": {"caption": "a photo of a white bed and a white tv ", "segment": [{"bbox": [0.006736526946107785, 0.5662999999999999, 0.5483532934131736, 0.9572999999999999], "label": "a white bed"}, {"bbox": [0.6930538922155688, 0.37560000000000004, 0.8324251497005987, 0.50324], "label": "a white tv"}], "image_id": "450488"}, "64": {"caption": "a photo of a red cat and a blue chair and a blue cup ", "segment": [{"bbox": [0.0050625, 0.4202291666666667, 0.9016875000000001, 0.9955], "label": "a red cat"}, {"bbox": [0.401296875, 0.0883125, 0.81428125, 0.46493750000000006], "label": "a blue chair"}, {"bbox": [0.4581875, 0.24383333333333335, 0.764125, 1.0], "label": "a blue cup"}], "image_id": "249599"}, "65": {"caption": "a photo of a green dog and a red couch and a yellow couch and a yellow book and a blue chair ", "segment": [{"bbox": [0.46272, 0.33344, 0.59048, 0.51712], "label": "a green dog"}, {"bbox": [0.19326, 0.28213333333333335, 0.8555, 0.8196000000000001], "label": "a red couch"}, {"bbox": [0.55186, 0.6828266666666667, 0.94984, 1.0], "label": "a yellow couch"}, {"bbox": [0.8460599999999999, 0.4764, 1.0, 0.6404533333333334], "label": "a yellow book"}, {"bbox": [0.5879, 0.6888000000000001, 0.92774, 0.98568], "label": "a blue chair"}], "image_id": "392642"}, "66": {"caption": "a photo of a white truck and a brown car and a red chair ", "segment": [{"bbox": [0.0, 0.0, 1.0, 1.0], "label": "a white truck"}, {"bbox": [0.01946, 0.017987987987987987, 0.26489999999999997, 0.25618618618618616], "label": "a brown car"}, {"bbox": [0.44630000000000003, 0.31948948948948946, 0.7767200000000001, 0.787027027027027], "label": "a red chair"}], "image_id": "402903"}, "67": {"caption": "a photo of a brown handbag and a black handbag and a white backpack and a black tv ", "segment": [{"bbox": [0.7655437665782494, 0.48916000000000004, 0.9094429708222812, 0.62874], "label": "a brown handbag"}, {"bbox": [0.7196021220159152, 0.30344, 0.8594960212201592, 0.4772], "label": "a black handbag"}, {"bbox": [0.8347214854111406, 0.3093, 1.0, 0.50994], "label": "a white backpack"}, {"bbox": [0.0, 0.43622000000000005, 0.17172413793103447, 0.8172], "label": "a black tv"}], "image_id": "150830"}, "68": {"caption": "a photo of a brown train and a green train ", "segment": [{"bbox": [0.395171875, 0.2735416666666667, 1.0, 0.7982083333333333], "label": "a brown train"}, {"bbox": [0.082578125, 0.305625, 0.42809375000000005, 0.8584166666666666], "label": "a green train"}], "image_id": "410951"}, "69": {"caption": "a photo of a white bus and a black bench and a blue car ", "segment": [{"bbox": [0.12134375, 0.301125, 0.640453125, 0.8], "label": "a white bus"}, {"bbox": [0.70134375, 0.6039375, 0.9037656250000001, 0.7721458333333333], "label": "a black bench"}, {"bbox": [0.0, 0.48954166666666665, 0.12740625, 0.7118749999999999], "label": "a blue car"}], "image_id": "4988"}, "70": {"caption": "a photo of a brown bicycle and a green cat ", "segment": [{"bbox": [0.40278125, 0.48409836065573775, 0.68503125, 0.7780093676814989], "label": "a brown bicycle"}, {"bbox": [0.799640625, 0.3144964871194379, 0.9981562499999999, 0.710327868852459], "label": "a green cat"}], "image_id": "28714"}, "71": {"caption": "a photo of a white airplane and a white airplane ", "segment": [{"bbox": [0.042046875, 0.3744375, 0.8744375, 0.6883333333333332], "label": "a white airplane"}, {"bbox": [0.12290625, 0.3370625, 0.6428437499999999, 0.530875], "label": "a white airplane"}], "image_id": "400507"}, "72": {"caption": "a photo of a brown fire hydrant and a yellow car and a green truck ", "segment": [{"bbox": [0.41685937500000003, 0.5621041666666666, 0.5675156250000001, 0.9304166666666667], "label": "a brown fire hydrant"}, {"bbox": [0.608484375, 0.4740625, 0.9976406250000001, 0.8773541666666667], "label": "a yellow car"}, {"bbox": [0.48703124999999997, 0.12839583333333335, 0.9925937499999999, 0.36543749999999997], "label": "a green truck"}], "image_id": "516372"}, "73": {"caption": "a photo of a blue spoon and a brown bowl and a black carrot ", "segment": [{"bbox": [0.49779687499999997, 0.09758782201405153, 0.999046875, 0.473231850117096], "label": "a blue spoon"}, {"bbox": [0.0, 0.0, 1.0, 0.9818266978922717], "label": "a brown bowl"}, {"bbox": [0.0, 0.20374707259953162, 0.9328125, 0.7962529274004684], "label": "a black carrot"}], "image_id": "436467"}, "74": {"caption": "a photo of a yellow zebra and a red zebra and a white zebra and a blue zebra ", "segment": [{"bbox": [0.352453125, 0.4358177570093458, 0.7485781250000001, 0.8344626168224298], "label": "a yellow zebra"}, {"bbox": [0.665640625, 0.46521028037383183, 0.97028125, 0.7956308411214953], "label": "a red zebra"}, {"bbox": [0.1681875, 0.4385046728971963, 0.48510937500000006, 0.8392757009345795], "label": "a white zebra"}, {"bbox": [0.05946875, 0.45974299065420565, 0.372140625, 0.8500233644859813], "label": "a blue zebra"}], "image_id": "463787"}, "75": {"caption": "a photo of a green wine glass and a yellow laptop and a brown laptop ", "segment": [{"bbox": [0.1779460580912863, 0.724421875, 0.3627385892116182, 0.939765625], "label": "a green wine glass"}, {"bbox": [0.4050207468879668, 0.466703125, 0.9924896265560166, 1.0], "label": "a yellow laptop"}, {"bbox": [0.38224066390041495, 0.372671875, 0.8242323651452281, 0.74375], "label": "a brown laptop"}], "image_id": "272630"}, "76": {"caption": "a photo of a red elephant and a red elephant ", "segment": [{"bbox": [0.26351562500000003, 0.3547291666666667, 0.802359375, 0.7939166666666667], "label": "a red elephant"}, {"bbox": [0.06925, 0.34460416666666666, 0.34290624999999997, 0.7004583333333334], "label": "a red elephant"}], "image_id": "411043"}, "77": {"caption": "a photo of a blue train and a red train ", "segment": [{"bbox": [0.0026093749999999997, 0.27147916666666666, 0.7528125, 0.8433333333333334], "label": "a blue train"}, {"bbox": [0.678234375, 0.37697916666666664, 1.0, 0.5403333333333333], "label": "a red train"}], "image_id": "519673"}, "78": {"caption": "a photo of a blue bottle and a green bottle and a red bottle and a black cup and a green carrot ", "segment": [{"bbox": [0.38589333333333337, 0.0016200000000000001, 0.7170666666666666, 0.42062], "label": "a blue bottle"}, {"bbox": [0.0, 0.00132, 0.20306666666666667, 0.22028], "label": "a green bottle"}, {"bbox": [0.8419466666666667, 0.00862, 1.0, 0.21120000000000003], "label": "a red bottle"}, {"bbox": [0.6731733333333333, 0.1286, 0.9692, 0.48305999999999993], "label": "a black cup"}, {"bbox": [0.2869066666666667, 0.4244, 0.6020533333333333, 0.61402], "label": "a green carrot"}], "image_id": "247333"}, "79": {"caption": "a photo of a yellow cat and a brown bottle and a brown sink ", "segment": [{"bbox": [0.3258125, 0.23441666666666666, 0.7774218749999999, 0.8301041666666666], "label": "a yellow cat"}, {"bbox": [0.72096875, 0.012895833333333334, 0.85484375, 0.30108333333333337], "label": "a brown bottle"}, {"bbox": [0.163484375, 0.0, 1.0, 0.9730416666666667], "label": "a brown sink"}], "image_id": "501523"}, "80": {"caption": "a photo of a green sandwich and a yellow dining table and a white cup ", "segment": [{"bbox": [0.21742187500000001, 0.17623831775700935, 0.7647187499999999, 0.7659112149532711], "label": "a green sandwich"}, {"bbox": [0.0015, 0.2308411214953271, 1.0, 1.0], "label": "a yellow dining table"}, {"bbox": [0.5334375, 0.049205607476635514, 0.7602187499999999, 0.3384579439252336], "label": "a white cup"}], "image_id": "354527"}, "81": {"caption": "a photo of a black chair and a red chair and a blue dining table and a brown refrigerator ", "segment": [{"bbox": [0.09938730853391685, 0.44946875000000003, 0.5300656455142232, 0.98709375], "label": "a black chair"}, {"bbox": [0.5103501094091903, 0.41070312500000006, 0.7837636761487965, 0.812], "label": "a red chair"}, {"bbox": [0.03286652078774617, 0.4779375, 0.9040481400437637, 0.982625], "label": "a blue dining table"}, {"bbox": [0.037592997811816194, 0.226265625, 0.34461706783369805, 0.5663125], "label": "a brown refrigerator"}], "image_id": "186980"}, "82": {"caption": "a photo of a black bus and a yellow train ", "segment": [{"bbox": [0.074953125, 0.5936458333333333, 0.5244843749999999, 0.8127708333333333], "label": "a black bus"}, {"bbox": [0.0033750000000000004, 0.06572916666666667, 0.7045000000000001, 0.4612291666666667], "label": "a yellow train"}], "image_id": "381463"}, "83": {"caption": "a photo of a brown banana and a green orange and a brown apple and a blue apple and a black apple ", "segment": [{"bbox": [0.0, 0.31998000000000004, 0.9117417417417418, 0.9768600000000001], "label": "a brown banana"}, {"bbox": [0.0106006006006006, 0.0047, 0.6041441441441442, 0.42588], "label": "a green orange"}, {"bbox": [0.27666666666666667, 0.3573, 0.9852552552552554, 0.80898], "label": "a brown apple"}, {"bbox": [0.5036936936936937, 0.060899999999999996, 0.9203303303303304, 0.38865999999999995], "label": "a blue apple"}, {"bbox": [0.8742342342342343, 0.15396, 1.0, 0.54686], "label": "a black apple"}], "image_id": "56714"}, "84": {"caption": "a photo of a blue refrigerator and a white chair and a black chair and a black dining table and a white bottle ", "segment": [{"bbox": [0.8747187500000001, 0.26516666666666666, 1.0, 0.907875], "label": "a blue refrigerator"}, {"bbox": [0.18434375, 0.6968541666666667, 0.393734375, 1.0], "label": "a white chair"}, {"bbox": [0.52284375, 0.7559791666666666, 0.6588437500000001, 1.0], "label": "a black chair"}, {"bbox": [0.37815625, 0.6635208333333333, 0.6810937499999999, 0.99575], "label": "a black dining table"}, {"bbox": [0.0328125, 0.30416666666666664, 0.2296875, 0.61875], "label": "a white bottle"}], "image_id": "283816"}, "85": {"caption": "a photo of a brown cat and a yellow book and a green bed and a brown vase ", "segment": [{"bbox": [0.050109375, 0.24460416666666665, 0.26509375, 0.39547916666666666], "label": "a brown cat"}, {"bbox": [0.690875, 0.6880624999999999, 1.0, 0.9763541666666666], "label": "a yellow book"}, {"bbox": [0.0, 0.0, 0.527921875, 0.5896041666666666], "label": "a green bed"}, {"bbox": [0.6777031250000001, 0.15097916666666666, 0.81096875, 0.35685416666666664], "label": "a brown vase"}], "image_id": "43851"}, "86": {"caption": "a photo of a green airplane and a white airplane and a brown airplane and a brown airplane ", "segment": [{"bbox": [0.745796875, 0.4256807511737089, 0.999015625, 0.5882629107981221], "label": "a green airplane"}, {"bbox": [0.0, 0.2898826291079812, 0.2004375, 0.6000000000000001], "label": "a white airplane"}, {"bbox": [0.103859375, 0.3596713615023474, 0.838484375, 0.49983568075117374], "label": "a brown airplane"}, {"bbox": [0.10184375000000001, 0.33274647887323944, 0.76071875, 0.5906807511737089], "label": "a brown airplane"}], "image_id": "265584"}, "87": {"caption": "a photo of a black tv and a brown couch and a brown couch and a brown couch ", "segment": [{"bbox": [0.00138, 0.3542942942942943, 0.17576, 0.7563663663663663], "label": "a black tv"}, {"bbox": [0.17334, 0.4548048048048048, 0.43944000000000005, 0.7649249249249248], "label": "a brown couch"}, {"bbox": [0.39218000000000003, 0.38564564564564563, 0.84284, 0.6511711711711711], "label": "a brown couch"}, {"bbox": [0.84608, 0.6738138138138138, 1.0, 0.993123123123123], "label": "a brown couch"}], "image_id": "348083"}, "88": {"caption": "a photo of a white dog and a brown sheep and a red sheep and a white sheep and a red sheep ", "segment": [{"bbox": [0.088015625, 0.5788165680473373, 0.35925, 0.9351479289940828], "label": "a white dog"}, {"bbox": [0.232328125, 0.14076923076923076, 0.589328125, 0.6815384615384615], "label": "a brown sheep"}, {"bbox": [0.5722343750000001, 0.08798816568047337, 0.7644843750000001, 0.28071005917159764], "label": "a red sheep"}, {"bbox": [0.568921875, 0.0527810650887574, 0.8817187499999999, 0.5270414201183432], "label": "a white sheep"}, {"bbox": [0.499625, 0.21142011834319524, 0.76715625, 0.6579289940828402], "label": "a red sheep"}], "image_id": "62875"}, "89": {"caption": "a photo of a green bowl and a brown broccoli and a brown broccoli and a red broccoli and a yellow orange ", "segment": [{"bbox": [0.00303125, 0.27828703703703705, 1.0, 0.9883796296296297], "label": "a green bowl"}, {"bbox": [0.19628125000000002, 0.0017824074074074075, 0.45159374999999996, 0.3563888888888889], "label": "a brown broccoli"}, {"bbox": [0.193765625, 0.34118055555555554, 0.47329687500000006, 0.564699074074074], "label": "a brown broccoli"}, {"bbox": [0.077359375, 0.1363888888888889, 0.27303125, 0.5476388888888889], "label": "a red broccoli"}, {"bbox": [0.5628124999999999, 0.0, 0.9140937499999999, 0.48800925925925925], "label": "a yellow orange"}], "image_id": "47648"}, "90": {"caption": "a photo of a red teddy bear and a brown bed and a black bed ", "segment": [{"bbox": [0.170125, 0.0584235294117647, 0.756578125, 0.950564705882353], "label": "a red teddy bear"}, {"bbox": [0.0, 0.015623529411764705, 0.36834375, 0.9869882352941176], "label": "a brown bed"}, {"bbox": [0.22767187500000002, 0.0025882352941176473, 1.0, 0.9818117647058825], "label": "a black bed"}], "image_id": "436603"}, "91": {"caption": "a photo of a yellow dog and a black frisbee ", "segment": [{"bbox": [0.003, 0.20370526315789475, 0.59225, 0.9855157894736842], "label": "a yellow dog"}, {"bbox": [0.354375, 0.6250105263157895, 0.6719843750000001, 0.9290526315789472], "label": "a black frisbee"}], "image_id": "403421"}, "92": {"caption": "a photo of a blue horse and a white horse ", "segment": [{"bbox": [0.671640625, 0.7014018691588785, 0.8348593750000001, 0.8892990654205608], "label": "a blue horse"}, {"bbox": [0.5510937499999999, 0.7154906542056075, 0.6989375, 0.8666355140186917], "label": "a white horse"}], "image_id": "78499"}, "93": {"caption": "a photo of a red giraffe and a green giraffe ", "segment": [{"bbox": [0.114625, 0.3451869158878505, 0.374203125, 0.9110747663551402], "label": "a red giraffe"}, {"bbox": [0.63328125, 0.4783177570093458, 0.78528125, 0.7611448598130841], "label": "a green giraffe"}], "image_id": "474471"}, "94": {"caption": "a photo of a red stop sign and a blue car ", "segment": [{"bbox": [0.039359375, 0.027166666666666665, 0.24901562500000002, 0.307875], "label": "a red stop sign"}, {"bbox": [0.672875, 0.6468541666666667, 1.0, 0.9989166666666667], "label": "a blue car"}], "image_id": "181518"}, "95": {"caption": "a photo of a yellow sports ball and a black clock ", "segment": [{"bbox": [0.7387254901960785, 0.8177614379084968, 0.8803104575163399, 0.9593464052287581], "label": "a yellow sports ball"}, {"bbox": [0.15534313725490195, 0.03222222222222222, 0.7620098039215686, 0.9864215686274511], "label": "a black clock"}], "image_id": "99927"}, "96": {"caption": "a photo of a red truck and a white truck and a blue truck and a yellow truck ", "segment": [{"bbox": [0.6783496732026143, 0.09117647058823529, 0.9683660130718954, 0.7549836601307189], "label": "a red truck"}, {"bbox": [0.040539215686274506, 0.041666666666666664, 0.3265686274509804, 0.956078431372549], "label": "a white truck"}, {"bbox": [0.3011274509803921, 0.296781045751634, 0.5303431372549019, 0.6608169934640522], "label": "a blue truck"}, {"bbox": [0.5416176470588235, 0.4254575163398693, 0.7023202614379086, 0.6164869281045751], "label": "a yellow truck"}], "image_id": "192620"}, "97": {"caption": "a photo of a red bicycle and a yellow bicycle and a yellow couch and a black dining table ", "segment": [{"bbox": [0.22639583333333332, 0.585921875, 0.46025000000000005, 0.724265625], "label": "a red bicycle"}, {"bbox": [0.23016666666666669, 0.17685937499999999, 0.3922916666666667, 0.43001562500000007], "label": "a yellow bicycle"}, {"bbox": [0.22222916666666667, 0.6575, 0.978625, 0.954375], "label": "a yellow couch"}, {"bbox": [0.4291875, 0.84509375, 1.0, 1.0], "label": "a black dining table"}], "image_id": "416733"}, "98": {"caption": "a photo of a black dog and a red dog ", "segment": [{"bbox": [0.291, 0.04690391459074733, 0.5912200000000001, 0.6592170818505338], "label": "a black dog"}, {"bbox": [0.5129400000000001, 0.15288256227758007, 0.8389800000000001, 0.6886120996441281], "label": "a red dog"}], "image_id": "89880"}, "99": {"caption": "a photo of a black giraffe and a yellow giraffe ", "segment": [{"bbox": [0.08964, 0.38509333333333334, 0.44514, 0.8869600000000001], "label": "a black giraffe"}, {"bbox": [0.55164, 0.38589333333333337, 0.9285599999999999, 0.8142400000000001], "label": "a yellow giraffe"}], "image_id": "578238"}, "100": {"caption": "a photo of a brown traffic light and a blue traffic light ", "segment": [{"bbox": [0.4932214765100671, 0.4471875, 0.6790604026845637, 0.7213392857142856], "label": "a brown traffic light"}, {"bbox": [0.308758389261745, 0.43968749999999995, 0.49211409395973155, 0.7266071428571428], "label": "a blue traffic light"}], "image_id": "457558"}, "101": {"caption": "a photo of a yellow car and a black car ", "segment": [{"bbox": [0.7828999999999999, 0.40402666666666665, 0.9768600000000001, 0.6051733333333333], "label": "a yellow car"}, {"bbox": [0.00035999999999999997, 0.40232, 0.1955, 0.54296], "label": "a black car"}], "image_id": "547202"}, "102": {"caption": "a photo of a brown broccoli and a green broccoli and a green broccoli and a red carrot ", "segment": [{"bbox": [0.389703125, 0.07929245283018867, 0.765375, 0.5757547169811321], "label": "a brown broccoli"}, {"bbox": [0.8568906249999999, 0.1340330188679245, 1.0, 0.6152594339622641], "label": "a green broccoli"}, {"bbox": [0.54259375, 0.0, 0.78390625, 0.2561792452830189], "label": "a green broccoli"}, {"bbox": [0.08715625, 0.20485849056603772, 0.2700625, 0.45089622641509436], "label": "a red carrot"}], "image_id": "335733"}, "103": {"caption": "a photo of a yellow tv and a red tv ", "segment": [{"bbox": [0.21967187500000002, 0.30591666666666667, 0.49948437500000004, 0.5994791666666667], "label": "a yellow tv"}, {"bbox": [0.47740625000000003, 0.31964583333333335, 0.7484531249999999, 0.6050625000000001], "label": "a red tv"}], "image_id": "472678"}, "104": {"caption": "a photo of a white cow and a brown cow and a brown cow and a brown cow ", "segment": [{"bbox": [0.47181249999999997, 0.4460573476702509, 0.9890000000000001, 0.9008602150537635], "label": "a white cow"}, {"bbox": [0.5221875, 0.23225806451612901, 0.9243749999999998, 0.6473118279569893], "label": "a brown cow"}, {"bbox": [0.5866875, 0.15035842293906812, 0.8572968750000001, 0.4073835125448029], "label": "a brown cow"}, {"bbox": [0.645875, 0.10164874551971326, 0.845875, 0.2527956989247312], "label": "a brown cow"}], "image_id": "405547"}, "105": {"caption": "a photo of a white couch and a brown couch and a green dining table and a green bowl and a green chair ", "segment": [{"bbox": [0.18075000000000002, 0.5915962441314554, 0.638375, 0.9859859154929577], "label": "a white couch"}, {"bbox": [0.71440625, 0.6109859154929577, 0.9984375, 0.9773708920187794], "label": "a brown couch"}, {"bbox": [0.035453125, 0.7015258215962442, 0.377171875, 0.9860328638497653], "label": "a green dining table"}, {"bbox": [0.1795, 0.6577464788732394, 0.314109375, 0.8105399061032863], "label": "a green bowl"}, {"bbox": [0.7081875, 0.6626291079812205, 0.9995312500000001, 0.9996478873239436], "label": "a green chair"}], "image_id": "369185"}, "106": {"caption": "a photo of a black car and a yellow traffic light ", "segment": [{"bbox": [0.5005468750000001, 0.7103958333333333, 0.640125, 0.8410208333333333], "label": "a black car"}, {"bbox": [0.1015625, 0.49375, 0.99375, 0.7104166666666667], "label": "a yellow traffic light"}], "image_id": "578848"}, "107": {"caption": "a photo of a blue cat and a red cat and a red bowl ", "segment": [{"bbox": [0.308078125, 0.4539252336448598, 0.62065625, 0.9865186915887851], "label": "a blue cat"}, {"bbox": [0.5058906249999999, 0.25429906542056074, 0.962765625, 0.7370794392523365], "label": "a red cat"}, {"bbox": [0.269484375, 0.6035747663551402, 0.433015625, 0.7342990654205607], "label": "a red bowl"}], "image_id": "379869"}, "108": {"caption": "a photo of a brown elephant and a brown elephant ", "segment": [{"bbox": [0.244390625, 0.08988290398126464, 0.766140625, 0.9707962529274003], "label": "a brown elephant"}, {"bbox": [0.7076718750000001, 0.011381733021077284, 1.0, 0.966440281030445], "label": "a brown elephant"}], "image_id": "514979"}, "109": {"caption": "a photo of a red cat and a blue bottle ", "segment": [{"bbox": [0.0, 0.08372365339578454, 0.442890625, 0.9873536299765808], "label": "a red cat"}, {"bbox": [0.73878125, 0.198711943793911, 0.93921875, 0.8832552693208431], "label": "a blue bottle"}], "image_id": "519094"}, "110": {"caption": "a photo of a red book and a green chair ", "segment": [{"bbox": [0.79, 0.083140625, 0.9959389671361504, 0.38651562500000003], "label": "a red book"}, {"bbox": [0.007793427230046948, 0.7116875, 0.9911502347417841, 1.0], "label": "a green chair"}], "image_id": "154230"}, "111": {"caption": "a photo of a red dog and a blue tv and a white chair ", "segment": [{"bbox": [0.4390625, 0.41425, 0.750015625, 0.9827708333333334], "label": "a red dog"}, {"bbox": [0.11460937499999999, 0.0050625, 0.642140625, 0.4342708333333334], "label": "a blue tv"}, {"bbox": [0.67903125, 0.26666666666666666, 1.0, 0.9591458333333333], "label": "a white chair"}], "image_id": "326937"}, "112": {"caption": "a photo of a white carrot and a blue knife and a red carrot and a yellow spoon and a black carrot and a blue carrot ", "segment": [{"bbox": [0.22825, 0.44447306791569086, 0.5609531249999999, 1.0], "label": "a white carrot"}, {"bbox": [0.597703125, 0.5002107728337236, 1.0, 0.822903981264637], "label": "a blue knife"}, {"bbox": [0.324953125, 0.5011709601873536, 0.5886875, 0.9858782201405153], "label": "a red carrot"}, {"bbox": [0.594796875, 0.49829039812646375, 0.933546875, 0.7063934426229508], "label": "a yellow spoon"}, {"bbox": [0.315546875, 0.6541217798594848, 0.519625, 0.9882435597189696], "label": "a black carrot"}, {"bbox": [0.167578125, 0.6492974238875878, 0.311671875, 1.0], "label": "a blue carrot"}], "image_id": "555387"}, "113": {"caption": "a photo of a blue boat and a red truck ", "segment": [{"bbox": [0.01940625, 0.38839999999999997, 0.49990625, 0.6288470588235294], "label": "a blue boat"}, {"bbox": [0.46110937500000004, 0.3528, 0.9520781250000001, 0.6741647058823529], "label": "a red truck"}], "image_id": "496845"}, "114": {"caption": "a photo of a brown bed and a white bed ", "segment": [{"bbox": [0.1713125, 0.11871495327102805, 0.725859375, 0.9861448598130841], "label": "a brown bed"}, {"bbox": [0.544296875, 0.0447196261682243, 1.0, 0.6792523364485981], "label": "a white bed"}], "image_id": "197859"}, "115": {"caption": "a photo of a brown dog and a blue keyboard and a red book ", "segment": [{"bbox": [0.0030210772833723656, 0.22362500000000002, 0.7539344262295082, 0.8735312499999999], "label": "a brown dog"}, {"bbox": [0.7544730679156909, 0.18651562500000002, 0.9969789227166277, 1.0], "label": "a blue keyboard"}, {"bbox": [0.4100234192037471, 0.105515625, 0.691264637002342, 0.254578125], "label": "a red book"}], "image_id": "179690"}, "116": {"caption": "a photo of a yellow surfboard and a black bicycle ", "segment": [{"bbox": [0.2345, 0.40306000000000003, 0.66522, 0.82556], "label": "a yellow surfboard"}, {"bbox": [0.14158, 0.36460000000000004, 0.3618, 0.75562], "label": "a black bicycle"}], "image_id": "164115"}, "117": {"caption": "a photo of a white potted plant and a blue chair and a yellow chair and a green dining table and a brown vase ", "segment": [{"bbox": [0.163484375, 0.16785416666666667, 0.9033749999999999, 0.9835833333333334], "label": "a white potted plant"}, {"bbox": [0.0, 0.3114166666666666, 0.23015625, 0.935875], "label": "a blue chair"}, {"bbox": [0.577046875, 0.44072916666666667, 0.777484375, 0.6972083333333334], "label": "a yellow chair"}, {"bbox": [0.059859375000000006, 0.6187708333333333, 0.8908437500000002, 0.9896666666666666], "label": "a green dining table"}, {"bbox": [0.39278124999999997, 0.5904583333333334, 0.5657656249999999, 0.9910833333333334], "label": "a brown vase"}], "image_id": "143526"}, "118": {"caption": "a photo of a red car and a yellow potted plant and a blue truck and a yellow stop sign ", "segment": [{"bbox": [0.011466666666666667, 0.44695999999999997, 0.19784, 0.5738399999999999], "label": "a red car"}, {"bbox": [0.05162666666666667, 0.62264, 0.22650666666666666, 0.7815599999999999], "label": "a yellow potted plant"}, {"bbox": [0.13314666666666666, 0.4562, 0.65632, 0.6781], "label": "a blue truck"}, {"bbox": [0.19429333333333335, 0.13012, 0.41642666666666667, 0.30838], "label": "a yellow stop sign"}], "image_id": "547435"}, "119": {"caption": "a photo of a blue vase and a blue book ", "segment": [{"bbox": [0.338, 0.5291940298507463, 0.53886, 0.8743283582089552], "label": "a blue vase"}, {"bbox": [0.6265, 0.39435820895522394, 0.91364, 0.8541194029850746], "label": "a blue book"}], "image_id": "49473"}, "120": {"caption": "a photo of a yellow zebra and a brown zebra and a yellow zebra and a black zebra ", "segment": [{"bbox": [0.14952000000000001, 0.43799401197604787, 0.5140800000000001, 0.8178443113772454], "label": "a yellow zebra"}, {"bbox": [0.59374, 0.3448802395209581, 0.8686, 0.7195808383233533], "label": "a brown zebra"}, {"bbox": [0.41431999999999997, 0.34763473053892213, 0.6199600000000001, 0.7431437125748502], "label": "a yellow zebra"}, {"bbox": [0.11331999999999999, 0.3962574850299401, 0.37754000000000004, 0.7655688622754491], "label": "a black zebra"}], "image_id": "69106"}, "121": {"caption": "a photo of a yellow pizza and a blue dining table ", "segment": [{"bbox": [0.0, 0.098875, 0.99775, 0.932578125], "label": "a yellow pizza"}, {"bbox": [0.0, 0.022468750000000003, 1.0, 0.986515625], "label": "a blue dining table"}], "image_id": "155714"}, "122": {"caption": "a photo of a red remote and a brown remote and a red remote and a red remote and a blue remote ", "segment": [{"bbox": [0.80636, 0.03371191135734072, 0.97836, 0.9415789473684211], "label": "a red remote"}, {"bbox": [0.41928, 0.07163434903047092, 0.6345799999999999, 0.9079501385041552], "label": "a brown remote"}, {"bbox": [0.62466, 0.1349861495844875, 0.8128599999999999, 0.8248753462603879], "label": "a red remote"}, {"bbox": [0.01688, 0.01623268698060942, 0.20066, 0.9331301939058172], "label": "a red remote"}, {"bbox": [0.19366, 0.006509695290858726, 0.42116, 0.9804709141274239], "label": "a blue remote"}], "image_id": "32416"}, "123": {"caption": "a photo of a green cell phone and a white cell phone ", "segment": [{"bbox": [0.458421875, 0.266734375, 0.7887656249999999, 0.558859375], "label": "a green cell phone"}, {"bbox": [0.34009375, 0.44820312500000004, 0.608109375, 0.702703125], "label": "a white cell phone"}], "image_id": "430380"}, "124": {"caption": "a photo of a brown airplane and a white car and a white truck and a white truck ", "segment": [{"bbox": [0.2895625, 0.005971896955503512, 0.998546875, 0.14913348946135832], "label": "a brown airplane"}, {"bbox": [0.144, 0.5744964871194379, 0.44954687500000007, 0.7825058548009367], "label": "a white car"}, {"bbox": [0.44387499999999996, 0.6519203747072599, 0.81546875, 0.7827166276346604], "label": "a white truck"}, {"bbox": [0.142234375, 0.5616393442622951, 0.442578125, 0.77711943793911], "label": "a white truck"}], "image_id": "457054"}, "125": {"caption": "a photo of a black toilet and a white toilet ", "segment": [{"bbox": [0.0, 0.64674, 0.2528, 0.9890399999999999], "label": "a black toilet"}, {"bbox": [0.0, 0.49888, 0.1955, 0.6539400000000001], "label": "a white toilet"}], "image_id": "1803"}, "126": {"caption": "a photo of a brown mouse and a white keyboard ", "segment": [{"bbox": [0.434890625, 0.0, 1.0, 0.7752924791086351], "label": "a brown mouse"}, {"bbox": [0.001453125, 0.0028969359331476323, 1.0, 0.9692200557103066], "label": "a white keyboard"}], "image_id": "9721"}, "127": {"caption": "a photo of a blue pizza and a red pizza and a green pizza and a brown pizza ", "segment": [{"bbox": [0.08506276150627615, 0.251765625, 0.9986610878661089, 0.85646875], "label": "a blue pizza"}, {"bbox": [0.5076778242677824, 0.002328125, 1.0, 0.439765625], "label": "a red pizza"}, {"bbox": [0.0042050209205020915, 0.142703125, 0.4759832635983263, 0.504046875], "label": "a green pizza"}, {"bbox": [0.0034728033472803347, 0.0, 0.3919665271966527, 0.138859375], "label": "a brown pizza"}], "image_id": "84493"}, "128": {"caption": "a photo of a white cat and a brown bird ", "segment": [{"bbox": [0.12165625, 0.027957244655581946, 0.83746875, 0.8301187648456057], "label": "a white cat"}, {"bbox": [0.230734375, 0.7987173396674584, 0.3738125, 0.9679097387173397], "label": "a brown bird"}], "image_id": "227218"}, "129": {"caption": "a photo of a red sink and a black sink ", "segment": [{"bbox": [0.6152031250000001, 0.6175409836065574, 0.93996875, 0.9429742388758782], "label": "a red sink"}, {"bbox": [0.24521874999999999, 0.8025058548009368, 0.4520156249999999, 0.9549882903981265], "label": "a black sink"}], "image_id": "251062"}, "130": {"caption": "a photo of a green cat and a brown sink ", "segment": [{"bbox": [0.2275, 0.144171875, 1.0, 0.9735468749999999], "label": "a green cat"}, {"bbox": [0.0, 0.79215625, 1.0, 1.0], "label": "a brown sink"}], "image_id": "457768"}, "131": {"caption": "a photo of a brown refrigerator and a yellow chair ", "segment": [{"bbox": [0.2323, 0.3138235294117647, 0.50744, 0.7268449197860963], "label": "a brown refrigerator"}, {"bbox": [0.12896000000000002, 0.824144385026738, 0.40532000000000007, 0.9891711229946525], "label": "a yellow chair"}], "image_id": "453755"}, "132": {"caption": "a photo of a brown car and a blue bicycle and a green bicycle ", "segment": [{"bbox": [0.09577777777777777, 0.668109375, 0.6513333333333333, 0.8599062499999999], "label": "a brown car"}, {"bbox": [0.6054444444444445, 0.8439687499999999, 0.9219166666666666, 0.9991249999999999], "label": "a blue bicycle"}, {"bbox": [0.2514166666666667, 0.813484375, 0.7685000000000001, 1.0], "label": "a green bicycle"}], "image_id": "147793"}, "133": {"caption": "a photo of a brown train and a white train ", "segment": [{"bbox": [0.522953125, 0.499875, 0.93046875, 0.6638541666666666], "label": "a brown train"}, {"bbox": [0.0037031250000000003, 0.0, 0.624078125, 0.8691458333333333], "label": "a white train"}], "image_id": "185903"}, "134": {"caption": "a photo of a red couch and a brown couch and a green bed and a red chair ", "segment": [{"bbox": [0.0013281249999999999, 0.48674999999999996, 0.3415, 0.8855625], "label": "a red couch"}, {"bbox": [0.0, 0.8532291666666667, 0.178640625, 0.9905625], "label": "a brown couch"}, {"bbox": [0.36228125, 0.3401666666666667, 0.7445468749999999, 0.6627916666666667], "label": "a green bed"}, {"bbox": [0.780578125, 0.5566875, 0.9764531249999999, 0.6844374999999999], "label": "a red chair"}], "image_id": "205089"}, "135": {"caption": "a photo of a black bottle and a red dining table ", "segment": [{"bbox": [0.18637499999999999, 0.00609375, 0.7942708333333334, 0.8663124999999999], "label": "a black bottle"}, {"bbox": [0.0, 0.0025937499999999997, 1.0, 0.987015625], "label": "a red dining table"}], "image_id": "352794"}, "136": {"caption": "a photo of a brown bicycle and a brown bicycle and a brown bicycle and a red bicycle and a yellow bicycle ", "segment": [{"bbox": [0.23159375, 0.49412500000000004, 0.37542187499999996, 0.7600208333333334], "label": "a brown bicycle"}, {"bbox": [0.10893749999999999, 0.6004583333333334, 0.2685, 0.8015625], "label": "a brown bicycle"}, {"bbox": [0.7817968750000001, 0.5107708333333333, 0.9212031250000001, 0.6365416666666666], "label": "a brown bicycle"}, {"bbox": [0.83475, 0.43704166666666666, 0.97171875, 0.5906458333333333], "label": "a red bicycle"}, {"bbox": [0.0, 0.5254375, 0.333625, 0.9989375], "label": "a yellow bicycle"}], "image_id": "241466"}, "137": {"caption": "a photo of a yellow bowl and a yellow carrot and a black apple and a black apple and a green sandwich and a white sandwich ", "segment": [{"bbox": [0.592796875, 0.4515625, 0.9184843749999999, 0.9400833333333334], "label": "a yellow bowl"}, {"bbox": [0.23943750000000003, 0.467375, 0.46478125000000003, 0.9532916666666668], "label": "a yellow carrot"}, {"bbox": [0.5845, 0.24647916666666667, 0.8327500000000001, 0.4835625], "label": "a black apple"}, {"bbox": [0.593046875, 0.034541666666666665, 0.8187656249999999, 0.2727083333333333], "label": "a black apple"}, {"bbox": [0.11665624999999999, 0.8009583333333333, 0.32665625, 0.9578541666666667], "label": "a green sandwich"}, {"bbox": [0.13479687499999998, 0.6791874999999999, 0.267109375, 0.8258958333333334], "label": "a white sandwich"}], "image_id": "54092"}, "138": {"caption": "a photo of a yellow airplane and a green truck ", "segment": [{"bbox": [0.16471875, 0.2859414225941423, 0.6057812499999999, 0.4855439330543933], "label": "a yellow airplane"}, {"bbox": [0.57228125, 0.1454602510460251, 0.96609375, 0.6285774058577407], "label": "a green truck"}], "image_id": "109900"}, "139": {"caption": "a photo of a brown tv and a white mouse and a green keyboard ", "segment": [{"bbox": [0.0, 0.00021021021021021022, 0.53198, 0.40471471471471465], "label": "a brown tv"}, {"bbox": [0.6595, 0.10663663663663663, 0.9309, 0.25819819819819817], "label": "a white mouse"}, {"bbox": [0.0011200000000000001, 0.1887987987987988, 1.0, 0.9991291291291291], "label": "a green keyboard"}], "image_id": "366723"}, "140": {"caption": "a photo of a green umbrella and a yellow car and a white car ", "segment": [{"bbox": [0.379125, 0.33355971896955505, 0.570171875, 0.5170023419203746], "label": "a green umbrella"}, {"bbox": [0.8188124999999999, 0.29988290398126466, 1.0, 0.8483372365339579], "label": "a yellow car"}, {"bbox": [0.69371875, 0.29, 0.8991093750000001, 0.6644262295081966], "label": "a white car"}], "image_id": "575243"}, "141": {"caption": "a photo of a red orange and a black potted plant and a yellow potted plant ", "segment": [{"bbox": [0.10991666666666666, 0.091140625, 0.9143541666666667, 0.5487656249999999], "label": "a red orange"}, {"bbox": [0.6005, 0.0, 0.8594583333333333, 0.1575625], "label": "a black potted plant"}, {"bbox": [0.23318750000000002, 0.0044843750000000005, 0.49924999999999997, 0.139015625], "label": "a yellow potted plant"}], "image_id": "367689"}, "142": {"caption": "a photo of a white car and a red bus and a yellow bus and a red truck and a blue bus ", "segment": [{"bbox": [0.018125, 0.4306041666666667, 0.16995312499999998, 0.5884166666666667], "label": "a white car"}, {"bbox": [0.389390625, 0.3498958333333333, 0.60778125, 0.5981875], "label": "a red bus"}, {"bbox": [0.606734375, 0.342125, 0.87303125, 0.5780833333333334], "label": "a yellow bus"}, {"bbox": [0.72471875, 0.26066666666666666, 0.9977499999999999, 0.494375], "label": "a red truck"}, {"bbox": [0.1851875, 0.35802083333333334, 0.368515625, 0.5950624999999999], "label": "a blue bus"}], "image_id": "171464"}, "143": {"caption": "a photo of a red bed and a brown bed ", "segment": [{"bbox": [0.50238, 0.10548, 0.7358199999999999, 0.25039999999999996], "label": "a red bed"}, {"bbox": [0.11304, 0.86856, 0.25178, 1.0], "label": "a brown bed"}], "image_id": "542959"}, "144": {"caption": "a photo of a red spoon and a blue cake and a blue dining table ", "segment": [{"bbox": [0.5807187500000001, 0.2065625, 0.9496249999999999, 0.6859791666666666], "label": "a red spoon"}, {"bbox": [0.318546875, 0.058416666666666665, 0.788765625, 0.6584166666666668], "label": "a blue cake"}, {"bbox": [0.0033750000000000004, 0.0028125000000000003, 1.0, 0.9915833333333334], "label": "a blue dining table"}], "image_id": "98003"}, "145": {"caption": "a photo of a yellow bird and a blue clock ", "segment": [{"bbox": [0.4770443349753694, 0.384265625, 0.6919376026272578, 0.57078125], "label": "a yellow bird"}, {"bbox": [0.19111658456486041, 0.10846875, 0.7738587848932676, 0.928109375], "label": "a blue clock"}], "image_id": "240082"}, "146": {"caption": "a photo of a blue giraffe and a black giraffe ", "segment": [{"bbox": [0.6533, 0.2400301204819277, 0.95434, 0.9394578313253011], "label": "a blue giraffe"}, {"bbox": [0.14768, 0.29659638554216866, 0.44458, 0.8636144578313254], "label": "a black giraffe"}], "image_id": "531607"}, "147": {"caption": "a photo of a green giraffe and a brown giraffe and a blue giraffe and a blue giraffe and a yellow giraffe ", "segment": [{"bbox": [0.8398021978021978, 0.19836842105263156, 0.965076923076923, 0.7784210526315788], "label": "a green giraffe"}, {"bbox": [0.7329670329670329, 0.18352631578947368, 0.8624395604395604, 0.6475263157894737], "label": "a brown giraffe"}, {"bbox": [0.24065934065934066, 0.15789473684210525, 0.3791208791208791, 0.7657894736842106], "label": "a blue giraffe"}, {"bbox": [0.09235164835164836, 0.3753157894736842, 0.23232967032967033, 0.7466315789473685], "label": "a blue giraffe"}, {"bbox": [0.5709450549450549, 0.23126315789473684, 0.7167912087912087, 0.723157894736842], "label": "a yellow giraffe"}], "image_id": "521285"}, "148": {"caption": "a photo of a brown car and a black motorcycle and a green refrigerator ", "segment": [{"bbox": [0.0007968750000000001, 0.6124375000000001, 0.39954687499999997, 0.857375], "label": "a brown car"}, {"bbox": [0.606046875, 0.6138333333333333, 0.9354375000000001, 0.9425], "label": "a black motorcycle"}, {"bbox": [0.652046875, 0.5125208333333333, 0.778703125, 0.725375], "label": "a green refrigerator"}], "image_id": "208991"}, "149": {"caption": "a photo of a blue zebra and a red zebra and a red zebra ", "segment": [{"bbox": [0.133453125, 0.14302083333333335, 0.6266875000000001, 1.0], "label": "a blue zebra"}, {"bbox": [0.0016875000000000002, 0.23645833333333333, 0.321671875, 0.9249375000000001], "label": "a red zebra"}, {"bbox": [0.3539375, 0.06741666666666667, 0.9286562500000001, 0.8898958333333334], "label": "a red zebra"}], "image_id": "1228"}, "150": {"caption": "a photo of a green bed and a white chair ", "segment": [{"bbox": [0.0, 0.39612499999999995, 0.708125, 1.0], "label": "a green bed"}, {"bbox": [0.483109375, 0.38175000000000003, 0.636828125, 0.625], "label": "a white chair"}], "image_id": "208688"}, "151": {"caption": "a photo of a red bus and a yellow bus ", "segment": [{"bbox": [0.43559931506849314, 0.15852657004830917, 0.7741780821917809, 0.5790579710144927], "label": "a red bus"}, {"bbox": [0.20549657534246576, 0.13219806763285025, 0.3552568493150685, 0.37714975845410625], "label": "a yellow bus"}], "image_id": "242034"}, "152": {"caption": "a photo of a green zebra and a white zebra and a blue zebra ", "segment": [{"bbox": [0.42906, 0.17456, 0.8631800000000001, 0.7758933333333333], "label": "a green zebra"}, {"bbox": [0.24156, 0.35472000000000004, 0.5118199999999999, 0.9876], "label": "a white zebra"}, {"bbox": [0.21230000000000002, 0.2730933333333333, 0.42966000000000004, 0.5324533333333333], "label": "a blue zebra"}], "image_id": "356368"}, "153": {"caption": "a photo of a black chair and a white dining table and a black dining table ", "segment": [{"bbox": [0.326484375, 0.8236666666666667, 0.45978125, 1.0], "label": "a black chair"}, {"bbox": [0.7429375, 0.5623541666666667, 0.954703125, 0.8164791666666668], "label": "a white dining table"}, {"bbox": [0.225390625, 0.5974166666666666, 0.660625, 0.9834166666666666], "label": "a black dining table"}], "image_id": "147545"}, "154": {"caption": "a photo of a green elephant and a green elephant ", "segment": [{"bbox": [0.455875, 0.4263333333333333, 0.600484375, 0.5879166666666666], "label": "a green elephant"}, {"bbox": [0.391015625, 0.38795833333333335, 0.57340625, 0.5887291666666667], "label": "a green elephant"}], "image_id": "474170"}, "155": {"caption": "a photo of a yellow toothbrush and a blue dining table ", "segment": [{"bbox": [0.053593749999999996, 0.8285377358490567, 1.0, 0.9813443396226416], "label": "a yellow toothbrush"}, {"bbox": [0.007484375, 0.003938679245283018, 0.9989843749999998, 0.9858962264150944], "label": "a blue dining table"}], "image_id": "476172"}, "156": {"caption": "a photo of a green umbrella and a brown handbag and a red handbag and a brown backpack ", "segment": [{"bbox": [0.25960937500000003, 0.266875, 0.414953125, 0.5756875], "label": "a green umbrella"}, {"bbox": [0.7398906249999999, 0.11872916666666668, 0.9471874999999998, 0.39962500000000006], "label": "a brown handbag"}, {"bbox": [0.8327656250000001, 0.3074375, 0.9763437500000001, 0.6047291666666667], "label": "a red handbag"}, {"bbox": [0.001953125, 0.19220833333333334, 0.24740625, 0.9662291666666666], "label": "a brown backpack"}], "image_id": "193498"}, "157": {"caption": "a photo of a white teddy bear and a red teddy bear and a red chair ", "segment": [{"bbox": [0.24621875000000001, 0.015741176470588238, 0.8580625, 0.9865176470588235], "label": "a white teddy bear"}, {"bbox": [0.371578125, 0.4022588235294118, 0.7521093750000001, 0.9887529411764706], "label": "a red teddy bear"}, {"bbox": [0.0, 0.0, 0.385, 1.0], "label": "a red chair"}], "image_id": "575867"}, "158": {"caption": "a photo of a brown car and a brown train and a yellow train and a green train ", "segment": [{"bbox": [0.45482812499999997, 0.7790690690690691, 0.64221875, 0.9394294294294294], "label": "a brown car"}, {"bbox": [0.062859375, 0.32684684684684684, 0.854390625, 0.8033333333333333], "label": "a brown train"}, {"bbox": [0.564640625, 0.3744444444444444, 0.912296875, 0.7690690690690691], "label": "a yellow train"}, {"bbox": [0.48998437499999997, 0.31165165165165165, 0.9239687499999999, 0.7018018018018017], "label": "a green train"}], "image_id": "137822"}, "159": {"caption": "a photo of a brown broccoli and a red fork and a red knife ", "segment": [{"bbox": [0.38471875, 0.6712708333333333, 0.58959375, 0.9297708333333332], "label": "a brown broccoli"}, {"bbox": [0.487015625, 0.11125, 0.9565000000000001, 0.5424166666666667], "label": "a red fork"}, {"bbox": [0.703203125, 0.027770833333333335, 0.870671875, 0.8072499999999999], "label": "a red knife"}], "image_id": "561889"}, "160": {"caption": "a photo of a black sheep and a yellow sheep ", "segment": [{"bbox": [0.5880156249999999, 0.41631250000000003, 0.9087500000000001, 0.971375], "label": "a black sheep"}, {"bbox": [0.32440625, 0.18445833333333334, 0.74678125, 0.6919583333333333], "label": "a yellow sheep"}], "image_id": "427643"}, "161": {"caption": "a photo of a red banana and a blue banana and a green banana and a red orange and a red bowl and a red orange ", "segment": [{"bbox": [0.4933646616541354, 0.24376562499999999, 0.7468045112781956, 0.6538906250000001], "label": "a red banana"}, {"bbox": [0.22257518796992481, 0.0470625, 0.422593984962406, 0.342140625], "label": "a blue banana"}, {"bbox": [0.17172932330827068, 0.23128125000000002, 0.4233834586466166, 0.44215625000000003], "label": "a green banana"}, {"bbox": [0.3511278195488722, 0.23378125, 0.5745488721804511, 0.402625], "label": "a red orange"}, {"bbox": [0.12928571428571428, 0.032828125, 0.8115789473684211, 0.64478125], "label": "a red bowl"}, {"bbox": [0.48080827067669174, 0.113625, 0.6892669172932331, 0.27925], "label": "a red orange"}], "image_id": "484651"}, "162": {"caption": "a photo of a yellow pizza and a white oven ", "segment": [{"bbox": [0.168546875, 0.16629166666666664, 0.8207812499999999, 0.9146041666666667], "label": "a yellow pizza"}, {"bbox": [0.001953125, 0.0, 1.0, 0.9865833333333334], "label": "a white oven"}], "image_id": "67065"}, "163": {"caption": "a photo of a white tv and a red cat and a black keyboard ", "segment": [{"bbox": [0.047843750000000004, 0.0, 0.82715625, 0.7097708333333334], "label": "a white tv"}, {"bbox": [0.206453125, 0.034416666666666665, 0.9919374999999999, 0.9871041666666667], "label": "a red cat"}, {"bbox": [0.0033750000000000004, 0.8337083333333334, 0.456734375, 0.9887708333333334], "label": "a black keyboard"}], "image_id": "142890"}, "164": {"caption": "a photo of a black car and a brown motorcycle and a blue truck ", "segment": [{"bbox": [0.094171875, 0.1695, 0.47421875, 0.5080625], "label": "a black car"}, {"bbox": [0.3055625, 0.0049375, 1.0, 0.9876458333333333], "label": "a brown motorcycle"}, {"bbox": [0.076328125, 0.169625, 0.22949999999999998, 0.31054166666666666], "label": "a blue truck"}], "image_id": "491213"}, "165": {"caption": "a photo of a green fork and a yellow bowl and a black dining table ", "segment": [{"bbox": [0.5879583333333334, 0.571328125, 0.9989791666666666, 0.7849999999999999], "label": "a green fork"}, {"bbox": [0.499625, 0.004765625, 0.9749375, 0.3115], "label": "a yellow bowl"}, {"bbox": [0.006, 0.0045, 1.0, 0.9887656249999999], "label": "a black dining table"}], "image_id": "19723"}, "166": {"caption": "a photo of a green sheep and a yellow sheep and a red sheep and a blue sheep and a brown sheep and a green sheep ", "segment": [{"bbox": [0.693546875, 0.32258333333333333, 0.8612968750000001, 0.9720416666666668], "label": "a green sheep"}, {"bbox": [0.0, 0.3299166666666667, 0.24784375, 0.6322916666666667], "label": "a yellow sheep"}, {"bbox": [0.42167187500000003, 0.32102083333333337, 0.59871875, 0.6321875000000001], "label": "a red sheep"}, {"bbox": [0.57096875, 0.31612500000000004, 0.69678125, 0.6387083333333334], "label": "a blue sheep"}, {"bbox": [0.012843750000000001, 0.46702083333333333, 0.2055625, 0.6704375], "label": "a brown sheep"}, {"bbox": [0.8049687499999999, 0.2265, 0.9420624999999999, 0.4667291666666667], "label": "a green sheep"}], "image_id": "71281"}, "167": {"caption": "a photo of a black car and a black truck and a black bus ", "segment": [{"bbox": [0.07506818181818183, 0.412546875, 0.997840909090909, 0.9845937499999999], "label": "a black car"}, {"bbox": [0.07934090909090909, 0.41039062499999995, 1.0, 0.9870156250000001], "label": "a black truck"}, {"bbox": [0.0, 0.251578125, 0.2253181818181818, 0.5653750000000001], "label": "a black bus"}], "image_id": "237324"}, "168": {"caption": "a photo of a blue pizza and a green pizza and a green pizza and a red pizza and a yellow pizza and a yellow pizza ", "segment": [{"bbox": [0.31904, 0.37751999999999997, 0.7478666666666667, 0.6239199999999999], "label": "a blue pizza"}, {"bbox": [0.0, 0.47266, 0.31944, 0.72526], "label": "a green pizza"}, {"bbox": [0.1828533333333333, 0.12132, 0.5741333333333333, 0.31314], "label": "a green pizza"}, {"bbox": [0.7364533333333334, 0.22496000000000002, 1.0, 0.43942000000000003], "label": "a red pizza"}, {"bbox": [0.5694666666666667, 0.06704, 0.9119200000000001, 0.21545999999999998], "label": "a yellow pizza"}, {"bbox": [0.0, 0.19712000000000002, 0.17874666666666666, 0.35194], "label": "a yellow pizza"}], "image_id": "271986"}, "169": {"caption": "a photo of a red sandwich and a blue sandwich and a black fork and a black dining table ", "segment": [{"bbox": [0.4173125, 0.17307692307692307, 0.778921875, 0.6132307692307692], "label": "a red sandwich"}, {"bbox": [0.175734375, 0.13483516483516483, 0.452125, 0.5168571428571428], "label": "a blue sandwich"}, {"bbox": [0.38821875, 0.5865274725274725, 0.960171875, 0.9033626373626373], "label": "a black fork"}, {"bbox": [0.005546875, 0.0032527472527472527, 1.0, 0.9876703296703297], "label": "a black dining table"}], "image_id": "256945"}, "170": {"caption": "a photo of a white spoon and a red banana and a yellow dining table and a black dining table ", "segment": [{"bbox": [0.32134375, 0.52965625, 0.7887656249999999, 0.985828125], "label": "a white spoon"}, {"bbox": [0.330265625, 0.17976562499999998, 1.0, 1.0], "label": "a red banana"}, {"bbox": [0.0, 0.0, 0.23098437500000002, 0.317546875], "label": "a yellow dining table"}, {"bbox": [0.0062656249999999995, 0.6376875, 0.19656250000000003, 0.9976406250000001], "label": "a black dining table"}], "image_id": "96327"}, "171": {"caption": "a photo of a yellow bowl and a green banana and a white apple and a blue chair and a brown microwave ", "segment": [{"bbox": [0.0033750000000000004, 0.04045833333333334, 1.0, 0.9865208333333334], "label": "a yellow bowl"}, {"bbox": [0.293265625, 0.21139583333333334, 0.9842656250000001, 0.9484583333333333], "label": "a green banana"}, {"bbox": [0.303890625, 0.470125, 0.5474062500000001, 0.7610416666666666], "label": "a white apple"}, {"bbox": [0.388046875, 0.0, 0.7800625, 0.28808333333333336], "label": "a blue chair"}, {"bbox": [0.822578125, 0.01825, 0.998234375, 0.2383125], "label": "a brown microwave"}], "image_id": "482719"}, "172": {"caption": "a photo of a red horse and a blue horse ", "segment": [{"bbox": [0.512015625, 0.0009624413145539906, 0.913640625, 0.9894131455399061], "label": "a red horse"}, {"bbox": [0.0, 0.0002112676056338028, 0.6000625, 0.9941784037558685], "label": "a blue horse"}], "image_id": "272518"}, "173": {"caption": "a photo of a blue couch and a brown refrigerator ", "segment": [{"bbox": [0.334953125, 0.5591314553990611, 0.9991562500000001, 0.9870892018779343], "label": "a blue couch"}, {"bbox": [0.644359375, 0.2882863849765258, 0.7732812499999999, 0.5611267605633803], "label": "a brown refrigerator"}], "image_id": "512223"}, "174": {"caption": "a photo of a blue sheep and a green sheep and a black sheep and a black sheep and a black sheep and a white sheep ", "segment": [{"bbox": [0.07954687499999999, 0.16988847583643124, 0.59115625, 0.987100371747212], "label": "a blue sheep"}, {"bbox": [0.5429999999999999, 0.19739776951672863, 0.832734375, 0.6713197026022305], "label": "a green sheep"}, {"bbox": [0.735546875, 0.5721933085501858, 1.0, 0.9859851301115242], "label": "a black sheep"}, {"bbox": [0.640046875, 0.1545910780669145, 0.9561093749999999, 0.36600371747211896], "label": "a black sheep"}, {"bbox": [0.775, 0.38007434944237917, 0.9835312500000001, 0.663717472118959], "label": "a black sheep"}, {"bbox": [0.6725, 0.08386617100371747, 0.9020937499999999, 0.22795539033457246], "label": "a white sheep"}], "image_id": "430856"}, "175": {"caption": "a photo of a green tv and a blue keyboard ", "segment": [{"bbox": [0.42484374999999996, 0.0022482435597189696, 0.8048124999999999, 0.726463700234192], "label": "a green tv"}, {"bbox": [0.26390625, 0.6413583138173302, 0.5174375, 0.7842857142857143], "label": "a blue keyboard"}], "image_id": "186282"}, "176": {"caption": "a photo of a green elephant and a black elephant ", "segment": [{"bbox": [0.7264062499999999, 0.07472916666666667, 1.0, 0.9893333333333333], "label": "a green elephant"}, {"bbox": [0.0, 0.021395833333333333, 0.8260156249999999, 0.989875], "label": "a black elephant"}], "image_id": "246931"}, "177": {"caption": "a photo of a blue dining table and a red bottle and a black cup and a white fork and a green spoon ", "segment": [{"bbox": [0.0, 0.007065462753950339, 0.998375, 0.9882392776523703], "label": "a blue dining table"}, {"bbox": [0.55375, 0.002257336343115124, 0.76840625, 0.41124153498871335], "label": "a red bottle"}, {"bbox": [0.371765625, 0.011241534988713319, 0.544421875, 0.42697516930022567], "label": "a black cup"}, {"bbox": [0.08882812500000001, 0.23318284424379232, 0.272453125, 0.45568848758465014], "label": "a white fork"}, {"bbox": [0.14434375, 0.21808126410835213, 0.325953125, 0.41266365688487583], "label": "a green spoon"}], "image_id": "353536"}, "178": {"caption": "a photo of a red tv and a blue couch and a blue couch ", "segment": [{"bbox": [0.66314, 0.06421333333333333, 0.8268399999999999, 0.36488], "label": "a red tv"}, {"bbox": [0.00122, 0.5333866666666667, 0.18336, 0.7592533333333334], "label": "a blue couch"}, {"bbox": [0.23063999999999998, 0.48733333333333334, 0.52282, 0.70136], "label": "a blue couch"}], "image_id": "292617"}, "179": {"caption": "a photo of a white umbrella and a brown dining table ", "segment": [{"bbox": [0.28171875, 0.05805620608899297, 0.55903125, 0.33761124121779856], "label": "a white umbrella"}, {"bbox": [0.16684375, 0.24002341920374706, 0.337015625, 0.45086651053864163], "label": "a brown dining table"}], "image_id": "408057"}, "180": {"caption": "a photo of a brown cup and a yellow vase and a green dining table ", "segment": [{"bbox": [0.67771875, 0.7539457202505219, 0.8127656250000002, 0.9504384133611691], "label": "a brown cup"}, {"bbox": [0.416171875, 0.4932776617954071, 0.595734375, 0.8834029227557411], "label": "a yellow vase"}, {"bbox": [0.007781250000000001, 0.7116910229645094, 1.0, 0.9870146137787056], "label": "a green dining table"}], "image_id": "264625"}, "181": {"caption": "a photo of a green potted plant and a brown vase ", "segment": [{"bbox": [0.098390625, 0.004291666666666667, 0.9032187500000001, 0.926875], "label": "a green potted plant"}, {"bbox": [0.616859375, 0.5219166666666667, 0.7735937500000001, 0.9331458333333332], "label": "a brown vase"}], "image_id": "577735"}, "182": {"caption": "a photo of a white pizza and a black pizza ", "segment": [{"bbox": [0.547453125, 0.3168544600938967, 0.9572968750000002, 0.7730281690140846], "label": "a white pizza"}, {"bbox": [0.134625, 0.3348356807511737, 0.49959375, 0.8494366197183099], "label": "a black pizza"}], "image_id": "249884"}, "183": {"caption": "a photo of a yellow bird and a black bear ", "segment": [{"bbox": [0.24084374999999997, 0.4512735849056604, 0.9221562500000001, 0.9474528301886793], "label": "a yellow bird"}, {"bbox": [0.22778125, 0.1704009433962264, 0.53, 0.5794103773584905], "label": "a black bear"}], "image_id": "572517"}, "184": {"caption": "a photo of a red laptop and a black cup and a brown cake ", "segment": [{"bbox": [0.23932812499999997, 0.0045000000000000005, 1.0, 0.9865208333333334], "label": "a red laptop"}, {"bbox": [0.187078125, 0.0022500000000000003, 0.3505625, 0.5101041666666667], "label": "a black cup"}, {"bbox": [0.01875, 0.524875, 0.152609375, 0.7347083333333333], "label": "a brown cake"}], "image_id": "518592"}, "185": {"caption": "a photo of a yellow dog and a white dog and a yellow car ", "segment": [{"bbox": [0.3258125, 0.4551990632318501, 0.576828125, 0.7862295081967213], "label": "a yellow dog"}, {"bbox": [0.754859375, 0.4839110070257611, 0.8996562499999999, 0.794192037470726], "label": "a white dog"}, {"bbox": [0.056515625, 0.10515222482435597, 0.8916718749999999, 0.7639812646370022], "label": "a yellow car"}], "image_id": "98194"}, "186": {"caption": "a photo of a black truck and a white truck ", "segment": [{"bbox": [0.0, 0.04494145199063232, 0.757140625, 0.8719203747072599], "label": "a black truck"}, {"bbox": [0.7689375, 0.4616393442622951, 0.926765625, 0.5992271662763466], "label": "a white truck"}], "image_id": "396851"}, "187": {"caption": "a photo of a black dining table and a red cake and a yellow cake and a blue cake ", "segment": [{"bbox": [0.005078125, 0.34029166666666666, 1.0, 0.9881458333333335], "label": "a black dining table"}, {"bbox": [0.619125, 0.36933333333333335, 0.8204687500000001, 0.5662083333333333], "label": "a red cake"}, {"bbox": [0.00840625, 0.7937291666666667, 0.139578125, 0.9417083333333333], "label": "a yellow cake"}, {"bbox": [0.0375, 0.4166666666666667, 0.6515625, 0.7729166666666667], "label": "a blue cake"}], "image_id": "318455"}, "188": {"caption": "a photo of a yellow toilet and a blue toilet and a blue sink ", "segment": [{"bbox": [0.70921875, 0.018583333333333334, 0.996734375, 0.5799791666666667], "label": "a yellow toilet"}, {"bbox": [0.0, 0.3595416666666667, 0.183703125, 0.9887708333333334], "label": "a blue toilet"}, {"bbox": [0.283734375, 0.0720625, 0.674390625, 0.4313541666666667], "label": "a blue sink"}], "image_id": "332532"}, "189": {"caption": "a photo of a white bed and a white teddy bear and a black teddy bear ", "segment": [{"bbox": [0.0, 0.004580498866213152, 1.0, 0.9995464852607708], "label": "a white bed"}, {"bbox": [0.009296875, 0.3370748299319728, 0.24775, 0.7910204081632654], "label": "a white teddy bear"}, {"bbox": [0.636421875, 0.08764172335600906, 0.9863593749999999, 0.7168480725623583], "label": "a black teddy bear"}], "image_id": "128813"}, "190": {"caption": "a photo of a green bowl and a brown cup and a yellow fork and a red spoon and a white cup and a yellow cup ", "segment": [{"bbox": [0.09214052287581699, 0.0022549019607843133, 0.5707843137254902, 0.3595424836601307], "label": "a green bowl"}, {"bbox": [0.6995588235294118, 0.2838562091503268, 0.9618790849673202, 0.5170424836601307], "label": "a brown cup"}, {"bbox": [0.002238562091503268, 0.47782679738562095, 0.18166666666666667, 0.7711928104575164], "label": "a yellow fork"}, {"bbox": [0.38563725490196077, 0.0008496732026143792, 0.6668464052287582, 0.1878921568627451], "label": "a red spoon"}, {"bbox": [0.026519607843137255, 0.0003104575163398693, 0.19106209150326797, 0.16161764705882353], "label": "a white cup"}, {"bbox": [0.4533333333333333, 0.02168300653594771, 0.6069117647058824, 0.15178104575163398], "label": "a yellow cup"}], "image_id": "321008"}, "191": {"caption": "a photo of a green car and a black car and a blue fire hydrant ", "segment": [{"bbox": [0.0005970149253731343, 0.30666000000000004, 0.2707462686567164, 0.43870000000000003], "label": "a green car"}, {"bbox": [0.2192537313432836, 0.2978, 0.841044776119403, 0.46218], "label": "a black car"}, {"bbox": [0.24525373134328357, 0.49272000000000005, 0.4971343283582089, 0.95172], "label": "a blue fire hydrant"}], "image_id": "293071"}, "192": {"caption": "a photo of a white sink and a blue donut ", "segment": [{"bbox": [0.242546875, 0.04663551401869159, 0.528421875, 0.20467289719626167], "label": "a white sink"}, {"bbox": [0.075, 0.2850467289719626, 0.525, 0.6892523364485982], "label": "a blue donut"}], "image_id": "329475"}, "193": {"caption": "a photo of a brown wine glass and a yellow wine glass and a blue cup and a blue bowl and a blue sandwich and a white apple ", "segment": [{"bbox": [0.268125, 0.005078125, 0.7579375, 0.457828125], "label": "a brown wine glass"}, {"bbox": [0.08689583333333334, 0.001875, 0.37752083333333336, 0.282765625], "label": "a yellow wine glass"}, {"bbox": [0.7071666666666666, 0.001, 0.9338541666666667, 0.18028125], "label": "a blue cup"}, {"bbox": [0.0021875, 0.11725000000000001, 0.3099791666666667, 0.244421875], "label": "a blue bowl"}, {"bbox": [0.006, 0.298875, 0.797, 0.865171875], "label": "a blue sandwich"}, {"bbox": [0.5229374999999999, 0.5216406250000001, 0.8935, 0.869703125], "label": "a white apple"}], "image_id": "360209"}, "194": {"caption": "a photo of a white giraffe and a red giraffe ", "segment": [{"bbox": [0.31732, 0.21517333333333333, 0.50698, 0.79784], "label": "a white giraffe"}, {"bbox": [0.42613999999999996, 0.37984, 0.63636, 0.8470133333333333], "label": "a red giraffe"}], "image_id": "422253"}, "195": {"caption": "a photo of a green tv and a red bed and a brown toilet ", "segment": [{"bbox": [0.44829687500000004, 0.44508196721311477, 0.59221875, 0.6765573770491803], "label": "a green tv"}, {"bbox": [0.6776875, 0.6900468384074941, 1.0, 0.9866744730679156], "label": "a red bed"}, {"bbox": [0.092375, 0.6277985948477751, 0.242328125, 0.8986651053864169], "label": "a brown toilet"}], "image_id": "72018"}, "196": {"caption": "a photo of a green car and a yellow car ", "segment": [{"bbox": [0.0016875000000000002, 0.7701041666666666, 0.187078125, 0.9835833333333334], "label": "a green car"}, {"bbox": [0.35164062500000004, 0.7535416666666667, 0.6569375, 1.0], "label": "a yellow car"}], "image_id": "1532"}, "197": {"caption": "a photo of a green cat and a blue sink ", "segment": [{"bbox": [0.34804, 0.3612912912912913, 0.6731600000000001, 0.9354954954954955], "label": "a green cat"}, {"bbox": [0.13456, 0.428918918918919, 0.8996400000000001, 1.0], "label": "a blue sink"}], "image_id": "325356"}, "198": {"caption": "a photo of a yellow potted plant and a black potted plant and a green dining table ", "segment": [{"bbox": [0.5794859813084112, 0.657421875, 0.8144859813084113, 0.81459375], "label": "a yellow potted plant"}, {"bbox": [0.758481308411215, 0.5445, 0.9292289719626168, 0.685046875], "label": "a black potted plant"}, {"bbox": [0.291518691588785, 0.57840625, 0.5932943925233645, 0.736375], "label": "a green dining table"}], "image_id": "52368"}, "199": {"caption": "a photo of a red cow and a green cow ", "segment": [{"bbox": [0.408921875, 0.5867447306791569, 0.555265625, 0.9716861826697891], "label": "a red cow"}, {"bbox": [0.5836875, 0.49053864168618266, 0.9515625, 1.0], "label": "a green cow"}], "image_id": "535950"}, "200": {"caption": "a photo of a yellow giraffe and a black giraffe and a black giraffe and a white giraffe and a black giraffe and a yellow giraffe ", "segment": [{"bbox": [0.5031041666666667, 0.37321875000000004, 0.7499166666666668, 0.9800156250000001], "label": "a yellow giraffe"}, {"bbox": [0.4080625, 0.44515625, 0.7857916666666667, 0.90140625], "label": "a black giraffe"}, {"bbox": [0.533625, 0.39715625, 0.834375, 0.9288437500000001], "label": "a black giraffe"}, {"bbox": [0.10691666666666667, 0.4968125, 0.33029166666666665, 0.8066875], "label": "a white giraffe"}, {"bbox": [0.7400833333333333, 0.49214062500000005, 1.0, 0.9528125], "label": "a black giraffe"}, {"bbox": [0.4075, 0.37303125000000004, 0.6112291666666666, 0.898875], "label": "a yellow giraffe"}], "image_id": "296816"}, "201": {"caption": "a photo of a yellow cat and a brown suitcase and a green book ", "segment": [{"bbox": [0.30162, 0.15698666666666666, 0.9903200000000001, 0.7526933333333333], "label": "a yellow cat"}, {"bbox": [0.0, 0.00021333333333333333, 1.0, 0.9890399999999999], "label": "a brown suitcase"}, {"bbox": [0.40758, 0.08861333333333332, 0.55004, 0.26016], "label": "a green book"}], "image_id": "224861"}, "202": {"caption": "a photo of a blue sheep and a black sheep and a blue sheep and a green sheep and a brown dog and a green sheep ", "segment": [{"bbox": [0.324484375, 0.5420287253141832, 0.78965625, 0.8135727109515261], "label": "a blue sheep"}, {"bbox": [0.0062656249999999995, 0.2454398563734291, 0.33184375, 0.5547935368043088], "label": "a black sheep"}, {"bbox": [0.18717187500000002, 0.2636445242369838, 0.473125, 0.5697307001795333], "label": "a blue sheep"}, {"bbox": [0.40971875, 0.22138240574506285, 0.6228125, 0.5093895870736086], "label": "a green sheep"}, {"bbox": [0.565828125, 0.0796588868940754, 0.7265312500000001, 0.308096947935368], "label": "a brown dog"}, {"bbox": [0.794640625, 0.2750987432675045, 0.9384062500000001, 0.481867145421903], "label": "a green sheep"}], "image_id": "483994"}, "203": {"caption": "a photo of a red bear and a brown bear ", "segment": [{"bbox": [0.27340624999999996, 0.054423529411764704, 0.97353125, 0.8274823529411764], "label": "a red bear"}, {"bbox": [0.14090625, 0.27256470588235293, 0.598109375, 0.9430117647058823], "label": "a brown bear"}], "image_id": "502084"}, "204": {"caption": "a photo of a brown car and a yellow suitcase ", "segment": [{"bbox": [0.08036, 0.5429782082324455, 0.93812, 0.9864164648910412], "label": "a brown car"}, {"bbox": [0.45533999999999997, 0.23099273607748186, 0.69616, 0.4801937046004843], "label": "a yellow suitcase"}], "image_id": "27530"}, "205": {"caption": "a photo of a black bed and a red bed ", "segment": [{"bbox": [0.032125, 0.29663934426229505, 0.714515625, 0.9865300546448087], "label": "a black bed"}, {"bbox": [0.40589062499999995, 0.24415300546448088, 0.9038437500000001, 0.9176229508196722], "label": "a red bed"}], "image_id": "270239"}, "206": {"caption": "a photo of a white potted plant and a black potted plant and a red vase and a black vase ", "segment": [{"bbox": [0.0033723653395784543, 0.440453125, 0.5422716627634661, 0.9797812499999999], "label": "a white potted plant"}, {"bbox": [0.5113583138173302, 0.34353125, 1.0, 0.988234375], "label": "a black potted plant"}, {"bbox": [0.5356440281030445, 0.793796875, 0.8846135831381734, 0.9955], "label": "a red vase"}, {"bbox": [0.15519906323185012, 0.763671875, 0.5074941451990632, 0.971859375], "label": "a black vase"}], "image_id": "163447"}, "207": {"caption": "a photo of a blue broccoli and a black dining table ", "segment": [{"bbox": [0.47050000000000003, 0.22288056206088994, 0.692359375, 0.5011709601873536], "label": "a blue broccoli"}, {"bbox": [0.0, 0.0025995316159250588, 0.993828125, 0.9895784543325528], "label": "a black dining table"}], "image_id": "169736"}, "208": {"caption": "a photo of a brown suitcase and a white suitcase and a green suitcase and a black suitcase and a red suitcase and a black suitcase ", "segment": [{"bbox": [0.0, 0.15954166666666666, 0.42303125, 0.9280833333333333], "label": "a brown suitcase"}, {"bbox": [0.52871875, 0.40539583333333334, 1.0, 0.9864791666666667], "label": "a white suitcase"}, {"bbox": [0.122484375, 0.36933333333333335, 0.29865624999999996, 0.9800833333333334], "label": "a green suitcase"}, {"bbox": [0.0735, 0.09441666666666666, 0.534953125, 0.26787500000000003], "label": "a black suitcase"}, {"bbox": [0.20903125, 0.04120833333333333, 0.6180468749999999, 0.22991666666666666], "label": "a red suitcase"}, {"bbox": [0.768109375, 0.6701666666666667, 0.9997187499999999, 0.996625], "label": "a black suitcase"}], "image_id": "507783"}, "209": {"caption": "a photo of a yellow cow and a black cow and a brown cow and a red cow and a red cow ", "segment": [{"bbox": [0.8116562500000001, 0.46214583333333337, 0.9915312500000001, 0.5884791666666668], "label": "a yellow cow"}, {"bbox": [0.280359375, 0.4609166666666667, 0.49678125, 0.6306041666666666], "label": "a black cow"}, {"bbox": [0.49409375000000005, 0.4515, 0.691203125, 0.5908541666666667], "label": "a brown cow"}, {"bbox": [0.53096875, 0.48895833333333333, 0.7252656249999999, 0.6647916666666667], "label": "a red cow"}, {"bbox": [0.051234375, 0.4774791666666667, 0.20495312499999999, 0.6585], "label": "a red cow"}], "image_id": "105367"}, "210": {"caption": "a photo of a yellow cake and a green cake and a red cake and a red cake and a black cake ", "segment": [{"bbox": [0.21331999999999998, 0.6924266666666667, 0.42494, 0.8978666666666668], "label": "a yellow cake"}, {"bbox": [0.29698, 0.7742666666666668, 0.5839000000000001, 0.9890400000000001], "label": "a green cake"}, {"bbox": [0.30842, 0.3370666666666667, 0.50394, 0.4629333333333334], "label": "a red cake"}, {"bbox": [0.2793, 0.7413333333333333, 0.46826, 0.9290666666666666], "label": "a red cake"}, {"bbox": [0.144, 0.632, 0.732, 0.8426666666666667], "label": "a black cake"}], "image_id": "330237"}, "211": {"caption": "a photo of a red zebra and a brown zebra and a white giraffe ", "segment": [{"bbox": [0.4318905472636816, 0.52998, 0.705547263681592, 0.8654400000000001], "label": "a red zebra"}, {"bbox": [0.6540298507462687, 0.50718, 0.9838557213930348, 0.7746000000000001], "label": "a brown zebra"}, {"bbox": [0.0, 0.20188, 0.6484328358208956, 0.7457], "label": "a white giraffe"}], "image_id": "383282"}, "212": {"caption": "a photo of a brown dining table and a white wine glass ", "segment": [{"bbox": [0.15314583333333334, 0.005625, 1.0, 0.989859375], "label": "a brown dining table"}, {"bbox": [0.8184166666666666, 0.044437500000000005, 0.9950416666666667, 0.2678125], "label": "a white wine glass"}], "image_id": "31625"}, "213": {"caption": "a photo of a brown car and a white truck ", "segment": [{"bbox": [0.8270312499999999, 0.7655625, 0.992, 0.932875], "label": "a brown car"}, {"bbox": [0.8267187500000001, 0.7613541666666667, 0.99103125, 0.9261041666666666], "label": "a white truck"}], "image_id": "216790"}, "214": {"caption": "a photo of a white cat and a red bed and a white cat ", "segment": [{"bbox": [0.114890625, 0.5640625, 0.48421875, 0.7125833333333333], "label": "a white cat"}, {"bbox": [0.0016875000000000002, 0.30258333333333337, 0.9972031250000001, 0.9819583333333334], "label": "a red bed"}, {"bbox": [0.587296875, 0.5075416666666667, 0.86915625, 0.7252083333333333], "label": "a white cat"}], "image_id": "553547"}, "215": {"caption": "a photo of a yellow tv and a black sink ", "segment": [{"bbox": [0.421296875, 0.4814519906323185, 0.559234375, 0.6297658079625293], "label": "a yellow tv"}, {"bbox": [0.0, 0.6898829039812646, 0.1364375, 0.9887587822014051], "label": "a black sink"}], "image_id": "239041"}, "216": {"caption": "a photo of a black chair and a red dining table ", "segment": [{"bbox": [0.0, 0.291265625, 0.7074117647058823, 1.0], "label": "a black chair"}, {"bbox": [0.0, 0.36553125, 0.15915294117647058, 0.539390625], "label": "a red dining table"}], "image_id": "362023"}, "217": {"caption": "a photo of a brown bird and a black bird ", "segment": [{"bbox": [0.31639062500000004, 0.24482517482517482, 0.46618750000000003, 0.7825174825174825], "label": "a brown bird"}, {"bbox": [0.42625, 0.3824475524475524, 0.5962343750000001, 0.8226573426573426], "label": "a black bird"}], "image_id": "531136"}, "218": {"caption": "a photo of a black car and a blue clock ", "segment": [{"bbox": [0.037484375, 0.45618266978922717, 0.419796875, 0.9280796252927399], "label": "a black car"}, {"bbox": [0.241859375, 0.0747775175644028, 0.7812812499999999, 0.5605152224824356], "label": "a blue clock"}], "image_id": "16838"}, "219": {"caption": "a photo of a red horse and a white motorcycle and a blue motorcycle ", "segment": [{"bbox": [0.10900000000000001, 0.26477083333333334, 0.28117187499999996, 0.484], "label": "a red horse"}, {"bbox": [0.11485937500000001, 0.16104166666666667, 0.9408749999999999, 0.8592291666666667], "label": "a white motorcycle"}, {"bbox": [0.015171875000000001, 0.2612291666666667, 0.3438125, 0.6859583333333333], "label": "a blue motorcycle"}], "image_id": "262394"}, "220": {"caption": "a photo of a blue sheep and a brown sheep ", "segment": [{"bbox": [0.43776562500000005, 0.39829166666666665, 0.5681406250000001, 0.5613750000000001], "label": "a blue sheep"}, {"bbox": [0.736125, 0.441375, 0.916953125, 0.6529583333333334], "label": "a brown sheep"}], "image_id": "391825"}, "221": {"caption": "a photo of a brown tv and a yellow chair and a yellow chair and a red bus and a black chair ", "segment": [{"bbox": [0.722984375, 0.2948125, 0.8700468749999999, 0.43472916666666667], "label": "a brown tv"}, {"bbox": [0.0, 0.5738333333333333, 0.3580625, 0.9888958333333332], "label": "a yellow chair"}, {"bbox": [0.207375, 0.57375, 0.47103125000000007, 0.942125], "label": "a yellow chair"}, {"bbox": [0.0016875000000000002, 0.00975, 1.0, 0.989875], "label": "a red bus"}, {"bbox": [0.85078125, 0.76625, 1.0, 0.935], "label": "a black chair"}], "image_id": "363286"}, "222": {"caption": "a photo of a white toilet and a brown sink and a blue book and a blue book ", "segment": [{"bbox": [0.41881250000000003, 0.811244131455399, 0.8226875, 0.9887558685446008], "label": "a white toilet"}, {"bbox": [0.003, 0.6283802816901408, 0.17690625, 0.9684741784037558], "label": "a brown sink"}, {"bbox": [0.625984375, 0.2188262910798122, 0.967546875, 0.6257042253521127], "label": "a blue book"}, {"bbox": [0.46325000000000005, 0.811244131455399, 0.738859375, 1.0], "label": "a blue book"}], "image_id": "314016"}, "223": {"caption": "a photo of a brown bicycle and a green bus and a white bicycle ", "segment": [{"bbox": [0.691421875, 0.5490833333333334, 0.8716875, 0.8500208333333333], "label": "a brown bicycle"}, {"bbox": [0.0016875000000000002, 0.10562500000000001, 0.9977500000000001, 0.896625], "label": "a green bus"}, {"bbox": [0.0, 0.78625, 0.20875, 1.0], "label": "a white bicycle"}], "image_id": "196843"}, "224": {"caption": "a photo of a blue traffic light and a red traffic light ", "segment": [{"bbox": [0.29317187499999997, 0.30338028169014086, 0.5444687500000001, 0.8471830985915493], "label": "a blue traffic light"}, {"bbox": [0.50984375, 0.295868544600939, 0.6595000000000001, 0.5357042253521127], "label": "a red traffic light"}], "image_id": "455170"}, "225": {"caption": "a photo of a red cake and a green cake and a white cake and a yellow cake and a black cake and a blue oven ", "segment": [{"bbox": [0.11965624999999999, 0.5428, 0.5354375, 0.8108000000000001], "label": "a red cake"}, {"bbox": [0.5805, 0.4853882352941176, 0.9281874999999999, 0.6921411764705881], "label": "a green cake"}, {"bbox": [0.38821875, 0.2973647058823529, 0.70034375, 0.4601176470588236], "label": "a white cake"}, {"bbox": [0.003546875, 0.10962352941176472, 1.0, 0.5508], "label": "a yellow cake"}, {"bbox": [0.005156249999999999, 0.34887058823529415, 0.3303125, 0.5276235294117647], "label": "a black cake"}, {"bbox": [0.0, 0.024776470588235292, 1.0, 1.0], "label": "a blue oven"}], "image_id": "352671"}, "226": {"caption": "a photo of a white bed and a blue bed ", "segment": [{"bbox": [0.31357999999999997, 0.46324324324324323, 0.9049200000000001, 1.0], "label": "a white bed"}, {"bbox": [0.18516, 0.47009009009009006, 0.56296, 0.8243543543543543], "label": "a blue bed"}], "image_id": "105866"}, "227": {"caption": "a photo of a blue chair and a white dining table and a white chair and a blue oven ", "segment": [{"bbox": [0.651515625, 0.6302708333333332, 0.78346875, 0.9503125], "label": "a blue chair"}, {"bbox": [0.45081249999999995, 0.4875833333333333, 0.78, 0.8396458333333333], "label": "a white dining table"}, {"bbox": [0.431453125, 0.52825, 0.596625, 0.815875], "label": "a white chair"}, {"bbox": [0.27023437499999997, 0.35683333333333334, 0.41925, 0.6248333333333332], "label": "a blue oven"}], "image_id": "448795"}, "228": {"caption": "a photo of a white sheep and a white sheep and a yellow sheep ", "segment": [{"bbox": [0.15132812499999998, 0.3688028169014085, 0.6384531250000001, 0.909037558685446], "label": "a white sheep"}, {"bbox": [0.67275, 0.19199530516431926, 0.9692187499999999, 0.573169014084507], "label": "a white sheep"}, {"bbox": [0.391375, 0.28884976525821593, 0.7927500000000001, 0.7931220657276995], "label": "a yellow sheep"}], "image_id": "424289"}, "229": {"caption": "a photo of a black kite and a brown kite and a green kite and a red kite and a red kite and a black kite ", "segment": [{"bbox": [0.435046875, 0.7338333333333333, 0.6110156250000001, 0.9789583333333333], "label": "a black kite"}, {"bbox": [0.234625, 0.7760416666666666, 0.38575, 1.0], "label": "a brown kite"}, {"bbox": [0.161796875, 0.08314583333333332, 0.8022499999999999, 0.8404583333333332], "label": "a green kite"}, {"bbox": [0.26440625, 0.15833333333333333, 0.531140625, 0.46379166666666666], "label": "a red kite"}, {"bbox": [0.40532812500000004, 0.191, 0.605671875, 0.4625833333333334], "label": "a red kite"}, {"bbox": [0.0015625, 0.5791666666666667, 0.8421875, 0.9979166666666667], "label": "a black kite"}], "image_id": "329946"}, "230": {"caption": "a photo of a blue car and a yellow bus and a green truck ", "segment": [{"bbox": [0.0, 0.6516822429906542, 0.38771875, 0.9887616822429908], "label": "a blue car"}, {"bbox": [0.25246875, 0.25, 1.0, 0.7174065420560748], "label": "a yellow bus"}, {"bbox": [0.0, 0.6292056074766356, 0.389234375, 0.9887616822429907], "label": "a green truck"}], "image_id": "154168"}, "231": {"caption": "a photo of a black cat and a blue bed ", "segment": [{"bbox": [0.07503125000000001, 0.25416666666666665, 0.76728125, 0.8689791666666667], "label": "a black cat"}, {"bbox": [0.0, 0.0, 1.0, 0.9887708333333334], "label": "a blue bed"}], "image_id": "357391"}, "232": {"caption": "a photo of a black boat and a yellow boat ", "segment": [{"bbox": [0.02239740820734341, 0.178296875, 0.6283153347732182, 0.35290625000000003], "label": "a black boat"}, {"bbox": [0.14023758099352054, 0.012578125, 0.7488984881209504, 0.246828125], "label": "a yellow boat"}], "image_id": "324785"}, "233": {"caption": "a photo of a blue cup and a blue fork and a yellow pizza and a brown pizza and a red dining table ", "segment": [{"bbox": [0.2690625, 0.005833333333333333, 0.4305, 0.277125], "label": "a blue cup"}, {"bbox": [0.07753125, 0.6981875, 0.41798437499999996, 0.9835833333333334], "label": "a blue fork"}, {"bbox": [0.0016718750000000002, 0.21497916666666667, 1.0, 1.0], "label": "a yellow pizza"}, {"bbox": [0.0, 0.008354166666666666, 0.286328125, 0.247625], "label": "a brown pizza"}, {"bbox": [0.006734374999999999, 0.0022500000000000003, 1.0, 0.4471875], "label": "a red dining table"}], "image_id": "163611"}, "234": {"caption": "a photo of a black toilet and a yellow sink ", "segment": [{"bbox": [0.0, 0.507859375, 0.3535625, 0.9977499999999999], "label": "a black toilet"}, {"bbox": [0.08408333333333333, 0.40653125, 0.46845833333333337, 0.550671875], "label": "a yellow sink"}], "image_id": "470348"}, "235": {"caption": "a photo of a white cow and a blue cow and a yellow cow ", "segment": [{"bbox": [0.19665625, 0.4858614564831261, 0.352421875, 0.705417406749556], "label": "a white cow"}, {"bbox": [0.002453125, 0.5469449378330373, 0.187703125, 0.8549023090586145], "label": "a blue cow"}, {"bbox": [0.06889062500000001, 0.32902309058614565, 0.367515625, 0.6197868561278863], "label": "a yellow cow"}], "image_id": "137576"}, "236": {"caption": "a photo of a red knife and a white scissors and a brown sink ", "segment": [{"bbox": [0.74946875, 0.38054166666666667, 0.940796875, 0.5891666666666667], "label": "a red knife"}, {"bbox": [0.500796875, 0.075375, 0.7254687499999999, 0.982], "label": "a white scissors"}, {"bbox": [0.805625, 0.32583333333333336, 0.99521875, 0.9797916666666666], "label": "a brown sink"}], "image_id": "456223"}, "237": {"caption": "a photo of a blue oven and a blue oven ", "segment": [{"bbox": [0.42040625, 0.5188333333333334, 0.6271718749999999, 0.6500625], "label": "a blue oven"}, {"bbox": [0.64675, 0.4155833333333333, 0.9116875, 0.9194791666666667], "label": "a blue oven"}], "image_id": "18918"}, "238": {"caption": "a photo of a blue refrigerator and a black oven ", "segment": [{"bbox": [0.32709375, 0.41032786885245903, 0.48778125, 0.8233723653395786], "label": "a blue refrigerator"}, {"bbox": [0.5855625, 0.42529274004683837, 0.727234375, 0.8445433255269321], "label": "a black oven"}], "image_id": "553129"}, "239": {"caption": "a photo of a blue car and a yellow car and a yellow bus and a yellow truck and a yellow truck ", "segment": [{"bbox": [0.144921875, 0.574192037470726, 0.4132187500000001, 0.8279625292740047], "label": "a blue car"}, {"bbox": [0.269875, 0.5052459016393442, 0.45128124999999997, 0.7434426229508196], "label": "a yellow car"}, {"bbox": [0.61171875, 0.24718969555035128, 0.8456093750000001, 0.6943793911007026], "label": "a yellow bus"}, {"bbox": [0.46003125, 0.4607728337236534, 0.60271875, 0.6932786885245901], "label": "a yellow truck"}, {"bbox": [0.052468749999999995, 0.5011241217798594, 0.259375, 0.6876346604215456], "label": "a yellow truck"}], "image_id": "172478"}, "240": {"caption": "a photo of a white dog and a blue bed and a brown handbag ", "segment": [{"bbox": [0.2964375, 0.3512206572769953, 0.592859375, 0.7560798122065728], "label": "a white dog"}, {"bbox": [0.184640625, 0.39842723004694836, 1.0, 0.7451877934272301], "label": "a blue bed"}, {"bbox": [0.495109375, 0.09661971830985915, 0.717984375, 0.2696713615023474], "label": "a brown handbag"}], "image_id": "100196"}, "241": {"caption": "a photo of a white apple and a green apple ", "segment": [{"bbox": [0.38932812499999997, 0.703375, 0.5545, 0.9123541666666667], "label": "a white apple"}, {"bbox": [0.241546875, 0.2668958333333334, 0.7719531249999999, 0.7826666666666667], "label": "a green apple"}], "image_id": "201717"}, "242": {"caption": "a photo of a white couch and a brown dining table ", "segment": [{"bbox": [0.8567031249999999, 0.5964772727272728, 1.0, 0.9952272727272728], "label": "a white couch"}, {"bbox": [0.41460937500000006, 0.7472727272727273, 0.715890625, 0.9996590909090909], "label": "a brown dining table"}], "image_id": "102947"}, "243": {"caption": "a photo of a yellow car and a black car and a white car ", "segment": [{"bbox": [0.5520416666666667, 0.503546875, 0.8546041666666667, 0.71646875], "label": "a yellow car"}, {"bbox": [0.29362499999999997, 0.40225, 0.9857708333333334, 0.986515625], "label": "a black car"}, {"bbox": [0.49022916666666666, 0.84140625, 0.6391249999999999, 0.99603125], "label": "a white car"}], "image_id": "473050"}, "244": {"caption": "a photo of a white horse and a green horse ", "segment": [{"bbox": [0.481984375, 0.05742990654205607, 0.945890625, 0.9898598130841121], "label": "a white horse"}, {"bbox": [0.403828125, 0.4114485981308411, 0.57709375, 0.9082242990654206], "label": "a green horse"}], "image_id": "335450"}, "245": {"caption": "a photo of a red chair and a green dining table ", "segment": [{"bbox": [0.37901562499999997, 0.516375, 0.5605, 0.9788958333333333], "label": "a red chair"}, {"bbox": [0.028234375, 0.44706250000000003, 0.557640625, 1.0], "label": "a green dining table"}], "image_id": "92998"}, "246": {"caption": "a photo of a white car and a brown car and a black motorcycle ", "segment": [{"bbox": [0.01583333333333333, 0.305328125, 0.6159166666666668, 0.702703125], "label": "a white car"}, {"bbox": [0.0, 0.33825, 0.19260416666666666, 0.492125], "label": "a brown car"}, {"bbox": [0.0074375, 0.45726562499999995, 0.9636250000000001, 0.9868124999999999], "label": "a black motorcycle"}], "image_id": "567171"}, "247": {"caption": "a photo of a yellow toilet and a brown sink ", "segment": [{"bbox": [0.7191803278688524, 0.54484375, 0.9275175644028102, 0.7668125], "label": "a yellow toilet"}, {"bbox": [0.07908665105386417, 0.5009375, 0.42074941451990633, 0.665140625], "label": "a brown sink"}], "image_id": "345401"}, "248": {"caption": "a photo of a yellow vase and a blue vase and a red vase and a brown vase and a red vase ", "segment": [{"bbox": [0.39028125, 0.37040485829959513, 0.5689375, 0.7883805668016194], "label": "a yellow vase"}, {"bbox": [0.25715625000000003, 0.25279352226720647, 0.41540625000000003, 0.6581983805668016], "label": "a blue vase"}, {"bbox": [0.547984375, 0.26730769230769236, 0.686640625, 0.6875506072874493], "label": "a red vase"}, {"bbox": [0.725046875, 0.34607287449392715, 0.9089062499999999, 0.7820242914979758], "label": "a brown vase"}, {"bbox": [0.08499999999999999, 0.3011336032388664, 0.234171875, 0.7460728744939271], "label": "a red vase"}], "image_id": "165795"}, "249": {"caption": "a photo of a black dining table and a blue sandwich and a green cup and a white fork and a brown bowl ", "segment": [{"bbox": [0.0, 0.270327868852459, 0.9641875000000001, 0.9885948477751756], "label": "a black dining table"}, {"bbox": [0.314140625, 0.2780327868852459, 0.5564843749999999, 0.8565105386416862], "label": "a blue sandwich"}, {"bbox": [0.003, 0.04269320843091335, 0.259375, 0.5056206088992974], "label": "a green cup"}, {"bbox": [0.73946875, 0.0, 0.941796875, 0.5047306791569087], "label": "a white fork"}, {"bbox": [0.539453125, 0.5979625292740047, 0.730296875, 0.7916627634660423], "label": "a brown bowl"}], "image_id": "373374"}, "250": {"caption": "a photo of a brown laptop and a yellow handbag ", "segment": [{"bbox": [0.32875, 0.3464959016393443, 0.9793749999999999, 0.9604918032786885], "label": "a brown laptop"}, {"bbox": [0.04840625, 0.07028688524590164, 0.781515625, 0.7165573770491803], "label": "a yellow handbag"}], "image_id": "293837"}, "251": {"caption": "a photo of a red bench and a green bench and a green bench ", "segment": [{"bbox": [0.143484375, 0.725988909426987, 0.461609375, 0.8944547134935305], "label": "a red bench"}, {"bbox": [0.48445312500000004, 0.7308133086876155, 0.7910781250000001, 0.8951940850277265], "label": "a green bench"}, {"bbox": [0.0, 0.6560443622920518, 0.134203125, 0.7831238447319778], "label": "a green bench"}], "image_id": "192192"}, "252": {"caption": "a photo of a green teddy bear and a yellow teddy bear and a green teddy bear and a white couch ", "segment": [{"bbox": [0.00965625, 0.15506550218340612, 0.48565625, 0.9258515283842794], "label": "a green teddy bear"}, {"bbox": [0.34168750000000003, 0.07657205240174672, 0.63503125, 0.8063100436681223], "label": "a yellow teddy bear"}, {"bbox": [0.564453125, 0.07639737991266377, 0.9954374999999999, 0.8853930131004366], "label": "a green teddy bear"}, {"bbox": [0.0017812499999999998, 0.0018558951965065502, 1.0, 0.9820087336244543], "label": "a white couch"}], "image_id": "520636"}, "253": {"caption": "a photo of a green tv and a red couch and a red chair ", "segment": [{"bbox": [0.338203125, 0.30093457943925234, 0.5953593749999999, 0.5238084112149533], "label": "a green tv"}, {"bbox": [0.756484375, 0.5013084112149533, 0.9952187499999999, 0.9572196261682243], "label": "a red couch"}, {"bbox": [0.75440625, 0.5049299065420562, 1.0, 0.9139252336448599], "label": "a red chair"}], "image_id": "132540"}, "254": {"caption": "a photo of a brown cat and a white bed ", "segment": [{"bbox": [0.01821875, 0.0042925659472422065, 1.0, 0.9892565947242207], "label": "a brown cat"}, {"bbox": [0.0, 0.562158273381295, 0.77109375, 1.0], "label": "a white bed"}], "image_id": "405306"}, "255": {"caption": "a photo of a green wine glass and a yellow pizza and a green pizza and a blue pizza and a brown pizza and a blue dining table ", "segment": [{"bbox": [0.65809375, 0.02023529411764706, 1.0, 0.5685411764705882], "label": "a green wine glass"}, {"bbox": [0.34173437500000003, 0.38425882352941176, 0.61034375, 0.7707764705882354], "label": "a yellow pizza"}, {"bbox": [0.2734375, 0.27941176470588236, 0.553984375, 0.6564235294117647], "label": "a green pizza"}, {"bbox": [0.116390625, 0.5236, 0.33875, 0.9865176470588235], "label": "a blue pizza"}, {"bbox": [0.310765625, 0.8044941176470589, 0.655109375, 1.0], "label": "a brown pizza"}, {"bbox": [0.0018124999999999999, 0.0, 1.0, 1.0], "label": "a blue dining table"}], "image_id": "440123"}, "256": {"caption": "a photo of a green elephant and a red elephant ", "segment": [{"bbox": [0.206703125, 0.23154296875, 0.69134375, 0.7841796875], "label": "a green elephant"}, {"bbox": [0.370828125, 0.484375, 0.5208281250000001, 0.7994726562500001], "label": "a red elephant"}], "image_id": "94852"}, "257": {"caption": "a photo of a blue bus and a brown car ", "segment": [{"bbox": [0.181421875, 0.40674473067915695, 0.8471093749999999, 0.7348243559718969], "label": "a blue bus"}, {"bbox": [0.0015625, 0.5717564402810305, 0.230765625, 0.7882435597189695], "label": "a brown car"}], "image_id": "566823"}, "258": {"caption": "a photo of a white cell phone and a yellow remote ", "segment": [{"bbox": [0.6191875, 0.5665411764705882, 0.7854687499999999, 0.8648705882352941], "label": "a white cell phone"}, {"bbox": [0.6697968750000001, 0.4940470588235294, 0.817734375, 0.6869647058823529], "label": "a yellow remote"}], "image_id": "205906"}, "259": {"caption": "a photo of a yellow car and a red truck ", "segment": [{"bbox": [0.86875, 0.4747764705882353, 1.0, 0.6676235294117647], "label": "a yellow car"}, {"bbox": [0.248640625, 0.2379529411764706, 0.8228125000000001, 0.8564705882352941], "label": "a red truck"}], "image_id": "500613"}, "260": {"caption": "a photo of a yellow broccoli and a black broccoli and a green broccoli and a white knife and a yellow fork and a brown bowl ", "segment": [{"bbox": [0.346875, 0.13647058823529412, 0.565625, 0.4588235294117647], "label": "a yellow broccoli"}, {"bbox": [0.28215625, 0.5988235294117648, 0.49103125, 0.8077411764705883], "label": "a black broccoli"}, {"bbox": [0.29096875, 0.31625882352941176, 0.47701562499999994, 0.605035294117647], "label": "a green broccoli"}, {"bbox": [0.34173437500000003, 0.02472941176470588, 1.0, 0.5910117647058823], "label": "a white knife"}, {"bbox": [0.145109375, 0.3151294117647059, 0.415109375, 1.0], "label": "a yellow fork"}, {"bbox": [0.0, 0.0, 0.998671875, 1.0], "label": "a brown bowl"}], "image_id": "209142"}, "261": {"caption": "a photo of a green potted plant and a brown couch and a green chair and a yellow chair and a yellow couch and a green chair ", "segment": [{"bbox": [0.7835, 0.02425587467362924, 0.959125, 0.37415143603133155], "label": "a green potted plant"}, {"bbox": [0.0012812499999999998, 0.537780678851175, 0.346734375, 0.9841253263707571], "label": "a brown couch"}, {"bbox": [0.604875, 0.42579634464751964, 0.7760312500000001, 0.7849347258485639], "label": "a green chair"}, {"bbox": [0.63046875, 0.5163707571801567, 0.99825, 0.987467362924282], "label": "a yellow chair"}, {"bbox": [0.43840625, 0.44723237597911225, 0.6330625, 0.6678590078328982], "label": "a yellow couch"}, {"bbox": [0.44089062500000004, 0.44725848563968673, 0.6221093750000001, 0.6710182767624021], "label": "a green chair"}], "image_id": "83059"}, "262": {"caption": "a photo of a brown fork and a green cake and a black dining table ", "segment": [{"bbox": [0.0033750000000000004, 0.45325, 0.731453125, 0.8105416666666667], "label": "a brown fork"}, {"bbox": [0.27534375, 0.09033333333333333, 0.936984375, 0.9558125000000001], "label": "a green cake"}, {"bbox": [0.00584375, 0.0032500000000000003, 1.0, 0.9824583333333333], "label": "a black dining table"}], "image_id": "112818"}, "263": {"caption": "a photo of a green truck and a yellow truck ", "segment": [{"bbox": [0.22191999999999998, 0.37752293577981655, 0.97438, 0.9191131498470948], "label": "a green truck"}, {"bbox": [0.01502, 0.5511926605504588, 0.22472, 0.7574311926605505], "label": "a yellow truck"}], "image_id": "172201"}, "264": {"caption": "a photo of a red spoon and a brown broccoli and a yellow broccoli and a red broccoli and a yellow oven ", "segment": [{"bbox": [0.381640625, 0.5438349514563107, 0.9793125, 0.8100485436893204], "label": "a red spoon"}, {"bbox": [0.218765625, 0.5548058252427185, 0.39731249999999996, 0.8150728155339806], "label": "a brown broccoli"}, {"bbox": [0.44498437500000004, 0.4270631067961165, 0.8064375, 0.667888349514563], "label": "a yellow broccoli"}, {"bbox": [0.07165625, 0.5984466019417476, 0.33664062499999997, 0.810995145631068], "label": "a red broccoli"}, {"bbox": [0.17054687500000001, 0.14286407766990292, 1.0, 0.6753155339805825], "label": "a yellow oven"}], "image_id": "144200"}, "265": {"caption": "a photo of a brown tv and a blue laptop and a blue keyboard and a brown tv ", "segment": [{"bbox": [0.19443749999999999, 0.05616666666666667, 0.6264062499999999, 0.4058125], "label": "a brown tv"}, {"bbox": [0.076015625, 0.375, 0.42229687499999996, 0.8502291666666667], "label": "a blue laptop"}, {"bbox": [0.245515625, 0.7356458333333333, 0.612109375, 0.9239999999999999], "label": "a blue keyboard"}, {"bbox": [0.641328125, 0.15154166666666666, 0.9011875, 0.38129166666666664], "label": "a brown tv"}], "image_id": "270096"}, "266": {"caption": "a photo of a white couch and a white chair ", "segment": [{"bbox": [0.001437246963562753, 0.5225757575757576, 0.4798178137651822, 0.9978484848484848], "label": "a white couch"}, {"bbox": [0.20641700404858299, 0.46693939393939393, 0.33688259109311747, 0.6793939393939393], "label": "a white chair"}], "image_id": "96402"}, "267": {"caption": "a photo of a blue sheep and a yellow sheep and a blue sheep and a brown sheep and a white sheep ", "segment": [{"bbox": [0.27928125000000004, 0.4409133489461359, 0.673078125, 0.9859250585480094], "label": "a blue sheep"}, {"bbox": [0.28409375, 0.2537704918032787, 0.6671875, 0.703231850117096], "label": "a yellow sheep"}, {"bbox": [0.0071874999999999994, 0.3178922716627635, 0.301953125, 0.8178922716627635], "label": "a blue sheep"}, {"bbox": [0.0014375, 0.11182669789227166, 0.20231249999999998, 0.4494613583138173], "label": "a brown sheep"}, {"bbox": [0.6209374999999999, 0.34398126463700235, 1.0, 1.0], "label": "a white sheep"}], "image_id": "269196"}, "268": {"caption": "a photo of a red teddy bear and a green teddy bear ", "segment": [{"bbox": [0.0948125, 0.09425, 0.6162500000000001, 0.827875], "label": "a red teddy bear"}, {"bbox": [0.488765625, 0.19102083333333333, 0.95225, 0.6471874999999999], "label": "a green teddy bear"}], "image_id": "394132"}, "269": {"caption": "a photo of a green apple and a green apple ", "segment": [{"bbox": [0.182203125, 0.3894054054054054, 0.373703125, 0.5905225225225226], "label": "a green apple"}, {"bbox": [0.21578124999999998, 0.10798198198198199, 0.364375, 0.3145585585585586], "label": "a green apple"}], "image_id": "379055"}, "270": {"caption": "a photo of a yellow cat and a green couch and a blue potted plant ", "segment": [{"bbox": [0.575046875, 0.26943750000000005, 1.0, 0.7337916666666667], "label": "a yellow cat"}, {"bbox": [0.46517187499999996, 0.6827708333333333, 0.9977499999999999, 0.9883958333333334], "label": "a green couch"}, {"bbox": [0.12823437499999998, 0.0, 0.9307031250000002, 0.3409375], "label": "a blue potted plant"}], "image_id": "226220"}, "271": {"caption": "a photo of a white potted plant and a brown book ", "segment": [{"bbox": [0.3342, 0.4694933333333333, 0.6287999999999999, 0.7704], "label": "a white potted plant"}, {"bbox": [0.71642, 0.7918133333333334, 0.9725, 0.9591466666666667], "label": "a brown book"}], "image_id": "271117"}, "272": {"caption": "a photo of a white donut and a blue donut and a yellow donut and a blue donut and a green donut and a yellow donut ", "segment": [{"bbox": [0.6661666666666667, 0.65075, 0.948625, 0.8428125], "label": "a white donut"}, {"bbox": [0.6531874999999999, 0.467421875, 0.9528125, 0.635953125], "label": "a blue donut"}, {"bbox": [0.08731249999999999, 0.223, 0.3341458333333333, 0.389328125], "label": "a yellow donut"}, {"bbox": [0.3714166666666667, 0.271734375, 0.62875, 0.42040625], "label": "a blue donut"}, {"bbox": [0.6272708333333333, 0.266265625, 0.8604166666666667, 0.421484375], "label": "a green donut"}, {"bbox": [0.3746875, 0.13303125, 0.5858958333333334, 0.267140625], "label": "a yellow donut"}], "image_id": "382629"}, "273": {"caption": "a photo of a red vase and a red vase ", "segment": [{"bbox": [0.47228125, 0.32135514018691586, 0.626265625, 0.8853971962616822], "label": "a red vase"}, {"bbox": [0.691125, 0.6141355140186916, 0.8332968749999999, 0.9266355140186916], "label": "a red vase"}], "image_id": "426852"}, "274": {"caption": "a photo of a brown horse and a yellow horse and a white horse ", "segment": [{"bbox": [0.020984375, 0.4044964871194379, 0.21290625, 0.6314519906323185], "label": "a brown horse"}, {"bbox": [0.235734375, 0.37278688524590164, 0.44575, 0.64903981264637], "label": "a yellow horse"}, {"bbox": [0.42603125000000003, 0.4174473067915691, 0.5845312500000001, 0.6661592505854801], "label": "a white horse"}], "image_id": "547886"}, "275": {"caption": "a photo of a black dog and a brown dog ", "segment": [{"bbox": [0.45458666666666664, 0.35822000000000004, 0.8481333333333334, 0.99782], "label": "a black dog"}, {"bbox": [0.13624, 0.25164, 0.53992, 0.99746], "label": "a brown dog"}], "image_id": "370210"}, "276": {"caption": "a photo of a red bottle and a red sink and a blue bird and a white bird ", "segment": [{"bbox": [0.8296458333333334, 0.66865625, 0.9817708333333334, 0.8290625], "label": "a red bottle"}, {"bbox": [0.5243541666666667, 0.77753125, 1.0, 0.9977499999999999], "label": "a red sink"}, {"bbox": [0.058333333333333334, 0.8446093749999999, 0.214125, 1.0], "label": "a blue bird"}, {"bbox": [0.8355833333333333, 0.21359374999999997, 0.9631666666666666, 0.423453125], "label": "a white bird"}], "image_id": "146276"}, "277": {"caption": "a photo of a brown cat and a red cat ", "segment": [{"bbox": [0.0033750000000000004, 0.22920833333333332, 0.937078125, 0.9887708333333333], "label": "a brown cat"}, {"bbox": [0.0, 0.2584166666666667, 0.45337500000000003, 0.9842708333333334], "label": "a red cat"}], "image_id": "230151"}, "278": {"caption": "a photo of a green motorcycle and a white motorcycle and a brown motorcycle and a blue motorcycle and a yellow truck and a white motorcycle ", "segment": [{"bbox": [0.07646875, 0.0314519906323185, 0.8515937499999999, 0.9595550351288057], "label": "a green motorcycle"}, {"bbox": [0.730921875, 0.026604215456674473, 0.9426875000000001, 0.2602341920374707], "label": "a white motorcycle"}, {"bbox": [0.00775, 0.06412177985948478, 0.18082812499999998, 0.19704918032786886], "label": "a brown motorcycle"}, {"bbox": [0.787734375, 0.052974238875878224, 0.96578125, 0.21381733021077287], "label": "a blue motorcycle"}, {"bbox": [0.646953125, 0.0, 1.0, 0.20138173302107726], "label": "a yellow truck"}, {"bbox": [0.532546875, 0.049320843091334894, 0.718046875, 0.2331850117096019], "label": "a white motorcycle"}], "image_id": "487059"}, "279": {"caption": "a photo of a brown zebra and a green zebra ", "segment": [{"bbox": [0.5912200000000001, 0.14077333333333333, 0.76858, 0.52816], "label": "a brown zebra"}, {"bbox": [0.13682, 0.14413333333333334, 0.375, 0.5292800000000001], "label": "a green zebra"}], "image_id": "379235"}, "280": {"caption": "a photo of a red refrigerator and a black sink and a yellow oven and a red potted plant ", "segment": [{"bbox": [0.1825, 0.23901639344262296, 0.454765625, 0.8533723653395784], "label": "a red refrigerator"}, {"bbox": [0.088140625, 0.6660655737704919, 0.2444375, 0.8350819672131149], "label": "a black sink"}, {"bbox": [0.6384531250000001, 0.541288056206089, 0.833, 0.8408196721311475], "label": "a yellow oven"}, {"bbox": [0.091125, 0.027142857142857142, 0.431953125, 0.476768149882904], "label": "a red potted plant"}], "image_id": "38963"}, "281": {"caption": "a photo of a green donut and a white donut and a green donut and a white dining table ", "segment": [{"bbox": [0.44420312500000003, 0.057494145199063235, 0.99721875, 0.787423887587822], "label": "a green donut"}, {"bbox": [0.20840625, 0.25618266978922716, 0.48278125000000005, 0.6831381733021077], "label": "a white donut"}, {"bbox": [0.362828125, 0.13707259953161594, 0.572734375, 0.32807962529274004], "label": "a green donut"}, {"bbox": [0.0025781249999999997, 0.006744730679156909, 0.99703125, 0.9958548009367681], "label": "a white dining table"}], "image_id": "149022"}, "282": {"caption": "a photo of a yellow car and a yellow motorcycle ", "segment": [{"bbox": [0.58226, 0.036213333333333333, 0.9532200000000001, 0.5286666666666666], "label": "a yellow car"}, {"bbox": [0.09731999999999999, 0.022586666666666668, 0.8808799999999999, 0.9845600000000001], "label": "a yellow motorcycle"}], "image_id": "178078"}, "283": {"caption": "a photo of a green toilet and a red sink ", "segment": [{"bbox": [0.19444, 0.41728365384615385, 0.51976, 0.9116826923076923], "label": "a green toilet"}, {"bbox": [0.4079, 0.39197115384615383, 0.98462, 0.7580288461538462], "label": "a red sink"}], "image_id": "79446"}, "284": {"caption": "a photo of a white chair and a brown chair and a blue chair and a black cup and a blue pizza ", "segment": [{"bbox": [0.5081562500000001, 0.025350467289719625, 0.6971718750000001, 0.25128504672897195], "label": "a white chair"}, {"bbox": [0.6871562499999999, 0.0, 0.84959375, 0.2669859813084112], "label": "a brown chair"}, {"bbox": [0.0, 0.14476635514018693, 0.19971875, 0.4654205607476636], "label": "a blue chair"}, {"bbox": [0.007515625, 0.212803738317757, 0.160796875, 0.6375233644859813], "label": "a black cup"}, {"bbox": [0.038578125000000005, 0.2164252336448598, 0.99646875, 0.729696261682243], "label": "a blue pizza"}], "image_id": "384822"}, "285": {"caption": "a photo of a green hot dog and a yellow hot dog and a blue hot dog ", "segment": [{"bbox": [0.0017656249999999998, 0.0023541666666666663, 0.3219375, 0.9481041666666666], "label": "a green hot dog"}, {"bbox": [0.289890625, 0.0, 0.7196562500000001, 0.9842708333333333], "label": "a yellow hot dog"}, {"bbox": [0.597953125, 0.0, 1.0, 0.9459791666666667], "label": "a blue hot dog"}], "image_id": "388211"}, "286": {"caption": "a photo of a green cat and a white car ", "segment": [{"bbox": [0.41703124999999996, 0.3652916666666667, 0.60453125, 0.5355624999999999], "label": "a green cat"}, {"bbox": [0.0033750000000000004, 0.041666666666666664, 0.9983124999999999, 0.9876041666666667], "label": "a white car"}], "image_id": "181963"}, "287": {"caption": "a photo of a blue bottle and a yellow refrigerator ", "segment": [{"bbox": [0.6070625, 0.7944375, 0.7805156249999999, 0.9978541666666666], "label": "a blue bottle"}, {"bbox": [0.0016875000000000002, 0.0018750000000000001, 0.9994375, 0.9883958333333333], "label": "a yellow refrigerator"}], "image_id": "575834"}, "288": {"caption": "a photo of a green dining table and a brown chair ", "segment": [{"bbox": [0.778390625, 0.5401647058823529, 0.9987187500000001, 0.8291058823529411], "label": "a green dining table"}, {"bbox": [0.21190625000000002, 0.5415764705882352, 0.43276562500000004, 0.8719058823529411], "label": "a brown chair"}], "image_id": "303970"}, "289": {"caption": "a photo of a red boat and a brown boat and a yellow boat and a yellow boat ", "segment": [{"bbox": [0.003359375, 0.43856249999999997, 0.5852031249999999, 1.0], "label": "a red boat"}, {"bbox": [0.239796875, 0.24489583333333334, 1.0, 0.5691666666666666], "label": "a brown boat"}, {"bbox": [0.396265625, 0.0, 0.8979531250000001, 0.2335625], "label": "a yellow boat"}, {"bbox": [0.043625000000000004, 0.08075, 0.44631250000000006, 0.37829166666666664], "label": "a yellow boat"}], "image_id": "400547"}, "290": {"caption": "a photo of a red cat and a yellow couch and a white suitcase ", "segment": [{"bbox": [0.349859375, 0.37527083333333333, 0.6553125, 0.5758958333333334], "label": "a red cat"}, {"bbox": [0.682109375, 0.0021458333333333334, 1.0, 0.3857708333333333], "label": "a yellow couch"}, {"bbox": [0.12640625, 0.46291666666666664, 1.0, 0.9887708333333334], "label": "a white suitcase"}], "image_id": "274800"}, "291": {"caption": "a photo of a brown mouse and a blue keyboard ", "segment": [{"bbox": [0.33545045045045047, 0.6915, 0.6243243243243243, 0.8192999999999999], "label": "a brown mouse"}, {"bbox": [0.0025225225225225228, 0.15506, 1.0, 0.33484], "label": "a blue keyboard"}], "image_id": "107954"}, "292": {"caption": "a photo of a yellow bench and a white potted plant and a white potted plant and a green potted plant and a blue potted plant and a brown cat ", "segment": [{"bbox": [0.302359375, 0.3063125, 0.731421875, 0.7972916666666666], "label": "a yellow bench"}, {"bbox": [0.003359375, 0.19047916666666667, 0.258390625, 0.8571458333333334], "label": "a white potted plant"}, {"bbox": [0.442265625, 0.6475416666666667, 0.8122187500000001, 0.9995416666666667], "label": "a white potted plant"}, {"bbox": [0.0185, 0.008958333333333334, 0.245515625, 0.36995833333333333], "label": "a green potted plant"}, {"bbox": [0.22753125000000002, 0.0490625, 0.43482812499999995, 0.4108541666666667], "label": "a blue potted plant"}, {"bbox": [0.16218749999999998, 0.6728541666666668, 0.32265625, 0.9756666666666668], "label": "a brown cat"}], "image_id": "279145"}, "293": {"caption": "a photo of a brown potted plant and a white vase ", "segment": [{"bbox": [0.0, 0.05168, 0.9964473684210525, 0.98876], "label": "a brown potted plant"}, {"bbox": [0.17742105263157895, 0.7483200000000001, 0.7185, 0.98652], "label": "a white vase"}], "image_id": "323615"}, "294": {"caption": "a photo of a red bottle and a green sandwich and a green dining table and a brown bowl and a red chair ", "segment": [{"bbox": [0.4836, 0.00408, 0.7056533333333334, 0.48324], "label": "a red bottle"}, {"bbox": [0.002986666666666667, 0.5125, 0.55432, 0.9799200000000001], "label": "a green sandwich"}, {"bbox": [0.0, 0.17078, 0.9947466666666666, 1.0], "label": "a green dining table"}, {"bbox": [0.46266666666666667, 0.15268, 1.0, 0.37956], "label": "a brown bowl"}, {"bbox": [0.15560000000000002, 0.0, 0.5477333333333333, 0.17588], "label": "a red chair"}], "image_id": "321496"}, "295": {"caption": "a photo of a green airplane and a green car and a blue airplane ", "segment": [{"bbox": [0.000171875, 0.25842245989304813, 0.3278125, 0.4539304812834225], "label": "a green airplane"}, {"bbox": [0.371640625, 0.4651604278074866, 0.664484375, 0.7887700534759359], "label": "a green car"}, {"bbox": [0.17181249999999998, 0.21058823529411766, 0.4878125, 0.4445989304812834], "label": "a blue airplane"}], "image_id": "133279"}, "296": {"caption": "a photo of a green cat and a brown laptop and a white bottle ", "segment": [{"bbox": [0.041203125, 0.29678082191780825, 0.977265625, 0.834406392694064], "label": "a green cat"}, {"bbox": [0.006125, 0.0046803652968036525, 0.9997656249999999, 0.9331050228310502], "label": "a brown laptop"}, {"bbox": [0.858734375, 0.0, 0.994953125, 0.3923744292237443], "label": "a white bottle"}], "image_id": "80949"}, "297": {"caption": "a photo of a yellow car and a white car and a green motorcycle and a white backpack ", "segment": [{"bbox": [0.329265625, 0.010753138075313806, 0.67459375, 0.19140167364016736], "label": "a yellow car"}, {"bbox": [0.852375, 0.004372384937238493, 0.9997343749999998, 0.13217573221757323], "label": "a white car"}, {"bbox": [0.098578125, 0.15244769874476988, 0.867171875, 0.82581589958159], "label": "a green motorcycle"}, {"bbox": [0.784015625, 0.6248326359832637, 0.9978281250000001, 0.8091422594142259], "label": "a white backpack"}], "image_id": "255279"}, "298": {"caption": "a photo of a yellow tv and a blue keyboard ", "segment": [{"bbox": [0.19424999999999998, 0.012395833333333333, 0.831078125, 0.6835625000000001], "label": "a yellow tv"}, {"bbox": [0.21979687499999997, 0.7876875, 0.81040625, 0.9554791666666667], "label": "a blue keyboard"}], "image_id": "361527"}, "299": {"caption": "a photo of a black bicycle and a white cell phone ", "segment": [{"bbox": [0.7195733333333333, 0.6479600000000001, 1.0, 0.9232], "label": "a black bicycle"}, {"bbox": [0.3258666666666667, 0.24364, 0.568, 0.6023999999999999], "label": "a white cell phone"}], "image_id": "87493"}, "300": {"caption": "a photo of a blue couch and a brown chair and a white book and a black book ", "segment": [{"bbox": [0.13545197740112996, 0.5065333333333333, 0.8255932203389831, 0.8603466666666667], "label": "a blue couch"}, {"bbox": [0.1833050847457627, 0.5696, 0.6951129943502825, 0.9988266666666666], "label": "a brown chair"}, {"bbox": [0.6456214689265537, 0.11312, 0.8751412429378531, 0.25994666666666666], "label": "a white book"}, {"bbox": [0.10734463276836158, 0.192, 0.9830508474576272, 0.5786666666666667], "label": "a black book"}], "image_id": "350961"}, "301": {"caption": "a photo of a yellow dining table and a yellow dining table and a green umbrella and a black umbrella and a red umbrella and a black umbrella ", "segment": [{"bbox": [0.241015625, 0.5780833333333334, 0.416296875, 0.9601041666666668], "label": "a yellow dining table"}, {"bbox": [0.593265625, 0.5528125, 0.8106718749999999, 0.8022500000000001], "label": "a yellow dining table"}, {"bbox": [0.0455, 0.2561875, 0.510671875, 0.703375], "label": "a green umbrella"}, {"bbox": [0.490453125, 0.10972916666666667, 0.765171875, 0.2468125], "label": "a black umbrella"}, {"bbox": [0.1865, 0.09575, 0.44403125, 0.2667291666666667], "label": "a red umbrella"}, {"bbox": [0.512140625, 0.2567083333333333, 0.96453125, 0.507875], "label": "a black umbrella"}], "image_id": "142826"}, "302": {"caption": "a photo of a white dog and a white bed ", "segment": [{"bbox": [0.3917979797979798, 0.023625, 0.9794949494949495, 0.9731249999999999], "label": "a white dog"}, {"bbox": [0.42806060606060603, 0.0033750000000000004, 0.992989898989899, 0.9358124999999999], "label": "a white bed"}], "image_id": "511307"}, "303": {"caption": "a photo of a blue dining table and a red couch ", "segment": [{"bbox": [0.361703125, 0.547875, 0.61346875, 0.734625], "label": "a blue dining table"}, {"bbox": [0.115375, 0.48575, 0.316734375, 0.6462083333333334], "label": "a red couch"}], "image_id": "11305"}, "304": {"caption": "a photo of a yellow toilet and a white sink ", "segment": [{"bbox": [0.5852031249999999, 0.461875, 0.7920468749999999, 0.9137708333333333], "label": "a yellow toilet"}, {"bbox": [0.48457812499999997, 0.5183125, 0.62765625, 0.8575833333333333], "label": "a white sink"}], "image_id": "34701"}, "305": {"caption": "a photo of a black umbrella and a red bottle and a black bench and a red bench and a yellow dining table and a red bench ", "segment": [{"bbox": [0.0, 0.00014583333333333335, 0.783703125, 0.8450833333333333], "label": "a black umbrella"}, {"bbox": [0.701609375, 0.0017916666666666667, 0.9983906250000001, 0.9867291666666667], "label": "a red bottle"}, {"bbox": [0.327703125, 0.6542708333333334, 0.706078125, 0.9876041666666667], "label": "a black bench"}, {"bbox": [0.0033750000000000004, 0.59775, 0.165171875, 0.9887708333333334], "label": "a red bench"}, {"bbox": [0.0, 0.5754791666666667, 0.2200625, 0.8440416666666667], "label": "a yellow dining table"}, {"bbox": [0.5646093750000001, 0.5546875, 0.701125, 0.70075], "label": "a red bench"}], "image_id": "404526"}, "306": {"caption": "a photo of a red truck and a white truck and a yellow truck ", "segment": [{"bbox": [0.32684375, 0.2067447306791569, 0.833609375, 0.8089929742388761], "label": "a red truck"}, {"bbox": [0.810796875, 0.3174941451990632, 0.966375, 0.651569086651054], "label": "a white truck"}, {"bbox": [0.1454375, 0.37283372365339573, 0.34987500000000005, 0.5829508196721311], "label": "a yellow truck"}], "image_id": "137211"}, "307": {"caption": "a photo of a brown bicycle and a green backpack ", "segment": [{"bbox": [0.1858125, 0.1804375, 0.846703125, 0.8676250000000001], "label": "a brown bicycle"}, {"bbox": [0.487140625, 0.4813125, 0.63428125, 0.6394166666666667], "label": "a green backpack"}], "image_id": "292819"}, "308": {"caption": "a photo of a green sports ball and a blue baseball glove and a blue bench ", "segment": [{"bbox": [0.39409375, 0.4106759906759907, 0.633609375, 0.7739160839160839], "label": "a green sports ball"}, {"bbox": [0.20635937499999998, 0.0, 0.9595312499999998, 0.9865268065268066], "label": "a blue baseball glove"}, {"bbox": [0.0, 0.0, 0.9976406250000001, 0.987016317016317], "label": "a blue bench"}], "image_id": "5934"}, "309": {"caption": "a photo of a blue spoon and a black cake ", "segment": [{"bbox": [0.7924800000000001, 0.04368, 1.0, 0.6243733333333333], "label": "a blue spoon"}, {"bbox": [0.24606, 0.09850666666666666, 0.6623600000000001, 0.5456799999999999], "label": "a black cake"}], "image_id": "573196"}, "310": {"caption": "a photo of a red bowl and a green banana and a red apple and a red orange and a brown cup and a black dining table ", "segment": [{"bbox": [0.07815359477124183, 0.5534640522875818, 0.44679738562091503, 0.926078431372549], "label": "a red bowl"}, {"bbox": [0.5126797385620915, 0.43098039215686273, 0.9549346405228759, 0.8675980392156863], "label": "a green banana"}, {"bbox": [0.6959313725490196, 0.10200980392156862, 0.9311764705882353, 0.3268464052287582], "label": "a red apple"}, {"bbox": [0.16745098039215686, 0.08727124183006535, 0.39150326797385626, 0.3207516339869281], "label": "a red orange"}, {"bbox": [0.4205718954248366, 0.12380718954248365, 0.5916993464052288, 0.36272875816993466], "label": "a brown cup"}, {"bbox": [0.0363562091503268, 0.03895424836601307, 0.971421568627451, 0.9688235294117649], "label": "a black dining table"}], "image_id": "490871"}, "311": {"caption": "a photo of a red cow and a red cow ", "segment": [{"bbox": [0.383828125, 0.4236619718309859, 0.579703125, 0.5962206572769954], "label": "a red cow"}, {"bbox": [0.692921875, 0.41119718309859155, 0.915640625, 0.638943661971831], "label": "a red cow"}], "image_id": "173401"}, "312": {"caption": "a photo of a green giraffe and a white giraffe ", "segment": [{"bbox": [0.0017343750000000002, 0.0, 0.7521093750000001, 0.9324590163934426], "label": "a green giraffe"}, {"bbox": [0.580546875, 0.0, 0.9444531250000001, 0.4597423887587822], "label": "a white giraffe"}], "image_id": "254965"}, "313": {"caption": "a photo of a black dog and a yellow teddy bear ", "segment": [{"bbox": [0.04224400871459695, 0.008078125, 0.9999782135076253, 0.767671875], "label": "a black dog"}, {"bbox": [0.025119825708061, 0.5045, 0.6783224400871459, 0.9864843750000001], "label": "a yellow teddy bear"}], "image_id": "215554"}, "314": {"caption": "a photo of a black dog and a brown chair and a green dining table ", "segment": [{"bbox": [0.25809375, 0.20545833333333335, 0.64371875, 0.584], "label": "a black dog"}, {"bbox": [0.01225, 0.06854166666666667, 0.5836875, 0.8992708333333332], "label": "a brown chair"}, {"bbox": [0.0, 0.3285416666666666, 0.2776875, 1.0], "label": "a green dining table"}], "image_id": "372294"}, "315": {"caption": "a photo of a black donut and a red bowl ", "segment": [{"bbox": [0.34550000000000003, 0.5438124999999999, 0.63034375, 0.907875], "label": "a black donut"}, {"bbox": [0.0, 0.0, 0.9932812500000001, 0.9867916666666667], "label": "a red bowl"}], "image_id": "521601"}, "316": {"caption": "a photo of a brown dog and a red bottle ", "segment": [{"bbox": [0.0, 0.05370892018779343, 0.776578125, 0.9976291079812207], "label": "a brown dog"}, {"bbox": [0.338953125, 0.6426291079812206, 0.66875, 1.0], "label": "a red bottle"}], "image_id": "382443"}, "317": {"caption": "a photo of a red toilet and a red toilet ", "segment": [{"bbox": [0.10716346153846154, 0.32771875, 0.7156490384615384, 0.606359375], "label": "a red toilet"}, {"bbox": [0.11701923076923076, 0.393953125, 0.8466586538461538, 0.883890625], "label": "a red toilet"}], "image_id": "243810"}, "318": {"caption": "a photo of a white skis and a brown skis and a blue snowboard and a brown skis and a brown skis and a red skis ", "segment": [{"bbox": [0.257046875, 0.27620833333333333, 0.466546875, 0.9898333333333333], "label": "a white skis"}, {"bbox": [0.104125, 0.29883333333333334, 0.30706249999999996, 0.985875], "label": "a brown skis"}, {"bbox": [0.28314062500000003, 0.2876458333333333, 0.4516875000000001, 0.9865208333333333], "label": "a blue snowboard"}, {"bbox": [0.633515625, 0.3348125, 0.79040625, 0.9416666666666667], "label": "a brown skis"}, {"bbox": [0.545453125, 0.32466666666666666, 0.6837656249999999, 0.8779166666666666], "label": "a brown skis"}, {"bbox": [0.15565625, 0.3967708333333333, 0.28931250000000003, 0.7840625], "label": "a red skis"}], "image_id": "50482"}, "319": {"caption": "a photo of a green bowl and a yellow carrot and a white dining table ", "segment": [{"bbox": [0.08565625, 0.035957943925233646, 0.88665625, 0.9617990654205607], "label": "a green bowl"}, {"bbox": [0.27537500000000004, 0.6301401869158878, 0.41240625, 0.8224532710280373], "label": "a yellow carrot"}, {"bbox": [0.0, 0.0, 1.0, 0.9858411214953271], "label": "a white dining table"}], "image_id": "334884"}, "320": {"caption": "a photo of a green motorcycle and a yellow motorcycle ", "segment": [{"bbox": [0.1865174129353234, 0.46201666666666663, 0.8349751243781095, 0.8757333333333333], "label": "a green motorcycle"}, {"bbox": [0.2971641791044776, 0.09394999999999999, 0.7316417910447761, 0.41395], "label": "a yellow motorcycle"}], "image_id": "443351"}, "321": {"caption": "a photo of a black cup and a black sandwich and a brown dining table and a yellow sandwich and a green sandwich ", "segment": [{"bbox": [0.269125, 0.0034583333333333332, 0.478671875, 0.20049999999999998], "label": "a black cup"}, {"bbox": [0.163484375, 0.42883333333333334, 0.655625, 0.9816458333333334], "label": "a black sandwich"}, {"bbox": [0.751953125, 0.4155833333333333, 1.0, 0.74025], "label": "a brown dining table"}, {"bbox": [0.001859375, 0.3350416666666666, 0.5333281249999999, 0.9547916666666667], "label": "a yellow sandwich"}, {"bbox": [0.66503125, 0.05202083333333333, 0.969828125, 0.31802083333333336], "label": "a green sandwich"}], "image_id": "469356"}, "322": {"caption": "a photo of a green dog and a red cat ", "segment": [{"bbox": [0.036296875, 0.15525, 0.4974843750000001, 0.9637083333333333], "label": "a green dog"}, {"bbox": [0.590328125, 0.6128958333333333, 0.9854843750000001, 0.9483958333333333], "label": "a red cat"}], "image_id": "12764"}, "323": {"caption": "a photo of a black refrigerator and a red oven ", "segment": [{"bbox": [0.10870312499999998, 0.23987179487179489, 0.324453125, 0.8862606837606837], "label": "a black refrigerator"}, {"bbox": [0.5965, 0.5775213675213675, 0.769046875, 0.9235897435897437], "label": "a red oven"}], "image_id": "73280"}, "324": {"caption": "a photo of a green bed and a red refrigerator ", "segment": [{"bbox": [0.47359375000000004, 0.42920833333333336, 0.82246875, 0.6674166666666667], "label": "a green bed"}, {"bbox": [0.21779687499999997, 0.14164583333333333, 0.49159375, 0.9636875], "label": "a red refrigerator"}], "image_id": "336001"}, "325": {"caption": "a photo of a brown cow and a brown cow ", "segment": [{"bbox": [0.01846875, 0.5006060606060606, 0.22381249999999997, 0.9736363636363636], "label": "a brown cow"}, {"bbox": [0.443546875, 0.4044903581267218, 0.825921875, 0.9775206611570249], "label": "a brown cow"}], "image_id": "377355"}, "326": {"caption": "a photo of a white chair and a brown teddy bear and a brown bear ", "segment": [{"bbox": [0.05683333333333333, 0.05248437500000001, 1.0, 1.0], "label": "a white chair"}, {"bbox": [0.31760416666666663, 0.031093749999999996, 0.7490624999999999, 0.440078125], "label": "a brown teddy bear"}, {"bbox": [0.32208333333333333, 0.03853125, 0.765375, 0.448921875], "label": "a brown bear"}], "image_id": "417455"}, "327": {"caption": "a photo of a black zebra and a brown zebra and a yellow bird ", "segment": [{"bbox": [0.117984375, 0.10891666666666668, 0.8545, 0.7875833333333333], "label": "a black zebra"}, {"bbox": [0.32359375, 0.02695833333333333, 0.9438124999999999, 0.7550625], "label": "a brown zebra"}, {"bbox": [0.0015625, 0.0020833333333333333, 0.9984375, 0.20416666666666666], "label": "a yellow bird"}], "image_id": "23954"}, "328": {"caption": "a photo of a red bed and a blue chair ", "segment": [{"bbox": [0.0394375, 0.49685912240184754, 0.8100468749999999, 0.9878983833718245], "label": "a red bed"}, {"bbox": [0.11773437499999999, 0.41775981524249417, 0.3444375, 0.5606004618937643], "label": "a blue chair"}], "image_id": "312746"}, "329": {"caption": "a photo of a black sandwich and a white sandwich and a red dining table and a black spoon and a blue bowl ", "segment": [{"bbox": [0.5063125, 0.4417050691244239, 0.8210468750000001, 0.8295852534562211], "label": "a black sandwich"}, {"bbox": [0.49567187500000004, 0.2711981566820277, 0.776953125, 0.6366589861751152], "label": "a white sandwich"}, {"bbox": [0.001515625, 0.004700460829493088, 0.996703125, 0.9890322580645161], "label": "a red dining table"}, {"bbox": [0.42567187500000003, 0.6701382488479262, 0.561015625, 0.8697465437788018], "label": "a black spoon"}, {"bbox": [0.13287500000000002, 0.33670506912442394, 0.496375, 0.7894239631336406], "label": "a blue bowl"}], "image_id": "460507"}, "330": {"caption": "a photo of a yellow banana and a red banana and a yellow banana and a blue banana and a red teddy bear ", "segment": [{"bbox": [0.211203125, 0.48608333333333337, 0.38878124999999997, 0.7560555555555556], "label": "a yellow banana"}, {"bbox": [0.03440625, 0.5294166666666666, 0.209125, 0.7082222222222222], "label": "a red banana"}, {"bbox": [0.6075, 0.7148888888888889, 0.759703125, 0.8701944444444444], "label": "a yellow banana"}, {"bbox": [0.471171875, 0.44, 0.6180937500000001, 0.6305833333333333], "label": "a blue banana"}, {"bbox": [0.169375, 0.0, 0.74578125, 0.3191111111111111], "label": "a red teddy bear"}], "image_id": "236542"}, "331": {"caption": "a photo of a red cat and a brown bed and a red teddy bear ", "segment": [{"bbox": [0.21336000000000002, 0.29096, 0.42672000000000004, 0.7888000000000001], "label": "a red cat"}, {"bbox": [0.09944, 0.23146666666666665, 0.99606, 0.9842666666666667], "label": "a brown bed"}, {"bbox": [0.77308, 0.34336, 1.0, 0.5342133333333333], "label": "a red teddy bear"}], "image_id": "426283"}, "332": {"caption": "a photo of a brown clock and a white bird ", "segment": [{"bbox": [0.32503125, 0.12616666666666668, 0.52353125, 0.38947916666666665], "label": "a brown clock"}, {"bbox": [0.34303125, 0.0022916666666666667, 0.532515625, 0.13179166666666667], "label": "a white bird"}], "image_id": "412443"}, "333": {"caption": "a photo of a blue car and a yellow fire hydrant ", "segment": [{"bbox": [0.7824166666666666, 0.025453125, 1.0, 0.188765625], "label": "a blue car"}, {"bbox": [0.5260625, 0.06928125, 0.8225416666666666, 0.5893124999999999], "label": "a yellow fire hydrant"}], "image_id": "286010"}, "334": {"caption": "a photo of a brown cell phone and a blue teddy bear and a green cat and a green bed ", "segment": [{"bbox": [0.6034375, 0.004375, 0.7835156249999999, 0.15772916666666664], "label": "a brown cell phone"}, {"bbox": [0.38851562500000003, 0.1846875, 0.8952656250000001, 0.9076666666666665], "label": "a blue teddy bear"}, {"bbox": [0.111234375, 0.294375, 0.532578125, 0.7707916666666667], "label": "a green cat"}, {"bbox": [0.0, 0.003916666666666666, 1.0, 0.9882916666666667], "label": "a green bed"}], "image_id": "546896"}, "335": {"caption": "a photo of a yellow potted plant and a blue potted plant and a blue potted plant and a white sink ", "segment": [{"bbox": [0.43742000000000003, 0.13898123324396783, 0.60982, 0.3341018766756032], "label": "a yellow potted plant"}, {"bbox": [0.34198, 0.22037533512064345, 0.47274, 0.3866756032171582], "label": "a blue potted plant"}, {"bbox": [0.17687999999999998, 0.21597855227882037, 0.30716, 0.4715817694369973], "label": "a blue potted plant"}, {"bbox": [0.17434, 0.47640750670241283, 0.6789400000000001, 0.9572922252010724], "label": "a white sink"}], "image_id": "257685"}, "336": {"caption": "a photo of a black broccoli and a green broccoli and a yellow broccoli ", "segment": [{"bbox": [0.44851562500000003, 0.454484375, 0.867390625, 0.8776875000000001], "label": "a black broccoli"}, {"bbox": [0.011796875, 0.38679687500000004, 0.306609375, 0.7476406250000001], "label": "a green broccoli"}, {"bbox": [0.2815, 0.835703125, 0.53409375, 1.0], "label": "a yellow broccoli"}], "image_id": "507536"}, "337": {"caption": "a photo of a yellow stop sign and a red car ", "segment": [{"bbox": [0.30366366366366365, 0.06292, 0.684954954954955, 0.37528], "label": "a yellow stop sign"}, {"bbox": [0.5047147147147147, 0.74086, 1.0, 0.94674], "label": "a red car"}], "image_id": "46099"}, "338": {"caption": "a photo of a red cow and a black cow and a blue cow and a white cow ", "segment": [{"bbox": [0.17209375, 0.5090818363273454, 0.41771874999999997, 0.7792015968063872], "label": "a red cow"}, {"bbox": [0.3999375, 0.5351297405189621, 0.5608593749999999, 0.7621157684630739], "label": "a black cow"}, {"bbox": [0.438171875, 0.5256487025948104, 0.6031718749999999, 0.7281636726546906], "label": "a blue cow"}, {"bbox": [0.5598124999999999, 0.5061876247504989, 0.7471249999999999, 0.805808383233533], "label": "a white cow"}], "image_id": "241453"}, "339": {"caption": "a photo of a green oven and a blue oven and a green sink ", "segment": [{"bbox": [0.5139375, 0.7200416666666667, 0.6504531250000001, 1.0], "label": "a green oven"}, {"bbox": [0.115234375, 0.8059999999999999, 0.3125, 0.9830833333333333], "label": "a blue oven"}, {"bbox": [0.152546875, 0.6465833333333334, 0.4455, 0.8640208333333333], "label": "a green sink"}], "image_id": "541279"}, "340": {"caption": "a photo of a brown toilet and a brown sink ", "segment": [{"bbox": [0.38682812499999997, 0.3063125, 0.856421875, 0.9864791666666667], "label": "a brown toilet"}, {"bbox": [0.694375, 0.494375, 0.9994375, 0.9438124999999999], "label": "a brown sink"}], "image_id": "30432"}, "341": {"caption": "a photo of a green car and a yellow car and a black surfboard ", "segment": [{"bbox": [0.14625, 0.14089411764705884, 1.0, 0.9858352941176471], "label": "a green car"}, {"bbox": [0.770015625, 0.026964705882352943, 0.9983281250000001, 0.5528], "label": "a yellow car"}, {"bbox": [0.35746875, 0.05249411764705882, 0.794609375, 0.23188235294117646], "label": "a black surfboard"}], "image_id": "68852"}, "342": {"caption": "a photo of a yellow teddy bear and a blue teddy bear and a white teddy bear and a red teddy bear and a black teddy bear and a green teddy bear ", "segment": [{"bbox": [0.0053124999999999995, 0.07303125, 0.27877083333333336, 0.328375], "label": "a yellow teddy bear"}, {"bbox": [0.41470833333333335, 0.40531249999999996, 0.6290416666666666, 0.6114374999999999], "label": "a blue teddy bear"}, {"bbox": [0.6570208333333334, 0.120015625, 0.8741875, 0.31640625], "label": "a white teddy bear"}, {"bbox": [0.17295833333333333, 0.0324375, 0.36181250000000004, 0.23553124999999997], "label": "a red teddy bear"}, {"bbox": [0.8183541666666667, 0.415859375, 1.0, 0.619328125], "label": "a black teddy bear"}, {"bbox": [0.27975, 0.42121875, 0.45685416666666673, 0.6045], "label": "a green teddy bear"}], "image_id": "142182"}, "343": {"caption": "a photo of a green sheep and a brown sheep ", "segment": [{"bbox": [0.09273437500000001, 0.4316197183098592, 0.36198437499999997, 0.9889201877934272], "label": "a green sheep"}, {"bbox": [0.540546875, 0.4118544600938967, 0.6909375, 0.7116197183098592], "label": "a brown sheep"}], "image_id": "381786"}, "344": {"caption": "a photo of a brown bowl and a brown bowl and a brown sink and a red sink and a black bottle ", "segment": [{"bbox": [0.5718593750000001, 0.3688916876574307, 0.7827343750000001, 0.7249622166246852], "label": "a brown bowl"}, {"bbox": [0.222546875, 0.41602015113350127, 0.40914062500000004, 0.727758186397985], "label": "a brown bowl"}, {"bbox": [0.15890625, 0.2539294710327456, 0.515765625, 0.8898992443324936], "label": "a brown sink"}, {"bbox": [0.538734375, 0.24914357682619648, 0.88453125, 0.8896221662468514], "label": "a red sink"}, {"bbox": [0.244328125, 0.004710327455919395, 0.380375, 0.20282115869017636], "label": "a black bottle"}], "image_id": "401642"}, "345": {"caption": "a photo of a white broccoli and a yellow broccoli ", "segment": [{"bbox": [0.210359375, 0.34117096018735366, 0.44740625000000006, 0.7105854800936768], "label": "a white broccoli"}, {"bbox": [0.0, 0.3136065573770492, 0.15818749999999998, 0.7807494145199063], "label": "a yellow broccoli"}], "image_id": "264540"}, "346": {"caption": "a photo of a white boat and a black boat and a red boat and a red boat ", "segment": [{"bbox": [0.62978125, 0.09368421052631579, 0.827328125, 0.661578947368421], "label": "a white boat"}, {"bbox": [0.41379687499999995, 0.16137299771167046, 0.6371249999999999, 0.6689016018306636], "label": "a black boat"}, {"bbox": [0.228625, 0.19736842105263158, 0.46799999999999997, 0.7074828375286041], "label": "a red boat"}, {"bbox": [0.089, 0.3691075514874142, 0.38053125000000004, 0.6994279176201372], "label": "a red boat"}], "image_id": "41924"}, "347": {"caption": "a photo of a yellow bed and a green chair ", "segment": [{"bbox": [0.0, 0.11648, 0.8578600000000001, 1.0], "label": "a yellow bed"}, {"bbox": [0.5431, 0.30258666666666667, 0.73554, 0.52664], "label": "a green chair"}], "image_id": "493867"}, "348": {"caption": "a photo of a white giraffe and a white giraffe and a green giraffe and a yellow giraffe and a white giraffe ", "segment": [{"bbox": [0.23184375, 0.37528169014084506, 0.535484375, 0.9865258215962441], "label": "a white giraffe"}, {"bbox": [0.026796874999999998, 0.2574882629107981, 0.3156875, 0.8525586854460094], "label": "a white giraffe"}, {"bbox": [0.5325, 0.29213615023474176, 0.670109375, 0.8921361502347418], "label": "a green giraffe"}, {"bbox": [0.780796875, 0.17753521126760563, 0.96478125, 0.9123708920187794], "label": "a yellow giraffe"}, {"bbox": [0.2279375, 0.2611971830985915, 0.4676406249999999, 0.8504225352112675], "label": "a white giraffe"}], "image_id": "170250"}, "349": {"caption": "a photo of a green tie and a green tie and a green tie and a brown tie and a blue tie and a black tie ", "segment": [{"bbox": [0.6761874999999999, 0.0, 0.9040781250000001, 0.8876346604215456], "label": "a green tie"}, {"bbox": [0.571234375, 0.0, 0.7496562499999999, 0.9460655737704918], "label": "a green tie"}, {"bbox": [0.52025, 0.0, 0.6821875, 0.9685480093676815], "label": "a green tie"}, {"bbox": [0.114203125, 0.0033723653395784543, 0.287015625, 0.8547306791569086], "label": "a brown tie"}, {"bbox": [0.18740625, 0.001873536299765808, 0.33584375, 0.9029976580796253], "label": "a blue tie"}, {"bbox": [0.47528125, 0.0041217798594847775, 0.60271875, 0.9659250585480094], "label": "a black tie"}], "image_id": "340422"}, "350": {"caption": "a photo of a yellow elephant and a white elephant and a yellow elephant and a green elephant ", "segment": [{"bbox": [0.44425, 0.13852083333333332, 0.9831093750000001, 0.8524791666666667], "label": "a yellow elephant"}, {"bbox": [0.738546875, 0.31612500000000004, 1.0, 0.8926250000000001], "label": "a white elephant"}, {"bbox": [0.08503125, 0.3673541666666667, 0.404765625, 0.8594166666666666], "label": "a yellow elephant"}, {"bbox": [0.33690625, 0.10102083333333334, 0.5857812499999999, 0.3177291666666667], "label": "a green elephant"}], "image_id": "451952"}, "351": {"caption": "a photo of a white cup and a brown hot dog and a green sandwich and a green dining table ", "segment": [{"bbox": [0.085140625, 0.228796875, 0.44765625, 0.679921875], "label": "a white cup"}, {"bbox": [0.28103125, 0.5880468750000001, 0.903984375, 0.8737656250000001], "label": "a brown hot dog"}, {"bbox": [0.2706875, 0.588578125, 0.8993281249999999, 0.8771718749999999], "label": "a green sandwich"}, {"bbox": [0.005187499999999999, 0.005187499999999999, 1.0, 0.58290625], "label": "a green dining table"}], "image_id": "188084"}, "352": {"caption": "a photo of a blue dining table and a brown cup and a red bowl and a blue cup and a yellow bowl and a white bowl ", "segment": [{"bbox": [0.0, 0.008208333333333333, 1.0, 1.0], "label": "a blue dining table"}, {"bbox": [0.501140625, 0.0, 0.9555468749999999, 0.38554166666666667], "label": "a brown cup"}, {"bbox": [0.16975, 0.22393749999999998, 0.34587500000000004, 0.4105833333333333], "label": "a red bowl"}, {"bbox": [0.7488125, 0.16672916666666668, 0.9000937499999999, 0.3379791666666667], "label": "a blue cup"}, {"bbox": [0.75065625, 0.16558333333333333, 0.8924531250000001, 0.3346041666666667], "label": "a yellow bowl"}, {"bbox": [0.3479375, 0.0025208333333333333, 0.5095625, 0.13933333333333334], "label": "a white bowl"}], "image_id": "41923"}, "353": {"caption": "a photo of a white cow and a black cow and a green cow and a blue cow and a yellow cow ", "segment": [{"bbox": [0.21973437499999998, 0.165015625, 1.0, 0.8914843749999999], "label": "a white cow"}, {"bbox": [0.004296875, 0.756796875, 1.0, 0.9864062499999999], "label": "a black cow"}, {"bbox": [0.0, 0.450015625, 0.41296875, 0.7886875], "label": "a green cow"}, {"bbox": [0.0021562499999999997, 0.195046875, 0.392234375, 0.550640625], "label": "a blue cow"}, {"bbox": [0.770875, 0.36129687499999996, 1.0, 0.5711562499999999], "label": "a yellow cow"}], "image_id": "483893"}, "354": {"caption": "a photo of a white umbrella and a blue umbrella and a blue chair and a black chair and a white umbrella and a red chair ", "segment": [{"bbox": [0.0, 0.35104166666666664, 0.395359375, 0.6860416666666667], "label": "a white umbrella"}, {"bbox": [0.638765625, 0.31235416666666665, 1.0, 0.5325833333333333], "label": "a blue umbrella"}, {"bbox": [0.21428124999999998, 0.8285625, 0.6292187499999999, 0.9844166666666666], "label": "a blue chair"}, {"bbox": [0.071203125, 0.6920833333333333, 0.24298437499999997, 0.9993541666666667], "label": "a black chair"}, {"bbox": [0.3715625, 0.40591666666666665, 0.569515625, 0.5562708333333333], "label": "a white umbrella"}, {"bbox": [0.482203125, 0.5641458333333333, 0.649859375, 0.7133333333333334], "label": "a red chair"}], "image_id": "207844"}, "355": {"caption": "a photo of a blue teddy bear and a green potted plant and a brown dining table and a red vase ", "segment": [{"bbox": [0.2622916666666667, 0.1213125, 0.7683541666666667, 0.529015625], "label": "a blue teddy bear"}, {"bbox": [0.5662916666666666, 0.053937500000000006, 0.901875, 0.660671875], "label": "a green potted plant"}, {"bbox": [0.0, 0.0641875, 0.9669583333333333, 0.989859375], "label": "a brown dining table"}, {"bbox": [0.5720208333333333, 0.503984375, 0.7599791666666665, 0.66809375], "label": "a red vase"}], "image_id": "508115"}, "356": {"caption": "a photo of a black cat and a white cat and a black hair drier and a black sink and a white sink ", "segment": [{"bbox": [0.154703125, 0.37272916666666667, 1.0, 0.8643541666666666], "label": "a black cat"}, {"bbox": [0.17528125, 0.13033333333333333, 0.790453125, 0.40897916666666667], "label": "a white cat"}, {"bbox": [0.0016875000000000002, 0.6359583333333333, 0.57303125, 0.9887708333333334], "label": "a black hair drier"}, {"bbox": [0.0, 0.1705, 0.183796875, 0.3952916666666667], "label": "a black sink"}, {"bbox": [0.857359375, 0.20418750000000002, 1.0, 0.34875], "label": "a white sink"}], "image_id": "177262"}, "357": {"caption": "a photo of a red dog and a brown dog and a yellow couch ", "segment": [{"bbox": [0.0, 0.06236928104575164, 0.8032516339869281, 0.8534477124183005], "label": "a red dog"}, {"bbox": [0.4404575163398693, 0.39101307189542484, 1.0, 0.9662908496732027], "label": "a brown dog"}, {"bbox": [0.0021568627450980395, 0.005392156862745098, 1.0, 0.9902941176470588], "label": "a yellow couch"}], "image_id": "186589"}, "358": {"caption": "a photo of a blue sheep and a green sheep and a white sheep and a blue sheep and a white sheep and a green sheep ", "segment": [{"bbox": [0.13596875, 0.6712412177985949, 0.495421875, 0.8541451990632319], "label": "a blue sheep"}, {"bbox": [0.1843125, 0.610632318501171, 0.490421875, 0.7933489461358314], "label": "a green sheep"}, {"bbox": [0.13803125, 0.7600468384074942, 0.399640625, 0.949648711943794], "label": "a white sheep"}, {"bbox": [0.2131875, 0.5360889929742388, 0.502859375, 0.6930210772833724], "label": "a blue sheep"}, {"bbox": [0.0014375, 0.7252224824355973, 0.18260937500000002, 0.9321077283372365], "label": "a white sheep"}, {"bbox": [0.34796875, 0.7894379391100702, 0.47710937500000006, 1.0], "label": "a green sheep"}], "image_id": "263428"}, "359": {"caption": "a photo of a black donut and a green donut and a black donut and a blue donut and a brown donut and a black donut ", "segment": [{"bbox": [0.06455882352941177, 0.5792320261437909, 0.2639705882352941, 0.7425], "label": "a black donut"}, {"bbox": [0.6549019607843137, 0.8347712418300653, 0.8472058823529411, 1.0], "label": "a green donut"}, {"bbox": [0.37612745098039213, 0.014640522875816995, 0.6351307189542483, 0.17004901960784313], "label": "a black donut"}, {"bbox": [0.19058823529411764, 0.8344444444444444, 0.40089869281045754, 0.9997549019607843], "label": "a blue donut"}, {"bbox": [0.0022549019607843133, 0.8471895424836602, 0.1662908496732026, 0.9865196078431373], "label": "a brown donut"}, {"bbox": [0.40326797385620916, 0.8448039215686274, 0.5976797385620916, 1.0], "label": "a black donut"}], "image_id": "149444"}, "360": {"caption": "a photo of a brown zebra and a brown zebra and a black zebra and a red zebra and a red cow ", "segment": [{"bbox": [0.12565625, 0.09107728337236534, 0.7994531250000001, 0.936463700234192], "label": "a brown zebra"}, {"bbox": [0.3134375, 0.12550351288056208, 0.5283749999999999, 0.367096018735363], "label": "a brown zebra"}, {"bbox": [0.703984375, 0.11967213114754098, 0.874015625, 0.40339578454332553], "label": "a black zebra"}, {"bbox": [0.0015, 0.3996252927400468, 0.1454375, 0.9119906323185011], "label": "a red zebra"}, {"bbox": [0.6039218749999999, 0.34714285714285714, 0.8752656249999999, 0.7654098360655738], "label": "a red cow"}], "image_id": "80328"}, "361": {"caption": "a photo of a red tv and a yellow refrigerator and a green cat ", "segment": [{"bbox": [0.29515406162464985, 0.0051600000000000005, 0.8160224089635855, 0.28202000000000005], "label": "a red tv"}, {"bbox": [0.009439775910364146, 0.0022400000000000002, 0.2549299719887955, 0.59102], "label": "a yellow refrigerator"}, {"bbox": [0.33103641456582633, 0.61298, 0.5711484593837535, 0.98702], "label": "a green cat"}], "image_id": "240940"}, "362": {"caption": "a photo of a green bowl and a white banana and a white orange and a brown orange ", "segment": [{"bbox": [0.022796875, 0.3608333333333333, 0.39015625000000004, 0.6830625], "label": "a green bowl"}, {"bbox": [0.035390624999999995, 0.3640416666666667, 0.39775, 0.6292083333333333], "label": "a white banana"}, {"bbox": [0.6782812500000001, 0.5844166666666666, 0.803859375, 0.7449583333333333], "label": "a white orange"}, {"bbox": [0.591171875, 0.4413958333333333, 1.0, 0.936625], "label": "a brown orange"}], "image_id": "118065"}, "363": {"caption": "a photo of a yellow car and a black banana and a blue banana and a red car and a yellow banana and a black car ", "segment": [{"bbox": [0.51009375, 0.5606004618937644, 1.0, 0.8716628175519631], "label": "a yellow car"}, {"bbox": [0.63446875, 0.2166512702078522, 0.8859375, 0.4827020785219399], "label": "a black banana"}, {"bbox": [0.6390781249999999, 0.027852193995381063, 0.86378125, 0.24836027713625866], "label": "a blue banana"}, {"bbox": [0.470328125, 0.5386143187066974, 0.652359375, 0.7709699769053118], "label": "a red car"}, {"bbox": [0.627375, 0.4448960739030023, 0.76315625, 0.6937644341801386], "label": "a yellow banana"}, {"bbox": [0.314109375, 0.540323325635104, 0.44182812499999996, 0.697528868360277], "label": "a black car"}], "image_id": "152360"}, "364": {"caption": "a photo of a yellow donut and a green donut and a blue donut and a black donut and a black donut and a white donut ", "segment": [{"bbox": [0.430640625, 0.6859908883826878, 0.624421875, 0.9393394077448747], "label": "a yellow donut"}, {"bbox": [0.051437500000000004, 0.5033485193621868, 0.2511875, 0.7318678815489749], "label": "a green donut"}, {"bbox": [0.22204687500000003, 0.4471981776765376, 0.38453125000000005, 0.6438496583143507], "label": "a blue donut"}, {"bbox": [0.44242187499999996, 0.3961047835990888, 0.59709375, 0.5673120728929385], "label": "a black donut"}, {"bbox": [0.5953125, 0.31378132118451024, 0.7516875, 0.4614350797266515], "label": "a black donut"}, {"bbox": [0.52553125, 0.19806378132118452, 0.6624062499999999, 0.33883826879271073], "label": "a white donut"}], "image_id": "238866"}, "365": {"caption": "a photo of a black cake and a black bowl and a blue bowl and a green bowl and a white bowl and a green spoon ", "segment": [{"bbox": [0.266, 0.6022453703703704, 0.6620799999999999, 0.9887731481481481], "label": "a black cake"}, {"bbox": [0.49174, 0.0, 0.7406200000000001, 0.200625], "label": "a black bowl"}, {"bbox": [0.51698, 0.20386574074074074, 0.7415, 0.4000694444444444], "label": "a blue bowl"}, {"bbox": [0.26412, 0.20493055555555556, 0.49244, 0.39405092592592594], "label": "a green bowl"}, {"bbox": [0.0, 0.20497685185185185, 0.20146, 0.3940740740740741], "label": "a white bowl"}, {"bbox": [0.00628, 0.4065509259259259, 0.15418, 0.6618518518518519], "label": "a green spoon"}], "image_id": "136021"}, "366": {"caption": "a photo of a brown spoon and a black carrot and a red bowl ", "segment": [{"bbox": [0.031546875, 0.15419811320754717, 0.585890625, 0.9659905660377358], "label": "a brown spoon"}, {"bbox": [0.224921875, 0.5011792452830188, 0.511859375, 0.9674292452830189], "label": "a black carrot"}, {"bbox": [0.050624999999999996, 0.08502358490566037, 0.39303125, 0.5322169811320755], "label": "a red bowl"}], "image_id": "356236"}, "367": {"caption": "a photo of a brown cat and a black chair and a red dining table and a black potted plant and a white spoon and a white bowl ", "segment": [{"bbox": [0.34468, 0.0, 0.64162, 0.5730421686746988], "label": "a brown cat"}, {"bbox": [0.22275999999999999, 0.036566265060240966, 0.68828, 0.5247289156626506], "label": "a black chair"}, {"bbox": [0.0, 0.5224698795180723, 0.99834, 0.9885240963855422], "label": "a red dining table"}, {"bbox": [0.30451999999999996, 0.0, 1.0, 0.525933734939759], "label": "a black potted plant"}, {"bbox": [0.6240399999999999, 0.309066265060241, 0.91416, 0.7816867469879517], "label": "a white spoon"}, {"bbox": [0.22018000000000001, 0.38090361445783133, 0.7800199999999999, 0.9721084337349398], "label": "a white bowl"}], "image_id": "363431"}, "368": {"caption": "a photo of a brown bear and a brown bear and a black bear ", "segment": [{"bbox": [0.249921875, 0.5783437499999999, 0.68134375, 1.0], "label": "a brown bear"}, {"bbox": [0.029218749999999998, 0.665171875, 0.38201562499999997, 0.9842656249999999], "label": "a brown bear"}, {"bbox": [0.52478125, 0.575453125, 1.0, 0.985359375], "label": "a black bear"}], "image_id": "112573"}, "369": {"caption": "a photo of a black elephant and a green elephant and a yellow elephant and a red elephant and a brown elephant and a black elephant ", "segment": [{"bbox": [0.44510937500000003, 0.0033713355048859933, 1.0, 0.989869706840391], "label": "a black elephant"}, {"bbox": [0.30975, 0.0313843648208469, 0.718453125, 0.8385667752442997], "label": "a green elephant"}, {"bbox": [0.203109375, 0.0033713355048859933, 0.834046875, 0.7195928338762215], "label": "a yellow elephant"}, {"bbox": [0.16498437500000002, 0.0728501628664495, 0.38621875, 0.6851465798045603], "label": "a red elephant"}, {"bbox": [0.14846874999999998, 0.06742671009771986, 0.33996875, 0.6085016286644951], "label": "a brown elephant"}, {"bbox": [0.13140625, 0.08653094462540717, 0.275875, 0.5435342019543974], "label": "a black elephant"}], "image_id": "79926"}, "370": {"caption": "a photo of a white teddy bear and a brown teddy bear and a green teddy bear and a green teddy bear and a green teddy bear and a blue teddy bear ", "segment": [{"bbox": [0.571546875, 0.46517647058823525, 0.8162812500000001, 0.8719058823529412], "label": "a white teddy bear"}, {"bbox": [0.0850625, 0.5011294117647058, 0.265625, 0.8943764705882353], "label": "a brown teddy bear"}, {"bbox": [0.826125, 0.528235294117647, 0.996046875, 0.8644941176470587], "label": "a green teddy bear"}, {"bbox": [0.402875, 0.5920235294117647, 0.5949375, 0.8831529411764707], "label": "a green teddy bear"}, {"bbox": [0.47328125, 0.3543294117647059, 0.631453125, 0.6968705882352941], "label": "a green teddy bear"}, {"bbox": [0.774734375, 0.36374117647058823, 0.90934375, 0.661035294117647], "label": "a blue teddy bear"}], "image_id": "499631"}, "371": {"caption": "a photo of a brown bicycle and a white motorcycle and a blue motorcycle ", "segment": [{"bbox": [0.13380555555555557, 0.3311875, 1.0, 0.98925], "label": "a brown bicycle"}, {"bbox": [0.0, 0.31460937499999997, 0.24369444444444446, 0.9977499999999999], "label": "a white motorcycle"}, {"bbox": [0.5030277777777777, 0.181546875, 1.0, 0.7620312499999999], "label": "a blue motorcycle"}], "image_id": "337011"}, "372": {"caption": "a photo of a red broccoli and a blue broccoli and a brown broccoli and a green truck and a blue broccoli and a black broccoli ", "segment": [{"bbox": [0.416390625, 0.45518691588785043, 0.569390625, 0.6674532710280373], "label": "a red broccoli"}, {"bbox": [0.37275, 0.21567757009345795, 0.781515625, 0.456892523364486], "label": "a blue broccoli"}, {"bbox": [0.714171875, 0.2008411214953271, 0.882625, 0.45469626168224303], "label": "a brown broccoli"}, {"bbox": [0.09153125, 0.19843457943925236, 0.33718750000000003, 0.32570093457943927], "label": "a green truck"}, {"bbox": [0.286578125, 0.20623831775700935, 0.423796875, 0.3966822429906542], "label": "a blue broccoli"}, {"bbox": [0.00625, 0.17289719626168223, 0.4390625, 0.6892523364485982], "label": "a black broccoli"}], "image_id": "134231"}, "373": {"caption": "a photo of a red banana and a green laptop and a white cake ", "segment": [{"bbox": [0.336453125, 0.6991041666666666, 0.60740625, 0.8958125], "label": "a red banana"}, {"bbox": [0.259953125, 0.18522916666666667, 0.70609375, 0.6887500000000001], "label": "a green laptop"}, {"bbox": [0.400921875, 0.6480833333333333, 0.531265625, 0.7929166666666666], "label": "a white cake"}], "image_id": "59598"}, "374": {"caption": "a photo of a black dining table and a brown cup and a blue cup and a yellow knife and a yellow fork and a yellow bottle ", "segment": [{"bbox": [0.022565359477124184, 0.03781045751633987, 0.9593627450980392, 0.9836274509803922], "label": "a black dining table"}, {"bbox": [0.30044117647058827, 0.11570261437908497, 0.6345261437908497, 0.4901307189542484], "label": "a brown cup"}, {"bbox": [0.040457516339869284, 0.2584313725490196, 0.2741503267973856, 0.7033660130718955], "label": "a blue cup"}, {"bbox": [0.27578431372549017, 0.46849673202614384, 0.878921568627451, 0.6119934640522876], "label": "a yellow knife"}, {"bbox": [0.38063725490196076, 0.5371568627450981, 0.9279248366013072, 0.6655392156862745], "label": "a yellow fork"}, {"bbox": [0.5916666666666667, 0.044444444444444446, 0.7276470588235295, 0.41699346405228754], "label": "a yellow bottle"}], "image_id": "214388"}, "375": {"caption": "a photo of a white apple and a black orange and a yellow book and a brown cell phone and a brown book ", "segment": [{"bbox": [0.6174062499999999, 0.18716666666666668, 0.822453125, 0.5368125], "label": "a white apple"}, {"bbox": [0.436453125, 0.2039375, 0.7286875, 0.5376875], "label": "a black orange"}, {"bbox": [0.0, 0.17266666666666666, 0.367421875, 0.48052083333333334], "label": "a yellow book"}, {"bbox": [0.17109375, 0.7739583333333333, 0.64296875, 0.9635416666666666], "label": "a brown cell phone"}, {"bbox": [0.0, 0.46229166666666666, 0.287421875, 0.5898541666666667], "label": "a brown book"}], "image_id": "286524"}, "376": {"caption": "a photo of a black pizza and a yellow pizza and a green pizza and a black dining table ", "segment": [{"bbox": [0.21785937500000002, 0.06292428198433421, 0.45992187500000004, 0.5101044386422977], "label": "a black pizza"}, {"bbox": [0.4689375, 0.10321148825065274, 0.819140625, 0.4381984334203656], "label": "a yellow pizza"}, {"bbox": [0.37117187500000004, 0.05843342036553525, 0.6710625, 0.46516971279373365], "label": "a green pizza"}, {"bbox": [0.00134375, 0.004490861618798955, 1.0, 0.9887728459530027], "label": "a black dining table"}], "image_id": "167647"}, "377": {"caption": "a photo of a green tv and a white couch and a black couch and a blue couch and a red chair ", "segment": [{"bbox": [0.01390625, 0.40225, 0.14284375, 0.8134722222222223], "label": "a green tv"}, {"bbox": [0.266703125, 0.39116666666666666, 0.572203125, 0.6778055555555556], "label": "a white couch"}, {"bbox": [0.60946875, 0.38811111111111113, 1.0, 0.8237777777777778], "label": "a black couch"}, {"bbox": [0.41643749999999996, 0.6652222222222222, 0.8401250000000001, 0.9849722222222221], "label": "a blue couch"}, {"bbox": [0.416390625, 0.66675, 0.8459375000000001, 0.9810277777777778], "label": "a red chair"}], "image_id": "405068"}, "378": {"caption": "a photo of a red dining table and a brown pizza and a brown chair ", "segment": [{"bbox": [0.0, 0.09315352697095436, 1.0, 1.0], "label": "a red dining table"}, {"bbox": [0.26740624999999996, 0.36817427385892115, 0.6177343750000001, 0.6468257261410788], "label": "a brown pizza"}, {"bbox": [0.6655, 4.149377593360996e-05, 0.8811093750000001, 0.2383817427385892], "label": "a brown chair"}], "image_id": "294475"}, "379": {"caption": "a photo of a brown orange and a white banana and a yellow train and a green banana and a red banana and a blue banana ", "segment": [{"bbox": [0.4134375, 0.6286182669789228, 0.8756562500000001, 0.9971662763466043], "label": "a brown orange"}, {"bbox": [0.0026718749999999998, 0.4700702576112412, 0.31779687500000003, 0.9202341920374707], "label": "a white banana"}, {"bbox": [0.379328125, 0.0314519906323185, 0.692671875, 0.41124121779859485], "label": "a yellow train"}, {"bbox": [0.22789062499999999, 0.4089929742388759, 0.497765625, 0.8224824355971897], "label": "a green banana"}, {"bbox": [0.28209375, 0.778735362997658, 0.5403125, 0.98903981264637], "label": "a red banana"}, {"bbox": [0.019484375, 0.6224824355971897, 0.15142187499999998, 0.9168618266978923], "label": "a blue banana"}], "image_id": "340529"}, "380": {"caption": "a photo of a black dining table and a green spoon and a yellow bowl and a yellow bowl and a white bowl and a blue bowl ", "segment": [{"bbox": [0.0, 0.011241830065359478, 0.9977450980392157, 0.9865196078431373], "label": "a black dining table"}, {"bbox": [0.43218954248366015, 0.6770588235294118, 0.8185947712418301, 0.9266013071895426], "label": "a green spoon"}, {"bbox": [0.14805555555555555, 0.5298692810457516, 0.5532516339869281, 0.9376633986928103], "label": "a yellow bowl"}, {"bbox": [0.5072549019607843, 0.3863888888888889, 0.9005718954248365, 0.7682843137254902], "label": "a yellow bowl"}, {"bbox": [0.2213562091503268, 0.2070261437908497, 0.5468790849673203, 0.5377614379084967], "label": "a white bowl"}, {"bbox": [0.5350653594771242, 0.051519607843137256, 0.8961111111111111, 0.40475490196078434], "label": "a blue bowl"}], "image_id": "30954"}, "381": {"caption": "a photo of a white elephant and a red elephant and a green elephant ", "segment": [{"bbox": [0.568859375, 0.2241057934508816, 0.942984375, 0.712896725440806], "label": "a white elephant"}, {"bbox": [0.35165625, 0.29856423173803526, 0.623125, 0.8201007556675064], "label": "a red elephant"}, {"bbox": [0.060203125, 0.2838539042821159, 0.33606250000000004, 0.8053148614609573], "label": "a green elephant"}], "image_id": "366295"}, "382": {"caption": "a photo of a red dining table and a yellow dining table and a blue chair and a yellow broccoli and a brown bottle and a red bowl ", "segment": [{"bbox": [0.03125, 0.10588235294117647, 0.9859375, 0.9811764705882353], "label": "a red dining table"}, {"bbox": [0.035812500000000004, 0.3501882352941177, 0.9640156249999998, 0.9906352941176471], "label": "a yellow dining table"}, {"bbox": [0.057374999999999995, 0.18736470588235293, 0.23521874999999998, 0.7359529411764705], "label": "a blue chair"}, {"bbox": [0.373875, 0.13656470588235295, 0.6641875, 0.4091764705882353], "label": "a yellow broccoli"}, {"bbox": [0.6954374999999999, 0.3280705882352941, 0.8699999999999999, 0.5772235294117647], "label": "a brown bottle"}, {"bbox": [0.44978125, 0.29451764705882355, 0.6115, 0.4347529411764706], "label": "a red bowl"}], "image_id": "338581"}, "383": {"caption": "a photo of a black boat and a blue boat and a yellow boat and a white boat and a black boat ", "segment": [{"bbox": [0.16834375, 0.36464583333333334, 0.9841093750000001, 0.5983125], "label": "a black boat"}, {"bbox": [0.8391093749999999, 0.25833333333333336, 1.0, 0.3863333333333333], "label": "a blue boat"}, {"bbox": [0.0033750000000000004, 0.37304166666666666, 0.16854687499999998, 0.5528125], "label": "a yellow boat"}, {"bbox": [0.001859375, 0.22468749999999998, 0.18703125, 0.3777708333333333], "label": "a white boat"}, {"bbox": [0.06771875000000001, 0.20945833333333336, 0.393078125, 0.457], "label": "a black boat"}], "image_id": "285096"}, "384": {"caption": "a photo of a white apple and a brown apple and a black orange and a red orange and a blue orange and a yellow orange ", "segment": [{"bbox": [0.0, 0.31379687500000003, 0.5243125, 0.7044218750000001], "label": "a white apple"}, {"bbox": [0.5208333333333334, 0.0012968749999999999, 1.0, 0.319015625], "label": "a brown apple"}, {"bbox": [0.0708125, 0.6774375, 0.49133333333333334, 0.99125], "label": "a black orange"}, {"bbox": [0.5007916666666666, 0.73028125, 0.9640000000000001, 0.9884999999999999], "label": "a red orange"}, {"bbox": [0.4674166666666667, 0.49437499999999995, 0.8689166666666668, 0.764046875], "label": "a blue orange"}, {"bbox": [0.764, 0.28009375, 1.0, 0.55009375], "label": "a yellow orange"}], "image_id": "128598"}, "385": {"caption": "a photo of a blue dining table and a green knife and a white knife and a yellow apple ", "segment": [{"bbox": [0.0035280373831775703, 0.8258749999999999, 0.992196261682243, 0.9835312499999999], "label": "a blue dining table"}, {"bbox": [0.19154205607476638, 0.161796875, 0.5981308411214953, 0.6831406250000001], "label": "a green knife"}, {"bbox": [0.34911214953271025, 0.1830625, 0.6993224299065419, 0.67009375], "label": "a white knife"}, {"bbox": [0.4046261682242991, 0.661171875, 0.9147897196261682, 0.9670624999999999], "label": "a yellow apple"}], "image_id": "573796"}, "386": {"caption": "a photo of a white chair and a blue chair and a blue potted plant and a yellow vase and a brown dining table ", "segment": [{"bbox": [0.7610833333333333, 0.602890625, 1.0, 0.8625468749999999], "label": "a white chair"}, {"bbox": [0.002875, 0.44085937499999994, 0.3670208333333333, 0.806453125], "label": "a blue chair"}, {"bbox": [0.0, 0.324796875, 0.9991041666666667, 0.9783593749999999], "label": "a blue potted plant"}, {"bbox": [0.3625416666666667, 0.694375, 0.5902708333333334, 0.9887656249999999], "label": "a yellow vase"}, {"bbox": [0.004166666666666667, 0.70996875, 1.0, 0.98184375], "label": "a brown dining table"}], "image_id": "488785"}, "387": {"caption": "a photo of a yellow banana and a blue orange and a black orange ", "segment": [{"bbox": [0.250375, 0.06967213114754098, 0.6566875000000001, 0.5438173302107728], "label": "a yellow banana"}, {"bbox": [0.0, 0.39058548009367683, 0.3861875, 0.9858782201405153], "label": "a blue orange"}, {"bbox": [0.334453125, 0.6044028103044496, 0.6030625000000001, 0.9810304449648711], "label": "a black orange"}], "image_id": "254143"}, "388": {"caption": "a photo of a black airplane and a blue airplane and a yellow airplane and a blue airplane ", "segment": [{"bbox": [0.23689062500000002, 0.48266978922716625, 0.7665625, 0.8921311475409835], "label": "a black airplane"}, {"bbox": [0.352140625, 0.44864168618266975, 0.8555781249999999, 0.7153864168618268], "label": "a blue airplane"}, {"bbox": [0.59021875, 0.4377751756440281, 0.95140625, 0.8244496487119438], "label": "a yellow airplane"}, {"bbox": [0.8006249999999999, 0.4314519906323185, 1.0, 0.7842622950819672], "label": "a blue airplane"}], "image_id": "131386"}, "389": {"caption": "a photo of a red bus and a black bus and a black bus and a brown bus ", "segment": [{"bbox": [0.6255625, 0.2914791666666667, 0.978703125, 0.7443958333333334], "label": "a red bus"}, {"bbox": [0.36317187500000003, 0.1903125, 0.65034375, 0.7443749999999999], "label": "a black bus"}, {"bbox": [0.168515625, 0.12591666666666665, 0.36296875, 0.2543125], "label": "a black bus"}, {"bbox": [0.163359375, 0.23143750000000002, 0.367578125, 0.7462916666666667], "label": "a brown bus"}], "image_id": "334743"}, "390": {"caption": "a photo of a green truck and a white truck and a white truck and a blue suitcase ", "segment": [{"bbox": [0.1453125, 0.22962616822429907, 0.439234375, 0.6370327102803738], "label": "a green truck"}, {"bbox": [0.43203125, 0.35273364485981307, 0.8822812500000001, 0.7933177570093457], "label": "a white truck"}, {"bbox": [0.48209375000000004, 0.17932242990654207, 1.0, 0.4272663551401869], "label": "a white truck"}, {"bbox": [0.015625, 0.3014018691588785, 0.8375, 0.9322429906542056], "label": "a blue suitcase"}], "image_id": "390087"}, "391": {"caption": "a photo of a green teddy bear and a yellow teddy bear and a red teddy bear ", "segment": [{"bbox": [0.25392187499999996, 0.013458333333333333, 0.8071718749999999, 0.9596458333333333], "label": "a green teddy bear"}, {"bbox": [0.0, 0.6719166666666666, 0.431453125, 0.9887708333333334], "label": "a yellow teddy bear"}, {"bbox": [0.0054218750000000005, 0.0003541666666666667, 0.5725156250000001, 0.6334375], "label": "a red teddy bear"}], "image_id": "68411"}, "392": {"caption": "a photo of a yellow banana and a white banana and a green banana and a blue bowl and a brown dining table ", "segment": [{"bbox": [0.12125, 0.46067010309278356, 0.934578125, 0.7910051546391752], "label": "a yellow banana"}, {"bbox": [0.104125, 0.34824742268041237, 0.292421875, 0.5152835051546392], "label": "a white banana"}, {"bbox": [0.72703125, 0.3420876288659794, 0.901203125, 0.4927577319587629], "label": "a green banana"}, {"bbox": [0.001359375, 0.43077319587628865, 1.0, 0.9363917525773195], "label": "a blue bowl"}, {"bbox": [0.0, 0.007783505154639175, 1.0, 0.9818298969072164], "label": "a brown dining table"}], "image_id": "139260"}, "393": {"caption": "a photo of a blue toothbrush and a yellow toothbrush and a black toothbrush ", "segment": [{"bbox": [0.0, 0.1813958333333333, 0.26190625, 0.9070208333333334], "label": "a blue toothbrush"}, {"bbox": [0.002078125, 0.44429166666666664, 0.150125, 0.923875], "label": "a yellow toothbrush"}, {"bbox": [0.12467187500000002, 0.15585416666666668, 0.38765625000000004, 0.8857083333333333], "label": "a black toothbrush"}], "image_id": "244878"}, "394": {"caption": "a photo of a yellow zebra and a brown zebra and a yellow zebra ", "segment": [{"bbox": [0.6415599999999999, 0.10494661921708184, 0.84616, 0.8779715302491103], "label": "a yellow zebra"}, {"bbox": [0.42748, 0.11879003558718862, 0.63744, 0.9219217081850534], "label": "a brown zebra"}, {"bbox": [0.04568, 0.06263345195729537, 0.477, 0.9046263345195729], "label": "a yellow zebra"}], "image_id": "300147"}, "395": {"caption": "a photo of a black horse and a yellow handbag and a white handbag ", "segment": [{"bbox": [0.6227146171693735, 0.11828125, 0.9963341067285382, 0.417203125], "label": "a black horse"}, {"bbox": [0.39709976798143853, 0.57265625, 0.597308584686775, 0.790640625], "label": "a yellow handbag"}, {"bbox": [0.6280742459396752, 0.8188281249999999, 0.8352436194895592, 0.975484375], "label": "a white handbag"}], "image_id": "73039"}, "396": {"caption": "a photo of a red kite and a brown kite and a brown kite and a yellow kite ", "segment": [{"bbox": [0.6697196261682242, 0.4173125, 0.9288551401869157, 0.7196093749999999], "label": "a red kite"}, {"bbox": [0.3023130841121495, 0.360953125, 0.44862149532710277, 0.504671875], "label": "a brown kite"}, {"bbox": [0.2372663551401869, 0.338828125, 0.5617056074766356, 0.7760468749999999], "label": "a brown kite"}, {"bbox": [0.5415186915887851, 0.276328125, 0.7714018691588785, 0.420515625], "label": "a yellow kite"}], "image_id": "429834"}, "397": {"caption": "a photo of a black dining table and a yellow dining table and a brown hot dog and a red hot dog and a yellow sandwich and a blue sandwich ", "segment": [{"bbox": [0.0, 0.5035208333333333, 0.54353125, 1.0], "label": "a black dining table"}, {"bbox": [0.0016875000000000002, 0.004125, 1.0, 0.9883958333333334], "label": "a yellow dining table"}, {"bbox": [0.20646874999999998, 0.26368749999999996, 0.524125, 0.8072083333333333], "label": "a brown hot dog"}, {"bbox": [0.525875, 0.5670625, 0.788828125, 0.8117708333333333], "label": "a red hot dog"}, {"bbox": [0.2225, 0.2651875, 0.519765625, 0.8033125000000001], "label": "a yellow sandwich"}, {"bbox": [0.52584375, 0.36141666666666666, 0.8005625000000001, 0.8265833333333333], "label": "a blue sandwich"}], "image_id": "327114"}, "398": {"caption": "a photo of a white chair and a white chair and a white chair and a red chair and a blue dining table ", "segment": [{"bbox": [0.5198125, 0.5613333333333334, 0.7714375, 1.0], "label": "a white chair"}, {"bbox": [0.61875, 0.5000833333333333, 0.8083124999999999, 0.8970416666666666], "label": "a white chair"}, {"bbox": [0.29903124999999997, 0.5063125, 0.46853125, 0.9180208333333333], "label": "a white chair"}, {"bbox": [0.12298437499999999, 0.5751666666666666, 0.382875, 1.0], "label": "a red chair"}, {"bbox": [0.24325000000000002, 0.616, 0.6030468750000001, 0.7849166666666666], "label": "a blue dining table"}], "image_id": "307323"}, "399": {"caption": "a photo of a red cat and a brown couch and a yellow refrigerator ", "segment": [{"bbox": [0.24298437499999997, 0.0750625, 0.793734375, 0.9346666666666666], "label": "a red cat"}, {"bbox": [0.0016093750000000001, 0.45377083333333335, 0.9709687499999999, 0.9871041666666667], "label": "a brown couch"}, {"bbox": [0.72115625, 0.2029375, 0.8999218750000001, 0.8216041666666667], "label": "a yellow refrigerator"}], "image_id": "398758"}, "400": {"caption": "a photo of a black cow and a white cow and a white cow and a white cow ", "segment": [{"bbox": [0.4802097902097902, 0.16007812500000002, 1.0, 0.5935625], "label": "a black cow"}, {"bbox": [0.0, 0.25328125, 0.5137762237762238, 0.909], "label": "a white cow"}, {"bbox": [0.16974358974358972, 0.1420625, 0.6017482517482518, 0.31148437500000004], "label": "a white cow"}, {"bbox": [0.2112121212121212, 0.296625, 0.7811188811188812, 0.6651718750000001], "label": "a white cow"}], "image_id": "573928"}, "401": {"caption": "a photo of a white potted plant and a brown potted plant and a black oven and a red oven ", "segment": [{"bbox": [0.49114583333333334, 0.335078125, 0.6374583333333333, 0.4655625], "label": "a white potted plant"}, {"bbox": [0.12566666666666668, 0.27796875, 0.32585416666666667, 0.482984375], "label": "a brown potted plant"}, {"bbox": [0.8059999999999999, 0.364046875, 1.0, 0.606734375], "label": "a black oven"}, {"bbox": [0.015270833333333334, 0.5275000000000001, 0.2871458333333334, 0.786546875], "label": "a red oven"}], "image_id": "22621"}, "402": {"caption": "a photo of a red book and a blue dog and a white book ", "segment": [{"bbox": [0.49214062500000005, 0.1528125, 1.0, 0.46066666666666667], "label": "a red book"}, {"bbox": [0.16753125, 0.0935, 0.99740625, 0.9870208333333333], "label": "a blue dog"}, {"bbox": [0.425, 0.0, 0.9984375, 0.15208333333333332], "label": "a white book"}], "image_id": "347650"}, "403": {"caption": "a photo of a green couch and a yellow couch and a green chair and a red dining table ", "segment": [{"bbox": [0.6730625, 0.5369718309859155, 0.988703125, 0.9450704225352113], "label": "a green couch"}, {"bbox": [0.5138906249999999, 0.5354929577464789, 0.795890625, 0.6774178403755868], "label": "a yellow couch"}, {"bbox": [0.146140625, 0.5001877934272301, 0.30015625, 0.8051173708920188], "label": "a green chair"}, {"bbox": [0.57584375, 0.6113380281690141, 0.8374843750000001, 0.8339906103286384], "label": "a red dining table"}], "image_id": "486087"}, "404": {"caption": "a photo of a red cake and a brown teddy bear and a yellow teddy bear ", "segment": [{"bbox": [0.22229508196721312, 0.28090625, 0.7376346604215457, 0.62471875], "label": "a red cake"}, {"bbox": [0.3127166276346604, 0.274484375, 0.47915690866510535, 0.45909374999999997], "label": "a brown teddy bear"}, {"bbox": [0.47163934426229503, 0.31637499999999996, 0.6437236533957845, 0.45864062499999997], "label": "a yellow teddy bear"}], "image_id": "113945"}, "405": {"caption": "a photo of a black zebra and a brown zebra and a yellow zebra ", "segment": [{"bbox": [0.530171875, 0.44627083333333334, 0.803234375, 0.6926458333333334], "label": "a black zebra"}, {"bbox": [0.21395312500000002, 0.42052083333333334, 0.3824375, 0.6450833333333333], "label": "a brown zebra"}, {"bbox": [0.33203125, 0.4244791666666667, 0.529296875, 0.65625], "label": "a yellow zebra"}], "image_id": "479762"}, "406": {"caption": "a photo of a yellow bird and a yellow bird and a yellow bench ", "segment": [{"bbox": [0.5643281250000001, 0.09023419203747073, 0.8300625, 0.70480093676815], "label": "a yellow bird"}, {"bbox": [0.000609375, 0.14348946135831384, 0.461609375, 0.6611943793911007], "label": "a yellow bird"}, {"bbox": [0.6686875, 0.22, 1.0, 0.8724590163934427], "label": "a yellow bench"}], "image_id": "212342"}, "407": {"caption": "a photo of a black laptop and a brown mouse and a blue tv ", "segment": [{"bbox": [0.01168, 0.14382749326145552, 0.6052799999999999, 0.9258490566037736], "label": "a black laptop"}, {"bbox": [0.75312, 0.6968194070080862, 0.93026, 0.8468733153638814], "label": "a brown mouse"}, {"bbox": [0.5635800000000001, 0.09886792452830188, 0.95542, 0.5415633423180594], "label": "a blue tv"}], "image_id": "232679"}, "408": {"caption": "a photo of a green cat and a black cat and a black bowl and a brown bed ", "segment": [{"bbox": [0.2473125, 0.2988958333333333, 0.85021875, 0.9472083333333333], "label": "a green cat"}, {"bbox": [0.123921875, 0.061375, 0.6582656250000001, 0.8639583333333333], "label": "a black cat"}, {"bbox": [0.05550000000000001, 0.011208333333333332, 0.8979843750000001, 0.9887916666666666], "label": "a black bowl"}, {"bbox": [0.0, 0.0, 1.0, 1.0], "label": "a brown bed"}], "image_id": "292931"}, "409": {"caption": "a photo of a blue motorcycle and a green motorcycle and a white motorcycle ", "segment": [{"bbox": [0.32090625, 0.5855269320843092, 0.47912499999999997, 0.9300468384074941], "label": "a blue motorcycle"}, {"bbox": [0.49176562500000004, 0.5618032786885245, 0.685171875, 0.7460655737704918], "label": "a green motorcycle"}, {"bbox": [0.65971875, 0.5324590163934426, 0.9902656249999999, 0.9851756440281031], "label": "a white motorcycle"}], "image_id": "161202"}, "410": {"caption": "a photo of a brown potted plant and a green potted plant and a white couch and a black chair ", "segment": [{"bbox": [0.24438, 0.45167999999999997, 0.41798, 0.8629333333333334], "label": "a brown potted plant"}, {"bbox": [0.00176, 0.68, 0.20294, 0.9341066666666668], "label": "a green potted plant"}, {"bbox": [0.0, 0.20544, 0.5810599999999999, 0.70608], "label": "a white couch"}, {"bbox": [0.6486000000000001, 0.36050666666666664, 0.99786, 0.9485066666666666], "label": "a black chair"}], "image_id": "267321"}, "411": {"caption": "a photo of a yellow cat and a white cat and a yellow bed ", "segment": [{"bbox": [0.26170312500000004, 0.31573770491803277, 0.8282343749999999, 0.8049648711943794], "label": "a yellow cat"}, {"bbox": [0.190828125, 0.3118266978922717, 0.39314062499999997, 0.5182903981264637], "label": "a white cat"}, {"bbox": [0.005984375, 0.39227166276346603, 1.0, 0.9774707259953161], "label": "a yellow bed"}], "image_id": "54340"}, "412": {"caption": "a photo of a brown dog and a white cat and a black bed ", "segment": [{"bbox": [0.32486000000000004, 0.25405144694533766, 1.0, 0.6123472668810289], "label": "a brown dog"}, {"bbox": [0.17924, 0.16344051446945337, 0.4655, 0.552700964630225], "label": "a white cat"}, {"bbox": [0.0, 0.4087781350482315, 0.9988400000000001, 0.9808681672025722], "label": "a black bed"}], "image_id": "443537"}, "413": {"caption": "a photo of a white dining table and a white sandwich and a red sandwich and a green sandwich and a blue cup and a white sandwich ", "segment": [{"bbox": [0.0016875000000000002, 0.0, 0.9994375, 0.9954999999999999], "label": "a white dining table"}, {"bbox": [0.2166875, 0.40850000000000003, 0.73596875, 0.7969375], "label": "a white sandwich"}, {"bbox": [0.47985937500000003, 0.27537500000000004, 0.73321875, 0.5930625], "label": "a red sandwich"}, {"bbox": [0.605765625, 0.29008333333333336, 0.8258281249999999, 0.47258333333333336], "label": "a green sandwich"}, {"bbox": [0.232359375, 0.018083333333333333, 0.399265625, 0.19649999999999998], "label": "a blue cup"}, {"bbox": [0.48767187500000003, 0.021520833333333333, 0.665921875, 0.17847916666666666], "label": "a white sandwich"}], "image_id": "274109"}, "414": {"caption": "a photo of a green tv and a black laptop and a green mouse and a brown keyboard ", "segment": [{"bbox": [0.50612, 0.10522666666666666, 0.9134200000000001, 0.5719733333333333], "label": "a green tv"}, {"bbox": [0.11966, 0.22021333333333332, 0.5106799999999999, 0.69888], "label": "a black laptop"}, {"bbox": [0.84364, 0.8256533333333334, 0.9803999999999999, 0.9620266666666667], "label": "a green mouse"}, {"bbox": [0.07062, 0.66816, 0.8071799999999999, 0.8632266666666668], "label": "a brown keyboard"}], "image_id": "379310"}, "415": {"caption": "a photo of a green potted plant and a brown couch and a red chair and a brown vase ", "segment": [{"bbox": [0.321390625, 0.42365339578454336, 0.64709375, 0.8172131147540984], "label": "a green potted plant"}, {"bbox": [0.057265625, 0.003583138173302108, 0.94065625, 0.8962763466042154], "label": "a brown couch"}, {"bbox": [0.0, 0.21934426229508197, 0.31278125, 0.9892505854800936], "label": "a red chair"}, {"bbox": [0.493265625, 0.6494379391100703, 0.626703125, 0.8269555035128806], "label": "a brown vase"}], "image_id": "253489"}, "416": {"caption": "a photo of a white giraffe and a blue giraffe and a brown giraffe ", "segment": [{"bbox": [0.325, 0.09785416666666666, 0.50228125, 0.7159375], "label": "a white giraffe"}, {"bbox": [0.165796875, 0.2748958333333333, 0.30876562500000004, 0.5105625], "label": "a blue giraffe"}, {"bbox": [0.22078125, 0.22977083333333334, 0.365734375, 0.49943750000000003], "label": "a brown giraffe"}], "image_id": "333290"}, "417": {"caption": "a photo of a red cow and a brown cow and a white cow and a black cow ", "segment": [{"bbox": [0.329359375, 0.37485416666666665, 0.51890625, 0.5295416666666667], "label": "a red cow"}, {"bbox": [0.5059375, 0.3856041666666667, 0.6470312500000001, 0.5168958333333333], "label": "a brown cow"}, {"bbox": [0.682734375, 0.33616666666666667, 0.8206093749999999, 0.5037083333333334], "label": "a white cow"}, {"bbox": [0.10010937499999999, 0.4216666666666667, 0.263296875, 0.6014375], "label": "a black cow"}], "image_id": "416765"}, "418": {"caption": "a photo of a yellow bottle and a red wine glass and a black cup and a black cup and a red dining table and a green cup ", "segment": [{"bbox": [0.29395784543325526, 0.003234375, 1.0, 0.507546875], "label": "a yellow bottle"}, {"bbox": [0.0, 0.0, 0.5570023419203747, 0.602484375], "label": "a red wine glass"}, {"bbox": [0.0, 0.27321875, 0.28409836065573774, 0.5416562500000001], "label": "a black cup"}, {"bbox": [0.7759718969555035, 0.001921875, 1.0, 0.33464062499999997], "label": "a black cup"}, {"bbox": [0.0, 0.005187499999999999, 0.9927400468384074, 0.9818125], "label": "a red dining table"}, {"bbox": [0.19056206088992975, 0.148125, 0.69903981264637, 0.593078125], "label": "a green cup"}], "image_id": "51594"}, "419": {"caption": "a photo of a brown cat and a red backpack and a white suitcase ", "segment": [{"bbox": [0.46321874999999996, 0.21760445682451254, 0.784109375, 0.6472980501392758], "label": "a brown cat"}, {"bbox": [0.49264062500000005, 0.272033426183844, 0.781828125, 0.5803064066852367], "label": "a red backpack"}, {"bbox": [0.008390625, 0.6517270194986072, 0.3265625, 0.9995821727019499], "label": "a white suitcase"}], "image_id": "285733"}, "420": {"caption": "a photo of a red dining table and a white carrot and a brown spoon and a black sandwich ", "segment": [{"bbox": [0.0, 0.0, 0.9982638888888888, 1.0], "label": "a red dining table"}, {"bbox": [0.3063194444444444, 0.10387500000000001, 0.5339583333333333, 0.477625], "label": "a white carrot"}, {"bbox": [0.25, 0.396875, 0.59375, 0.8625], "label": "a brown spoon"}, {"bbox": [0.5311805555555555, 0.14781249999999999, 0.9368402777777778, 0.8811249999999999], "label": "a black sandwich"}], "image_id": "293044"}, "421": {"caption": "a photo of a brown banana and a blue donut and a yellow donut and a green donut and a red donut ", "segment": [{"bbox": [0.164921875, 0.25393442622950824, 0.45278124999999997, 0.8044964871194379], "label": "a brown banana"}, {"bbox": [0.43843750000000004, 0.5662295081967214, 0.677578125, 0.8285714285714286], "label": "a blue donut"}, {"bbox": [0.73978125, 0.287423887587822, 0.871140625, 0.5102341920374708], "label": "a yellow donut"}, {"bbox": [0.623859375, 0.498711943793911, 0.7867656249999999, 0.7220843091334894], "label": "a green donut"}, {"bbox": [0.566671875, 0.12728337236533957, 0.7538281250000001, 0.4], "label": "a red donut"}], "image_id": "235244"}, "422": {"caption": "a photo of a black pizza and a red pizza and a black pizza ", "segment": [{"bbox": [0.40785937499999997, 0.43370833333333336, 1.0, 0.9887708333333334], "label": "a black pizza"}, {"bbox": [0.38090625, 0.12583333333333332, 0.9690937500000001, 0.6179791666666666], "label": "a red pizza"}, {"bbox": [0.0, 0.051666666666666666, 0.5771875, 0.8055833333333333], "label": "a black pizza"}], "image_id": "152866"}, "423": {"caption": "a photo of a red tv and a yellow bed and a red bed ", "segment": [{"bbox": [0.028828125, 0.012887323943661972, 0.203125, 0.5613380281690141], "label": "a red tv"}, {"bbox": [0.41489062499999996, 0.49539906103286385, 0.70740625, 0.7084037558685445], "label": "a yellow bed"}, {"bbox": [0.616375, 0.5426056338028169, 1.0, 0.9887793427230047], "label": "a red bed"}], "image_id": "22432"}, "424": {"caption": "a photo of a black car and a green motorcycle and a green motorcycle ", "segment": [{"bbox": [0.6357999999999999, 0.55416, 0.99774, 0.92784], "label": "a black car"}, {"bbox": [0.32732, 0.6442933333333334, 0.5404, 0.9432533333333334], "label": "a green motorcycle"}, {"bbox": [0.41454, 0.6802933333333334, 0.63854, 0.9283733333333333], "label": "a green motorcycle"}], "image_id": "274773"}, "425": {"caption": "a photo of a white bowl and a brown bowl and a brown bowl and a yellow bowl and a red banana and a brown dining table ", "segment": [{"bbox": [0.48647916666666663, 0.386265625, 0.9519583333333334, 0.7376093750000001], "label": "a white bowl"}, {"bbox": [0.34012499999999996, 0.034734375, 0.8378125, 0.41150000000000003], "label": "a brown bowl"}, {"bbox": [0.08485416666666666, 0.31696875, 0.5049791666666666, 0.6283125], "label": "a brown bowl"}, {"bbox": [0.12583333333333332, 0.62246875, 0.6202291666666666, 0.9887656249999999], "label": "a yellow bowl"}, {"bbox": [0.3528125, 0.357328125, 0.492625, 0.50228125], "label": "a red banana"}, {"bbox": [0.0, 0.0012968749999999999, 1.0, 0.98828125], "label": "a brown dining table"}], "image_id": "354165"}, "426": {"caption": "a photo of a brown sheep and a blue sheep and a brown sheep and a black sheep and a brown sheep and a white sheep ", "segment": [{"bbox": [0.134890625, 0.4497897196261682, 0.42621875, 0.9025700934579438], "label": "a brown sheep"}, {"bbox": [0.733078125, 0.5103971962616822, 1.0, 0.986892523364486], "label": "a blue sheep"}, {"bbox": [0.5094531250000001, 0.4764018691588785, 0.725859375, 1.0], "label": "a brown sheep"}, {"bbox": [0.44775, 0.553107476635514, 0.5747500000000001, 0.9360747663551402], "label": "a black sheep"}, {"bbox": [0.43131250000000004, 0.37303738317757007, 0.65371875, 0.5797663551401869], "label": "a brown sheep"}, {"bbox": [0.362265625, 0.28686915887850467, 0.542890625, 0.4388785046728972], "label": "a white sheep"}], "image_id": "152281"}, "427": {"caption": "a photo of a yellow sandwich and a red dining table and a brown cup and a green fork ", "segment": [{"bbox": [0.527328125, 0.3651041666666667, 0.76071875, 0.6666875], "label": "a yellow sandwich"}, {"bbox": [0.0016875000000000002, 0.0011250000000000001, 1.0, 0.9898750000000001], "label": "a red dining table"}, {"bbox": [0.579390625, 0.007875, 0.8243281249999999, 0.3479791666666667], "label": "a brown cup"}, {"bbox": [0.015171875000000001, 0.38004166666666667, 0.29753125, 0.9406874999999999], "label": "a green fork"}], "image_id": "467726"}, "428": {"caption": "a photo of a brown microwave and a yellow oven and a black toaster and a green book and a brown book ", "segment": [{"bbox": [0.35234375, 0.14339583333333333, 0.8104062500000001, 0.5729166666666666], "label": "a brown microwave"}, {"bbox": [0.86965625, 0.7865208333333332, 1.0, 0.9865208333333333], "label": "a yellow oven"}, {"bbox": [0.07415625, 0.4157291666666667, 0.461796875, 0.8741666666666668], "label": "a black toaster"}, {"bbox": [0.096796875, 0.11020833333333332, 0.280265625, 0.37114583333333334], "label": "a green book"}, {"bbox": [0.18203125, 0.1166875, 0.31881250000000005, 0.3794375], "label": "a brown book"}], "image_id": "256309"}, "429": {"caption": "a photo of a brown zebra and a green zebra and a blue zebra ", "segment": [{"bbox": [0.13343750000000001, 0.2314519906323185, 0.5637343749999999, 0.8516861826697891], "label": "a brown zebra"}, {"bbox": [0.0840625, 0.2852927400468384, 0.32734375, 0.8272599531615925], "label": "a green zebra"}, {"bbox": [0.47943749999999996, 0.3185948477751756, 0.9064218749999998, 0.877423887587822], "label": "a blue zebra"}], "image_id": "501243"}, "430": {"caption": "a photo of a brown giraffe and a yellow giraffe and a yellow giraffe ", "segment": [{"bbox": [0.30260663507109004, 0.3439375, 1.0, 0.909015625], "label": "a brown giraffe"}, {"bbox": [0.6537440758293839, 0.615125, 1.0, 0.846859375], "label": "a yellow giraffe"}, {"bbox": [0.14035545023696683, 0.0965, 0.6264928909952606, 0.87303125], "label": "a yellow giraffe"}], "image_id": "73981"}, "431": {"caption": "a photo of a blue tv and a black tv and a white laptop and a yellow book and a yellow chair and a brown dining table ", "segment": [{"bbox": [0.5710625, 0.24957943925233644, 0.81753125, 0.5372196261682243], "label": "a blue tv"}, {"bbox": [0.21140625000000002, 0.34710280373831776, 0.48221875000000003, 0.6425700934579439], "label": "a black tv"}, {"bbox": [0.21340625000000002, 0.35504672897196266, 0.575578125, 0.7929205607476636], "label": "a white laptop"}, {"bbox": [0.30876562500000004, 0.7285981308411215, 0.6491718750000001, 0.9200467289719626], "label": "a yellow book"}, {"bbox": [0.50096875, 0.48443925233644863, 0.8432343750000001, 1.0], "label": "a yellow chair"}, {"bbox": [0.0, 0.5182242990654206, 0.844640625, 0.9869859813084112], "label": "a brown dining table"}], "image_id": "277440"}, "432": {"caption": "a photo of a black knife and a brown broccoli and a white broccoli and a black broccoli and a brown broccoli and a green dining table ", "segment": [{"bbox": [0.7560156250000001, 0.3558313817330211, 1.0, 0.8234894613583138], "label": "a black knife"}, {"bbox": [0.3898125, 0.0050585480093676815, 0.6776875, 0.23426229508196722], "label": "a brown broccoli"}, {"bbox": [0.6791875, 0.14831381733021076, 0.9400625, 0.539320843091335], "label": "a white broccoli"}, {"bbox": [0.407890625, 0.22601873536299766, 0.541796875, 0.40025761124121784], "label": "a black broccoli"}, {"bbox": [0.49626562500000004, 0.3366978922716628, 0.9190625000000001, 0.860304449648712], "label": "a brown broccoli"}, {"bbox": [0.7207656250000001, 0.0025995316159250588, 1.0, 1.0], "label": "a green dining table"}], "image_id": "558809"}, "433": {"caption": "a photo of a red bottle and a green sandwich and a red hot dog and a red hot dog and a white hot dog ", "segment": [{"bbox": [0.42725, 0.184953125, 0.6910416666666668, 0.666671875], "label": "a red bottle"}, {"bbox": [0.23497916666666668, 0.602546875, 0.5051875, 0.873421875], "label": "a green sandwich"}, {"bbox": [0.6268333333333334, 0.5663750000000001, 0.8969166666666666, 0.87021875], "label": "a red hot dog"}, {"bbox": [0.8156874999999999, 0.625875, 0.9913749999999999, 0.891765625], "label": "a red hot dog"}, {"bbox": [0.243625, 0.619, 0.4938333333333333, 0.8856718750000001], "label": "a white hot dog"}], "image_id": "547759"}, "434": {"caption": "a photo of a red potted plant and a blue refrigerator and a white microwave and a green vase ", "segment": [{"bbox": [0.06072072072072072, 0.01348, 0.9278978978978979, 0.38876], "label": "a red potted plant"}, {"bbox": [0.10078078078078079, 0.66464, 0.8767267267267267, 0.9890399999999999], "label": "a blue refrigerator"}, {"bbox": [0.0775975975975976, 0.37751999999999997, 0.9413813813813813, 0.6786599999999999], "label": "a white microwave"}, {"bbox": [0.4757657657657658, 0.25372, 0.7185885885885887, 0.37914], "label": "a green vase"}], "image_id": "455188"}, "435": {"caption": "a photo of a blue banana and a black banana and a green backpack and a brown banana and a green bicycle and a black banana ", "segment": [{"bbox": [0.051984375000000006, 0.03911949685534591, 0.43975, 0.4740670859538784], "label": "a blue banana"}, {"bbox": [0.24778125, 0.04995807127882599, 0.541140625, 0.4728301886792453], "label": "a black banana"}, {"bbox": [0.578203125, 0.19865828092243187, 0.9625625, 0.47220125786163525], "label": "a green backpack"}, {"bbox": [0.594578125, 0.24270440251572326, 0.9161406249999999, 0.41123689727463314], "label": "a brown banana"}, {"bbox": [0.57540625, 0.03870020964360587, 0.9584843749999999, 0.17635220125786163], "label": "a green bicycle"}, {"bbox": [0.595125, 0.560293501048218, 0.722234375, 0.8990146750524108], "label": "a black banana"}], "image_id": "193926"}, "436": {"caption": "a photo of a brown sheep and a blue sheep and a red sheep and a red sheep ", "segment": [{"bbox": [0.46503125, 0.38675233644859813, 0.770875, 0.6985747663551402], "label": "a brown sheep"}, {"bbox": [0.08196875, 0.40824766355140185, 0.302015625, 0.6663084112149533], "label": "a blue sheep"}, {"bbox": [0.027437499999999997, 0.3709579439252337, 0.206546875, 0.6279672897196261], "label": "a red sheep"}, {"bbox": [0.2140625, 0.3808411214953271, 0.88125, 0.5490654205607477], "label": "a red sheep"}], "image_id": "230166"}, "437": {"caption": "a photo of a yellow horse and a green cow and a black cow and a white cow and a blue cow and a brown cow ", "segment": [{"bbox": [0.0, 0.18216470588235295, 0.175265625, 1.0], "label": "a yellow horse"}, {"bbox": [0.75709375, 0.4084, 0.9789218749999999, 0.9773647058823529], "label": "a green cow"}, {"bbox": [0.56409375, 0.47957647058823527, 0.7568906249999999, 0.9892470588235295], "label": "a black cow"}, {"bbox": [0.374375, 0.37392941176470584, 0.5140156250000001, 0.7475294117647059], "label": "a white cow"}, {"bbox": [0.80575, 0.31527058823529414, 0.9790781249999998, 0.5592], "label": "a blue cow"}, {"bbox": [0.6440625, 0.30981176470588234, 0.7783125, 0.5700470588235294], "label": "a brown cow"}], "image_id": "410114"}, "438": {"caption": "a photo of a red banana and a red dining table and a blue bench ", "segment": [{"bbox": [0.36524999999999996, 0.7157083333333334, 0.507984375, 0.8591666666666667], "label": "a red banana"}, {"bbox": [0.029218749999999998, 0.529875, 0.763640625, 0.9714375], "label": "a red dining table"}, {"bbox": [0.0, 0.7935416666666666, 0.14835937500000002, 1.0], "label": "a blue bench"}], "image_id": "112378"}, "439": {"caption": "a photo of a green sandwich and a blue sandwich and a red sandwich and a green orange and a red orange and a brown dining table ", "segment": [{"bbox": [0.040453125, 0.42210416666666667, 0.7550625, 0.9906458333333333], "label": "a green sandwich"}, {"bbox": [0.350671875, 0.14339583333333333, 0.9983281250000001, 0.6154375000000001], "label": "a blue sandwich"}, {"bbox": [0.0, 0.09120833333333334, 0.31925, 0.4448125], "label": "a red sandwich"}, {"bbox": [0.303171875, 0.04739583333333333, 0.491875, 0.2553958333333333], "label": "a green orange"}, {"bbox": [0.2769375, 0.0, 0.48875, 0.17139583333333333], "label": "a red orange"}, {"bbox": [0.5561875, 0.0022500000000000003, 0.9977499999999999, 0.2674166666666667], "label": "a brown dining table"}], "image_id": "369370"}, "440": {"caption": "a photo of a brown sheep and a brown sheep and a black sheep ", "segment": [{"bbox": [0.5402291666666666, 0.599140625, 1.0, 0.883625], "label": "a brown sheep"}, {"bbox": [0.0, 0.593546875, 0.3928333333333333, 0.8731249999999999], "label": "a brown sheep"}, {"bbox": [0.3104791666666667, 0.5375156249999999, 0.49525, 0.72890625], "label": "a black sheep"}], "image_id": "495332"}, "441": {"caption": "a photo of a blue zebra and a black zebra and a white zebra ", "segment": [{"bbox": [0.0318125, 0.458345498783455, 0.39485937499999996, 0.8975182481751824], "label": "a blue zebra"}, {"bbox": [0.46859375, 0.3531386861313868, 0.618484375, 0.8199513381995134], "label": "a black zebra"}, {"bbox": [0.660953125, 0.34313868613138687, 0.93946875, 0.8375182481751825], "label": "a white zebra"}], "image_id": "260305"}, "442": {"caption": "a photo of a brown bicycle and a blue dining table and a green dining table ", "segment": [{"bbox": [0.22146875000000002, 0.5438333333333334, 0.914421875, 0.8727083333333334], "label": "a brown bicycle"}, {"bbox": [0.0, 0.505625, 0.17696875, 0.7505624999999999], "label": "a blue dining table"}, {"bbox": [0.57134375, 0.5258333333333334, 0.87303125, 0.6921250000000001], "label": "a green dining table"}], "image_id": "337561"}, "443": {"caption": "a photo of a brown cow and a white cow and a black cow and a green cow ", "segment": [{"bbox": [0.731234375, 0.32308093994778064, 0.867171875, 0.5371801566579635], "label": "a brown cow"}, {"bbox": [0.73871875, 0.41075718015665796, 0.95621875, 0.6236553524804178], "label": "a white cow"}, {"bbox": [0.621296875, 0.6966318537859008, 0.845875, 0.9887728459530026], "label": "a black cow"}, {"bbox": [0.40125, 0.4437597911227154, 0.634671875, 0.6382245430809399], "label": "a green cow"}], "image_id": "573455"}, "444": {"caption": "a photo of a brown car and a black car and a green car and a white truck and a green car ", "segment": [{"bbox": [0.49368749999999995, 0.2623828125, 1.0, 0.9876171874999999], "label": "a brown car"}, {"bbox": [0.12332812500000001, 0.53421875, 0.27760937500000005, 0.6627734375], "label": "a black car"}, {"bbox": [0.527921875, 0.320859375, 0.6806875, 0.60111328125], "label": "a green car"}, {"bbox": [0.006937500000000001, 0.524921875, 0.144890625, 0.668359375], "label": "a white truck"}, {"bbox": [0.0046875, 0.4609375, 0.534375, 0.64453125], "label": "a green car"}], "image_id": "142257"}, "445": {"caption": "a photo of a white potted plant and a blue couch and a yellow chair ", "segment": [{"bbox": [0.32167999999999997, 0.36551999999999996, 0.5897333333333332, 0.54828], "label": "a white potted plant"}, {"bbox": [0.28448, 0.60452, 0.9856266666666667, 1.0], "label": "a blue couch"}, {"bbox": [0.29408, 0.59996, 0.9798133333333332, 1.0], "label": "a yellow chair"}], "image_id": "143247"}, "446": {"caption": "a photo of a yellow dining table and a black chair and a green knife and a black cup and a black cup and a brown cup ", "segment": [{"bbox": [0.011764705882352941, 0.13176470588235295, 1.0, 0.971764705882353], "label": "a yellow dining table"}, {"bbox": [0.26338235294117646, 0.017434640522875817, 0.8072875816993464, 0.14805555555555555], "label": "a black chair"}, {"bbox": [0.6688725490196079, 0.5626143790849674, 0.9199509803921568, 0.7948529411764705], "label": "a green knife"}, {"bbox": [0.7119281045751634, 0.3795261437908497, 0.9011928104575163, 0.5687908496732027], "label": "a black cup"}, {"bbox": [0.08191176470588235, 0.2652124183006536, 0.2806535947712418, 0.44488562091503264], "label": "a black cup"}, {"bbox": [0.4306045751633987, 0.2520261437908497, 0.5939052287581699, 0.43602941176470594], "label": "a brown cup"}], "image_id": "541538"}, "447": {"caption": "a photo of a green car and a blue car and a blue car and a red car ", "segment": [{"bbox": [0.09734374999999999, 0.7678451882845188, 0.5505, 0.9835774058577406], "label": "a green car"}, {"bbox": [0.7368125, 0.8022384937238495, 0.99528125, 0.9797698744769875], "label": "a blue car"}, {"bbox": [0.368265625, 0.7395815899581589, 0.600890625, 0.9904602510460251], "label": "a blue car"}, {"bbox": [0.0, 0.7151255230125523, 0.1795, 1.0], "label": "a red car"}], "image_id": "480225"}, "448": {"caption": "a photo of a green zebra and a green zebra and a yellow zebra ", "segment": [{"bbox": [0.032375, 0.3838611111111111, 0.3051875, 0.7077777777777778], "label": "a green zebra"}, {"bbox": [0.470578125, 0.4816944444444444, 0.66940625, 0.6734444444444444], "label": "a green zebra"}, {"bbox": [0.79203125, 0.4403055555555555, 0.9782187499999999, 0.6891111111111111], "label": "a yellow zebra"}], "image_id": "508586"}, "449": {"caption": "a photo of a brown chair and a yellow dining table and a red pizza and a yellow vase ", "segment": [{"bbox": [0.000140625, 0.0, 0.15596875000000002, 0.23676814988290396], "label": "a brown chair"}, {"bbox": [0.0015, 0.005620608899297424, 0.996265625, 0.9898594847775175], "label": "a yellow dining table"}, {"bbox": [0.115453125, 0.43370023419203746, 0.46328125, 0.7280796252927401], "label": "a red pizza"}, {"bbox": [0.46728125, 0.0007259953161592506, 0.6515625, 0.20859484777517567], "label": "a yellow vase"}], "image_id": "212766"}, "450": {"caption": "a photo of a white bowl and a white cake and a red spoon and a white bowl and a black cup and a white bowl ", "segment": [{"bbox": [0.010116822429906542, 0.660828125, 0.5839485981308411, 0.9836406249999999], "label": "a white bowl"}, {"bbox": [0.022149532710280376, 0.6950624999999999, 0.5258644859813084, 0.9821874999999999], "label": "a white cake"}, {"bbox": [0.6147196261682244, 0.09456250000000001, 0.9913317757009347, 0.330953125], "label": "a red spoon"}, {"bbox": [0.6451635514018691, 0.7460625000000001, 0.9980140186915887, 0.9887656250000001], "label": "a white bowl"}, {"bbox": [0.758481308411215, 0.006171875, 0.9927336448598131, 0.17364062500000002], "label": "a black cup"}, {"bbox": [0.8577570093457944, 0.335625, 0.992803738317757, 0.46568750000000003], "label": "a white bowl"}], "image_id": "574837"}, "451": {"caption": "a photo of a yellow cat and a red bottle and a white bottle and a blue sink ", "segment": [{"bbox": [0.1419375, 0.34408333333333335, 0.8532187500000001, 0.8516041666666666], "label": "a yellow cat"}, {"bbox": [0.12553125, 0.0064375, 0.296140625, 0.33691666666666664], "label": "a red bottle"}, {"bbox": [0.76265625, 0.0, 0.933, 0.42602083333333335], "label": "a white bottle"}, {"bbox": [0.0, 0.03558333333333333, 1.0, 0.9862291666666666], "label": "a blue sink"}], "image_id": "543264"}, "452": {"caption": "a photo of a brown bicycle and a brown motorcycle and a blue motorcycle and a green bicycle and a green motorcycle and a green motorcycle ", "segment": [{"bbox": [0.27978125, 0.24911007025761125, 0.992890625, 0.9738407494145199], "label": "a brown bicycle"}, {"bbox": [0.1169375, 0.1618032786885246, 0.685171875, 0.7707962529274005], "label": "a brown motorcycle"}, {"bbox": [0.275875, 0.23426229508196722, 0.8231093749999999, 0.847751756440281], "label": "a blue motorcycle"}, {"bbox": [0.55025, 0.5411943793911007, 1.0, 0.990632318501171], "label": "a green bicycle"}, {"bbox": [0.07796875, 0.11011709601873537, 0.4168125, 0.532576112412178], "label": "a green motorcycle"}, {"bbox": [0.154421875, 0.12583138173302108, 0.509765625, 0.38201405152224827], "label": "a green motorcycle"}], "image_id": "404792"}, "453": {"caption": "a photo of a blue sheep and a yellow sheep and a white sheep ", "segment": [{"bbox": [0.45787500000000003, 0.551671875, 0.657875, 0.7617499999999999], "label": "a blue sheep"}, {"bbox": [0.766234375, 0.4649375, 1.0, 0.7402656249999999], "label": "a yellow sheep"}, {"bbox": [0.0, 0.5253125, 0.251375, 0.814625], "label": "a white sheep"}], "image_id": "48907"}, "454": {"caption": "a photo of a white sheep and a brown sheep and a brown sheep and a white sheep ", "segment": [{"bbox": [0.0781875, 0.47560416666666666, 0.387578125, 0.7510833333333333], "label": "a white sheep"}, {"bbox": [0.827796875, 0.37095833333333333, 1.0, 0.5999791666666667], "label": "a brown sheep"}, {"bbox": [0.53575, 0.48074999999999996, 0.8195625, 0.7981250000000001], "label": "a brown sheep"}, {"bbox": [0.5487656249999999, 0.34900000000000003, 0.8458437499999999, 0.5833333333333334], "label": "a white sheep"}], "image_id": "200541"}, "455": {"caption": "a photo of a white horse and a blue horse and a green horse and a black horse ", "segment": [{"bbox": [0.04076797385620915, 0.17524509803921567, 0.4356209150326798, 0.9563725490196078], "label": "a white horse"}, {"bbox": [0.37687908496732025, 0.17580065359477126, 0.578153594771242, 0.9616666666666666], "label": "a blue horse"}, {"bbox": [0.5280882352941176, 0.20225490196078433, 0.7483169934640523, 0.9191013071895425], "label": "a green horse"}, {"bbox": [0.747140522875817, 0.265359477124183, 0.9278921568627451, 0.7988398692810458], "label": "a black horse"}], "image_id": "41104"}, "456": {"caption": "a photo of a red boat and a red boat and a black boat ", "segment": [{"bbox": [0.00034375, 0.7545327102803738, 0.41439062500000007, 1.0], "label": "a red boat"}, {"bbox": [0.0679375, 0.37030373831775704, 0.194953125, 0.599626168224299], "label": "a red boat"}, {"bbox": [0.0875, 0.2733644859813084, 0.9984375, 0.5817757009345794], "label": "a black boat"}], "image_id": "519703"}, "457": {"caption": "a photo of a yellow sheep and a blue sheep and a blue sheep ", "segment": [{"bbox": [0.49982812499999996, 0.4749295774647887, 0.707015625, 0.8539201877934272], "label": "a yellow sheep"}, {"bbox": [0.5279375, 0.4021596244131455, 0.76640625, 0.6106338028169014], "label": "a blue sheep"}, {"bbox": [0.187734375, 0.42166666666666663, 0.46121875, 0.8301408450704225], "label": "a blue sheep"}], "image_id": "554046"}, "458": {"caption": "a photo of a black airplane and a red truck and a red truck ", "segment": [{"bbox": [0.006734374999999999, 0.022468750000000003, 0.665171875, 0.364046875], "label": "a black airplane"}, {"bbox": [0.525578125, 0.31901562499999997, 0.755875, 0.45281249999999995], "label": "a red truck"}, {"bbox": [0.413484375, 0.77940625, 0.8067343749999999, 0.9838906250000001], "label": "a red truck"}], "image_id": "541627"}, "459": {"caption": "a photo of a green dining table and a yellow pizza and a white cup and a black cup and a green knife and a green tv ", "segment": [{"bbox": [0.003, 0.157453125, 1.0, 0.982171875], "label": "a green dining table"}, {"bbox": [0.0, 0.587171875, 0.9373541666666667, 1.0], "label": "a yellow pizza"}, {"bbox": [0.7590416666666666, 0.327125, 0.9496249999999999, 0.58984375], "label": "a white cup"}, {"bbox": [0.2922291666666667, 0.313421875, 0.45243750000000005, 0.540515625], "label": "a black cup"}, {"bbox": [0.8184375, 0.630234375, 1.0, 0.7710781250000001], "label": "a green knife"}, {"bbox": [0.8710208333333332, 0.06498437500000001, 1.0, 0.19478125], "label": "a green tv"}], "image_id": "12576"}, "460": {"caption": "a photo of a white apple and a white apple and a yellow apple and a blue apple and a red apple and a white apple ", "segment": [{"bbox": [0.07221757322175733, 0.193265625, 1.0, 0.8876406249999998], "label": "a white apple"}, {"bbox": [0.00299163179916318, 0.0, 0.6424476987447699, 0.432625], "label": "a white apple"}, {"bbox": [0.6815271966527197, 0.007890625, 1.0, 0.384015625], "label": "a yellow apple"}, {"bbox": [0.18654811715481173, 0.8288437500000001, 0.8514853556485356, 0.9906406249999999], "label": "a blue apple"}, {"bbox": [0.7960878661087866, 0.632296875, 1.0, 1.0], "label": "a red apple"}, {"bbox": [0.5820920502092051, 0.0026406249999999997, 0.8790585774058577, 0.159734375], "label": "a white apple"}], "image_id": "510898"}, "461": {"caption": "a photo of a white book and a white book and a yellow book and a white scissors ", "segment": [{"bbox": [0.3764, 0.61442, 0.68936, 0.7914599999999999], "label": "a white book"}, {"bbox": [0.006, 0.56404, 0.6441866666666667, 1.0], "label": "a white book"}, {"bbox": [0.09021333333333333, 0.38268, 0.4716000000000001, 0.58424], "label": "a yellow book"}, {"bbox": [0.07317333333333334, 0.62112, 0.26461333333333337, 0.9083], "label": "a white scissors"}], "image_id": "11262"}, "462": {"caption": "a photo of a blue elephant and a white elephant and a yellow elephant ", "segment": [{"bbox": [0.142453125, 0.3440084388185654, 0.31203125, 0.49276371308016875], "label": "a blue elephant"}, {"bbox": [0.47515625000000006, 0.4203164556962025, 0.61521875, 0.5570253164556962], "label": "a white elephant"}, {"bbox": [0.71646875, 0.3863502109704641, 0.8789374999999999, 0.5951898734177216], "label": "a yellow elephant"}], "image_id": "367362"}, "463": {"caption": "a photo of a brown chair and a brown chair and a green suitcase and a green cat ", "segment": [{"bbox": [0.7500625, 0.089171875, 1.0, 0.309140625], "label": "a brown chair"}, {"bbox": [0.137625, 0.60215625, 0.5734791666666667, 0.982796875], "label": "a brown chair"}, {"bbox": [0.0, 0.00025, 1.0, 1.0], "label": "a green suitcase"}, {"bbox": [0.0, 0.258078125, 0.9022708333333332, 0.626765625], "label": "a green cat"}], "image_id": "210276"}, "464": {"caption": "a photo of a black teddy bear and a blue bench and a blue backpack ", "segment": [{"bbox": [0.22584, 0.12584, 0.6623600000000001, 0.8629333333333334], "label": "a black teddy bear"}, {"bbox": [0.0, 0.6269600000000001, 1.0, 0.9887733333333334], "label": "a blue bench"}, {"bbox": [0.1052, 0.3428533333333333, 0.3935, 0.7480533333333332], "label": "a blue backpack"}], "image_id": "395531"}, "465": {"caption": "a photo of a white cat and a red cat and a green chair and a white bed ", "segment": [{"bbox": [0.10322916666666666, 0.053765625, 0.48458333333333337, 0.548390625], "label": "a white cat"}, {"bbox": [0.2969375, 0.711234375, 0.86225, 0.9853125], "label": "a red cat"}, {"bbox": [0.21875, 0.462234375, 1.0, 0.90234375], "label": "a green chair"}, {"bbox": [0.0034583333333333332, 0.710140625, 0.34197916666666667, 0.982171875], "label": "a white bed"}], "image_id": "412377"}, "466": {"caption": "a photo of a brown bicycle and a black car and a yellow cat ", "segment": [{"bbox": [0.0, 0.01394, 0.5382133333333333, 0.9078], "label": "a brown bicycle"}, {"bbox": [0.0, 0.00158, 0.29584, 0.177], "label": "a black car"}, {"bbox": [0.26610666666666666, 0.46016, 0.5416000000000001, 0.69064], "label": "a yellow cat"}], "image_id": "297374"}, "467": {"caption": "a photo of a white sandwich and a white sandwich and a black dining table ", "segment": [{"bbox": [0.42207812499999997, 0.19047916666666667, 0.961890625, 0.6859791666666666], "label": "a white sandwich"}, {"bbox": [0.06221875, 0.135875, 0.497765625, 0.6560624999999999], "label": "a white sandwich"}, {"bbox": [0.0, 0.0, 1.0, 0.9928333333333333], "label": "a black dining table"}], "image_id": "395745"}, "468": {"caption": "a photo of a black dining table and a blue bed and a red chair and a red chair and a black chair and a blue oven ", "segment": [{"bbox": [0.47253125, 0.5583490566037737, 0.8574375, 0.999245283018868], "label": "a black dining table"}, {"bbox": [0.1399375, 0.39931603773584906, 0.4168593749999999, 0.6240330188679246], "label": "a blue bed"}, {"bbox": [0.785515625, 0.7004481132075472, 1.0, 0.9890330188679246], "label": "a red chair"}, {"bbox": [0.52671875, 0.5281603773584905, 0.6625, 0.9808490566037735], "label": "a red chair"}, {"bbox": [0.303703125, 0.8037971698113208, 0.565734375, 0.9835849056603774], "label": "a black chair"}, {"bbox": [0.690109375, 0.35537735849056606, 0.8382343750000001, 0.5997169811320755], "label": "a blue oven"}], "image_id": "541837"}, "469": {"caption": "a photo of a blue dog and a yellow bird and a yellow bird and a blue cake ", "segment": [{"bbox": [0.0, 0.6214666666666667, 0.30668, 0.9898666666666668], "label": "a blue dog"}, {"bbox": [0.00322, 0.41719999999999996, 0.26452000000000003, 0.71184], "label": "a yellow bird"}, {"bbox": [0.0039, 0.31168, 0.16558, 0.44936], "label": "a yellow bird"}, {"bbox": [0.40786, 0.11365333333333333, 0.8372, 0.7065066666666666], "label": "a blue cake"}], "image_id": "330022"}, "470": {"caption": "a photo of a yellow tv and a yellow laptop and a white keyboard ", "segment": [{"bbox": [0.42809375000000005, 0.0028125000000000003, 0.8747187499999999, 0.5668541666666668], "label": "a yellow tv"}, {"bbox": [0.0, 0.3101041666666667, 0.34045312499999997, 0.7595416666666667], "label": "a yellow laptop"}, {"bbox": [0.141578125, 0.703375, 0.82246875, 0.9887708333333334], "label": "a white keyboard"}], "image_id": "97696"}, "471": {"caption": "a photo of a blue sheep and a white sheep and a yellow sheep and a blue sheep and a blue sheep ", "segment": [{"bbox": [0.15301562500000002, 0.34948598130841124, 0.438390625, 0.751892523364486], "label": "a blue sheep"}, {"bbox": [0.58534375, 0.39999999999999997, 0.838453125, 0.9268925233644859], "label": "a white sheep"}, {"bbox": [0.082875, 0.29126168224299065, 0.45714062499999997, 0.6527336448598131], "label": "a yellow sheep"}, {"bbox": [0.4545, 0.25268691588785047, 0.646578125, 0.6420093457943925], "label": "a blue sheep"}, {"bbox": [0.06715625, 0.2916822429906542, 0.26164062499999996, 0.5835046728971963], "label": "a blue sheep"}], "image_id": "334542"}, "472": {"caption": "a photo of a blue dog and a red pizza and a brown dining table ", "segment": [{"bbox": [0.519171875, 0.0060705882352941175, 1.0, 0.9979764705882352], "label": "a blue dog"}, {"bbox": [0.0, 0.3412, 0.507375, 0.9861411764705883], "label": "a red pizza"}, {"bbox": [0.24025, 0.015741176470588238, 0.8849218749999999, 1.0], "label": "a brown dining table"}], "image_id": "273083"}, "473": {"caption": "a photo of a green dining table and a brown refrigerator and a black oven and a green chair ", "segment": [{"bbox": [0.22599431818181817, 0.7741304347826088, 0.8179261363636364, 0.9858695652173913], "label": "a green dining table"}, {"bbox": [0.8574999999999999, 0.3258260869565217, 0.998465909090909, 0.9842608695652174], "label": "a brown refrigerator"}, {"bbox": [0.39053977272727275, 0.539608695652174, 0.5615056818181818, 0.8483913043478261], "label": "a black oven"}, {"bbox": [0.6873579545454546, 0.7844347826086956, 0.8332954545454545, 0.9818260869565217], "label": "a green chair"}], "image_id": "37777"}, "474": {"caption": "a photo of a green zebra and a green zebra and a red zebra ", "segment": [{"bbox": [0.35525, 0.4077102803738318, 0.5319375, 0.6512149532710281], "label": "a green zebra"}, {"bbox": [0.460265625, 0.41404205607476635, 0.641875, 0.6507242990654205], "label": "a green zebra"}, {"bbox": [0.8153593750000001, 0.42042056074766354, 0.994140625, 0.6092523364485981], "label": "a red zebra"}], "image_id": "359751"}, "475": {"caption": "a photo of a brown elephant and a yellow elephant and a green elephant ", "segment": [{"bbox": [0.63209375, 0.38983333333333337, 0.8346875, 0.70225], "label": "a brown elephant"}, {"bbox": [0.21742187500000001, 0.38839583333333333, 0.458421875, 0.7232291666666666], "label": "a yellow elephant"}, {"bbox": [0.127, 0.43331250000000004, 0.268015625, 0.6900625], "label": "a green elephant"}], "image_id": "160220"}, "476": {"caption": "a photo of a brown cow and a yellow cow and a brown cow ", "segment": [{"bbox": [0.42971875, 0.3467708333333333, 0.952796875, 0.6643749999999999], "label": "a brown cow"}, {"bbox": [0.726453125, 0.31604166666666667, 1.0, 0.5649166666666666], "label": "a yellow cow"}, {"bbox": [0.046671875, 0.35120833333333334, 0.8014999999999999, 0.8748125000000001], "label": "a brown cow"}], "image_id": "414560"}, "477": {"caption": "a photo of a white cat and a red bed and a brown teddy bear and a green teddy bear ", "segment": [{"bbox": [0.355921875, 0.2691458333333333, 0.55628125, 0.6646875], "label": "a white cat"}, {"bbox": [0.0, 0.0, 1.0, 1.0], "label": "a red bed"}, {"bbox": [0.324734375, 0.5617083333333334, 0.825046875, 0.9827708333333334], "label": "a brown teddy bear"}, {"bbox": [0.015578125000000002, 0.3818125, 0.3935, 0.9298750000000001], "label": "a green teddy bear"}], "image_id": "445267"}, "478": {"caption": "a photo of a red tv and a yellow chair and a yellow laptop ", "segment": [{"bbox": [0.30924, 0.4134840425531915, 0.44106, 0.642686170212766], "label": "a red tv"}, {"bbox": [0.0, 0.5517287234042553, 0.33312, 0.9994680851063829], "label": "a yellow chair"}, {"bbox": [0.1569, 0.5082446808510638, 0.28584000000000004, 0.6797340425531915], "label": "a yellow laptop"}], "image_id": "160498"}, "479": {"caption": "a photo of a yellow tv and a white laptop and a brown book ", "segment": [{"bbox": [0.45278124999999997, 0.48988290398126466, 0.60571875, 0.6516861826697892], "label": "a yellow tv"}, {"bbox": [0.76209375, 0.5434894613583138, 0.9828749999999999, 0.7851288056206089], "label": "a white laptop"}, {"bbox": [0.046875, 0.48009367681498827, 0.21875, 0.9929742388758782], "label": "a brown book"}], "image_id": "472109"}, "480": {"caption": "a photo of a green train and a white train and a black chair ", "segment": [{"bbox": [0.0, 0.0033750000000000004, 0.68075, 0.9605833333333333], "label": "a green train"}, {"bbox": [0.0033750000000000004, 0.0, 1.0, 0.989875], "label": "a white train"}, {"bbox": [0.8022500000000001, 0.3528125, 0.9977500000000001, 0.9887708333333334], "label": "a black chair"}], "image_id": "112212"}, "481": {"caption": "a photo of a brown cat and a blue cat and a blue suitcase and a green book ", "segment": [{"bbox": [0.3531875, 0.24727083333333333, 0.685640625, 0.751875], "label": "a brown cat"}, {"bbox": [0.0025468749999999997, 0.27131249999999996, 0.3829375, 0.6818124999999999], "label": "a blue cat"}, {"bbox": [0.17696875, 0.40675, 0.8342656250000001, 0.9820208333333333], "label": "a blue suitcase"}, {"bbox": [0.0015625, 0.0, 0.80625, 0.5291666666666667], "label": "a green book"}], "image_id": "508440"}, "482": {"caption": "a photo of a red elephant and a black elephant and a black elephant and a red elephant and a white elephant ", "segment": [{"bbox": [0.35543749999999996, 0.4985120350109409, 0.581171875, 0.787746170678337], "label": "a red elephant"}, {"bbox": [0.21475, 0.542691466083151, 0.40081249999999996, 0.8264551422319475], "label": "a black elephant"}, {"bbox": [0.129296875, 0.59636761487965, 0.36003124999999997, 0.8591903719912474], "label": "a black elephant"}, {"bbox": [0.5630468750000001, 0.5263457330415755, 0.7104531250000001, 0.7415317286652079], "label": "a red elephant"}, {"bbox": [0.85621875, 0.5279431072210066, 1.0, 0.6743982494529541], "label": "a white elephant"}], "image_id": "398746"}, "483": {"caption": "a photo of a blue banana and a black banana and a black banana and a brown banana and a brown bottle and a green spoon ", "segment": [{"bbox": [0.17118, 0.22824, 0.8170599999999999, 0.7764800000000001], "label": "a blue banana"}, {"bbox": [0.0053, 0.25882666666666665, 0.75176, 0.6470666666666667], "label": "a black banana"}, {"bbox": [0.00882, 0.15736, 0.8047000000000001, 0.5173599999999999], "label": "a black banana"}, {"bbox": [0.3053, 0.5290133333333333, 0.9741200000000001, 0.8984266666666666], "label": "a brown banana"}, {"bbox": [0.1948, 0.0, 0.36234000000000005, 0.29349333333333333], "label": "a brown bottle"}, {"bbox": [0.0849, 0.13173333333333334, 0.27232, 0.31511999999999996], "label": "a green spoon"}], "image_id": "1153"}, "484": {"caption": "a photo of a white giraffe and a brown giraffe and a white giraffe ", "segment": [{"bbox": [0.08903124999999999, 0.31185031185031187, 0.303359375, 0.8048856548856549], "label": "a white giraffe"}, {"bbox": [0.26515625, 0.022474012474012477, 0.56071875, 0.9865072765072765], "label": "a brown giraffe"}, {"bbox": [0.688546875, 0.35305613305613304, 0.8701718749999999, 0.7652182952182952], "label": "a white giraffe"}], "image_id": "6005"}, "485": {"caption": "a photo of a blue tv and a blue cat and a white potted plant ", "segment": [{"bbox": [0.002890625, 0.04957589285714286, 0.28346875, 0.8450446428571429], "label": "a blue tv"}, {"bbox": [0.370359375, 0.3373883928571429, 0.502953125, 0.7045758928571428], "label": "a blue cat"}, {"bbox": [0.64140625, 0.0034821428571428573, 1.0, 0.8897991071428571], "label": "a white potted plant"}], "image_id": "37907"}, "486": {"caption": "a photo of a black cat and a black laptop and a brown tv and a blue tv ", "segment": [{"bbox": [0.478453125, 0.2338333333333333, 0.9973124999999999, 0.9902916666666667], "label": "a black cat"}, {"bbox": [0.06909375, 0.3595416666666667, 0.48370312500000007, 0.9887708333333334], "label": "a black laptop"}, {"bbox": [0.391015625, 0.11460416666666666, 0.8123593750000001, 0.6247291666666667], "label": "a brown tv"}, {"bbox": [0.0691875, 0.3504375, 0.41476562499999997, 0.7343958333333334], "label": "a blue tv"}], "image_id": "461963"}, "487": {"caption": "a photo of a black fork and a white apple and a blue cake and a yellow dining table ", "segment": [{"bbox": [0.7291562500000001, 0.20154166666666665, 0.941453125, 0.6258333333333332], "label": "a black fork"}, {"bbox": [0.14784375, 0.1179375, 0.3629375, 0.4080833333333333], "label": "a white apple"}, {"bbox": [0.365765625, 0.05391666666666666, 0.610734375, 0.3425], "label": "a blue cake"}, {"bbox": [0.001953125, 0.006520833333333333, 1.0, 0.9882916666666667], "label": "a yellow dining table"}], "image_id": "523869"}, "488": {"caption": "a photo of a yellow laptop and a black keyboard and a red chair and a red chair ", "segment": [{"bbox": [0.6494375, 0.195125, 0.9955, 0.837828125], "label": "a yellow laptop"}, {"bbox": [0.638765625, 0.708203125, 1.0, 0.8363437499999999], "label": "a black keyboard"}, {"bbox": [0.1350625, 0.503890625, 0.40259375, 0.77403125], "label": "a red chair"}, {"bbox": [0.36317187500000003, 0.506703125, 0.6469375, 0.7328281249999999], "label": "a red chair"}], "image_id": "261707"}, "489": {"caption": "a photo of a brown cat and a brown couch and a blue laptop and a green couch and a brown couch ", "segment": [{"bbox": [0.6206875000000001, 0.06572916666666667, 0.9035624999999999, 0.36314583333333333], "label": "a brown cat"}, {"bbox": [0.064234375, 0.13510416666666666, 0.42718749999999994, 0.676875], "label": "a brown couch"}, {"bbox": [0.016890625, 0.3141875, 0.790546875, 0.9853541666666668], "label": "a blue laptop"}, {"bbox": [0.006750000000000001, 0.0011250000000000001, 0.26351562500000003, 0.4200416666666667], "label": "a green couch"}, {"bbox": [0.0038906250000000004, 0.0, 1.0, 0.9870208333333333], "label": "a brown couch"}], "image_id": "453400"}, "490": {"caption": "a photo of a brown sandwich and a red sandwich and a green dining table and a brown cup ", "segment": [{"bbox": [0.568375, 0.5010772833723653, 0.8796406250000001, 0.900327868852459], "label": "a brown sandwich"}, {"bbox": [0.324625, 0.5313817330210773, 0.664203125, 0.9887822014051523], "label": "a red sandwich"}, {"bbox": [0.0, 0.0011241217798594848, 1.0, 0.8930210772833723], "label": "a green dining table"}, {"bbox": [0.587, 0.034004683840749415, 0.83209375, 0.5033957845433256], "label": "a brown cup"}], "image_id": "414236"}, "491": {"caption": "a photo of a blue tv and a red chair and a blue keyboard and a green book ", "segment": [{"bbox": [0.312171875, 0.05169456066945607, 0.82240625, 0.32583682008368203], "label": "a blue tv"}, {"bbox": [0.401546875, 0.7828033472803347, 0.8287968750000001, 0.9892468619246862], "label": "a red chair"}, {"bbox": [0.44690624999999995, 0.612907949790795, 0.66284375, 0.7461087866108788], "label": "a blue keyboard"}, {"bbox": [0.067484375, 0.24907949790794978, 0.24501562500000001, 0.5288284518828452], "label": "a green book"}], "image_id": "114187"}, "492": {"caption": "a photo of a black cup and a blue spoon and a black dining table ", "segment": [{"bbox": [0.224640625, 0.4127291666666667, 0.514734375, 0.8231041666666667], "label": "a black cup"}, {"bbox": [0.2645625, 0.7551666666666667, 0.40578125, 0.9095833333333334], "label": "a blue spoon"}, {"bbox": [0.001953125, 0.6103958333333334, 1.0, 0.9870208333333333], "label": "a black dining table"}], "image_id": "128224"}, "493": {"caption": "a photo of a blue banana and a yellow bowl and a blue bowl and a blue cake ", "segment": [{"bbox": [0.09679166666666666, 0.32809374999999996, 0.6838333333333332, 0.7262187499999999], "label": "a blue banana"}, {"bbox": [0.017979166666666668, 0.38651562500000003, 1.0, 0.9842656250000001], "label": "a yellow bowl"}, {"bbox": [0.59625, 0.52134375, 1.0, 0.838203125], "label": "a blue bowl"}, {"bbox": [0.6510833333333333, 0.5818125000000001, 0.9038958333333333, 0.75584375], "label": "a blue cake"}], "image_id": "351057"}, "494": {"caption": "a photo of a black broccoli and a blue broccoli and a red broccoli and a white broccoli and a brown broccoli and a green carrot ", "segment": [{"bbox": [0.5873125, 0.2705868544600939, 1.0, 0.9811737089201877], "label": "a black broccoli"}, {"bbox": [0.062796875, 0.3962206572769953, 0.54003125, 0.8726525821596244], "label": "a blue broccoli"}, {"bbox": [0.38684375000000004, 0.6470657276995304, 0.825375, 1.0], "label": "a red broccoli"}, {"bbox": [0.0640625, 0.0471830985915493, 0.4390625, 0.4509389671361502], "label": "a white broccoli"}, {"bbox": [0.380578125, 0.04, 0.7470625, 0.41176056338028166], "label": "a brown broccoli"}, {"bbox": [0.34640624999999997, 0.28143192488262914, 0.631234375, 0.5470422535211268], "label": "a green carrot"}], "image_id": "262325"}, "495": {"caption": "a photo of a brown umbrella and a blue umbrella and a white cake and a white cake and a green cake ", "segment": [{"bbox": [0.2796235294117647, 0.385, 0.673764705882353, 0.5975312500000001], "label": "a brown umbrella"}, {"bbox": [0.08816470588235294, 0.451078125, 0.33752941176470586, 0.6775], "label": "a blue umbrella"}, {"bbox": [0.39581176470588236, 0.5725, 0.792329411764706, 0.8003281250000001], "label": "a white cake"}, {"bbox": [0.013529411764705882, 0.6674218749999999, 0.460235294117647, 0.939328125], "label": "a white cake"}, {"bbox": [0.6714823529411764, 0.5205, 1.0, 0.7238749999999999], "label": "a green cake"}], "image_id": "526956"}, "496": {"caption": "a photo of a red dining table and a blue bowl and a yellow bowl and a white bowl and a brown bowl and a red cup ", "segment": [{"bbox": [0.507859375, 0.008984375, 1.0, 0.332578125], "label": "a red dining table"}, {"bbox": [0.11471875000000001, 0.618703125, 0.48842187499999995, 0.97971875], "label": "a blue bowl"}, {"bbox": [0.5257031249999999, 0.6717500000000001, 0.8256875000000001, 0.9454062499999999], "label": "a yellow bowl"}, {"bbox": [0.836890625, 0.7626875, 0.9920937500000001, 0.941265625], "label": "a white bowl"}, {"bbox": [0.500984375, 0.146921875, 0.63734375, 0.33125], "label": "a brown bowl"}, {"bbox": [0.10103124999999999, 0.49665625, 0.22646875, 0.6582343749999999], "label": "a red cup"}], "image_id": "404668"}, "497": {"caption": "a photo of a brown potted plant and a white toilet and a black sink ", "segment": [{"bbox": [0.5405, 0.2254906542056075, 0.713546875, 0.6584345794392523], "label": "a brown potted plant"}, {"bbox": [0.0, 0.7573130841121495, 0.18334375, 0.9887616822429907], "label": "a white toilet"}, {"bbox": [0.395859375, 0.7297196261682243, 0.6421875, 0.8975233644859812], "label": "a black sink"}], "image_id": "45099"}, "498": {"caption": "a photo of a brown couch and a white couch and a white book ", "segment": [{"bbox": [0.409875, 0.44946261682242994, 0.791, 0.7462383177570093], "label": "a brown couch"}, {"bbox": [0.07173437499999999, 0.4807710280373832, 0.40340625, 0.8598364485981308], "label": "a white couch"}, {"bbox": [0.1453125, 0.28738317757009346, 0.528125, 0.5981308411214953], "label": "a white book"}], "image_id": "128148"}, "499": {"caption": "a photo of a black chair and a yellow dining table and a blue cup and a brown fork and a brown knife and a brown pizza ", "segment": [{"bbox": [0.024125, 0.0042896935933147634, 0.153203125, 0.5397771587743733], "label": "a black chair"}, {"bbox": [0.0026875, 0.17225626740947075, 1.0, 0.9856545961002786], "label": "a yellow dining table"}, {"bbox": [0.6990937500000001, 0.12910863509749304, 0.8391875000000001, 0.4105292479108635], "label": "a blue cup"}, {"bbox": [0.045234375, 0.3321727019498607, 0.2379375, 0.7093871866295264], "label": "a brown fork"}, {"bbox": [0.08109374999999999, 0.3706128133704736, 0.25787499999999997, 0.705041782729805], "label": "a brown knife"}, {"bbox": [0.23737499999999997, 0.23818941504178273, 0.803609375, 0.8102785515320334], "label": "a brown pizza"}], "image_id": "552221"}, "500": {"caption": "a photo of a blue potted plant and a blue tv and a black couch and a red chair ", "segment": [{"bbox": [0.795375, 0.24666666666666667, 0.954390625, 0.5001875], "label": "a blue potted plant"}, {"bbox": [0.096078125, 0.2168125, 0.339359375, 0.46472916666666664], "label": "a blue tv"}, {"bbox": [0.59678125, 0.6387083333333333, 1.0, 0.9871041666666666], "label": "a black couch"}, {"bbox": [0.788984375, 0.3355625, 0.95784375, 0.6803124999999999], "label": "a red chair"}], "image_id": "383549"}, "501": {"caption": "a photo of a yellow bowl and a white broccoli and a brown carrot ", "segment": [{"bbox": [0.0, 0.076234375, 0.9924065420560748, 0.6950625], "label": "a yellow bowl"}, {"bbox": [0.3307242990654206, 0.10587500000000001, 0.8690420560747665, 0.395296875], "label": "a white broccoli"}, {"bbox": [0.014065420560747662, 0.1129375, 0.3905373831775701, 0.334125], "label": "a brown carrot"}], "image_id": "405196"}, "502": {"caption": "a photo of a red cake and a blue surfboard and a black surfboard ", "segment": [{"bbox": [0.071421875, 0.0404424778761062, 0.96415625, 0.9887610619469026], "label": "a red cake"}, {"bbox": [0.34568750000000004, 0.5207787610619469, 0.6427343750000001, 0.7023716814159292], "label": "a blue surfboard"}, {"bbox": [0.17828125, 0.6294867256637169, 0.566515625, 0.7776637168141592], "label": "a black surfboard"}], "image_id": "6473"}, "503": {"caption": "a photo of a yellow cat and a blue laptop and a blue chair ", "segment": [{"bbox": [0.09749999999999999, 0.20179687500000001, 0.7426458333333333, 0.945875], "label": "a yellow cat"}, {"bbox": [0.4464375, 0.356921875, 1.0, 0.9906406249999999], "label": "a blue laptop"}, {"bbox": [0.6926458333333334, 0.176609375, 1.0, 0.35928125], "label": "a blue chair"}], "image_id": "523292"}, "504": {"caption": "a photo of a white knife and a yellow bowl and a yellow cake and a brown cup and a yellow dining table ", "segment": [{"bbox": [0.616484375, 0.2897506925207756, 1.0, 0.5565373961218837], "label": "a white knife"}, {"bbox": [0.5640625, 0.04933518005540166, 0.794234375, 0.318393351800554], "label": "a yellow bowl"}, {"bbox": [0.36506249999999996, 0.2827700831024931, 0.67940625, 0.8490581717451523], "label": "a yellow cake"}, {"bbox": [0.0131875, 0.2831301939058172, 0.25346875, 0.7168698060941829], "label": "a brown cup"}, {"bbox": [0.0, 0.002880886426592798, 1.0, 0.9899445983379501], "label": "a yellow dining table"}], "image_id": "113040"}, "505": {"caption": "a photo of a yellow bicycle and a yellow bicycle and a brown bicycle and a white bicycle and a white bicycle ", "segment": [{"bbox": [0.317171875, 0.41122916666666665, 0.49998437500000004, 0.6156874999999999], "label": "a yellow bicycle"}, {"bbox": [0.448828125, 0.4404791666666667, 0.739734375, 0.7635833333333333], "label": "a yellow bicycle"}, {"bbox": [0.648875, 0.5011249999999999, 0.9522499999999999, 0.9752708333333333], "label": "a brown bicycle"}, {"bbox": [0.268984375, 0.392, 0.41684374999999996, 0.5594583333333333], "label": "a white bicycle"}, {"bbox": [0.59440625, 0.4408958333333333, 0.8421875, 0.8512916666666667], "label": "a white bicycle"}], "image_id": "522262"}, "506": {"caption": "a photo of a black airplane and a white truck and a yellow truck ", "segment": [{"bbox": [0.0, 0.0013541666666666667, 1.0, 0.1919375], "label": "a black airplane"}, {"bbox": [0.25896875, 0.37579166666666663, 0.887890625, 0.7726458333333334], "label": "a white truck"}, {"bbox": [0.055625, 0.3865208333333333, 0.6269687500000001, 0.6876458333333333], "label": "a yellow truck"}], "image_id": "41837"}, "507": {"caption": "a photo of a blue bench and a red bench and a yellow chair ", "segment": [{"bbox": [0.163484375, 0.305625, 0.50225, 0.9707916666666666], "label": "a blue bench"}, {"bbox": [0.369890625, 0.33025000000000004, 0.52615625, 0.5072916666666667], "label": "a red bench"}, {"bbox": [0.385546875, 0.25885416666666666, 0.515484375, 0.4295833333333333], "label": "a yellow chair"}], "image_id": "423039"}, "508": {"caption": "a photo of a green elephant and a green elephant and a yellow elephant and a black elephant ", "segment": [{"bbox": [0.05109375000000001, 0.20224299065420562, 0.575578125, 0.6719158878504674], "label": "a green elephant"}, {"bbox": [0.51071875, 0.22376168224299064, 0.7751875, 0.6272429906542055], "label": "a green elephant"}, {"bbox": [0.292828125, 0.3379439252336448, 0.510671875, 0.6267523364485982], "label": "a yellow elephant"}, {"bbox": [0.7434375, 0.2336214953271028, 0.9206875, 0.6831775700934579], "label": "a black elephant"}], "image_id": "139192"}, "509": {"caption": "a photo of a blue cup and a white bowl and a white dining table ", "segment": [{"bbox": [0.7536274509803922, 0.0029411764705882353, 1.0, 0.22455882352941178], "label": "a blue cup"}, {"bbox": [0.08949346405228759, 0.22616013071895424, 0.7494444444444444, 0.8548039215686274], "label": "a white bowl"}, {"bbox": [0.0025980392156862747, 0.0, 1.0, 0.9818137254901961], "label": "a white dining table"}], "image_id": "409259"}, "510": {"caption": "a photo of a green zebra and a black zebra and a black zebra ", "segment": [{"bbox": [0.47228125, 0.525152224824356, 0.952046875, 0.9498829039812647], "label": "a green zebra"}, {"bbox": [0.10495312500000001, 0.3691100702576113, 0.5802343750000001, 0.9488758782201405], "label": "a black zebra"}, {"bbox": [0.5568906250000001, 0.37426229508196723, 0.717125, 0.5432786885245902], "label": "a black zebra"}], "image_id": "473974"}, "511": {"caption": "a photo of a blue zebra and a white zebra and a black zebra and a green zebra ", "segment": [{"bbox": [0.128640625, 0.5467083333333334, 0.298875, 0.8092291666666667], "label": "a blue zebra"}, {"bbox": [0.3108125, 0.5619375000000001, 0.52703125, 0.8322083333333334], "label": "a white zebra"}, {"bbox": [0.470265625, 0.5899375, 0.7206718750000001, 0.839125], "label": "a black zebra"}, {"bbox": [0.51653125, 0.6331666666666667, 0.9211406249999999, 0.9905625], "label": "a green zebra"}], "image_id": "268729"}, "512": {"caption": "a photo of a green cat and a green car and a blue car and a black motorcycle and a brown cat ", "segment": [{"bbox": [0.34032, 0.47957333333333335, 0.69194, 0.7763466666666666], "label": "a green cat"}, {"bbox": [0.008060000000000001, 0.003946666666666667, 0.45806, 0.48565333333333327], "label": "a green car"}, {"bbox": [0.057280000000000005, 0.59504, 1.0, 1.0], "label": "a blue car"}, {"bbox": [0.11173999999999999, 0.058133333333333335, 1.0, 0.7827200000000001], "label": "a black motorcycle"}, {"bbox": [0.41587999999999997, 0.3596266666666667, 0.5824, 0.5200533333333334], "label": "a brown cat"}], "image_id": "190326"}, "513": {"caption": "a photo of a brown suitcase and a black suitcase and a white suitcase and a brown suitcase and a green backpack ", "segment": [{"bbox": [0.43499999999999994, 0.2580603448275862, 0.902578125, 0.6872629310344828], "label": "a brown suitcase"}, {"bbox": [0.25773437499999996, 0.0447198275862069, 0.6818125, 0.34469827586206897], "label": "a black suitcase"}, {"bbox": [0.8164374999999999, 0.22635775862068966, 0.9993281249999999, 0.4695905172413793], "label": "a white suitcase"}, {"bbox": [0.0, 0.2692887931034483, 0.236234375, 0.7726508620689655], "label": "a brown suitcase"}, {"bbox": [0.653625, 0.002586206896551724, 0.99921875, 0.3264224137931034], "label": "a green backpack"}], "image_id": "168010"}, "514": {"caption": "a photo of a white bottle and a green bottle and a green sandwich and a brown wine glass and a blue knife ", "segment": [{"bbox": [0.71815625, 0.004496487119437939, 0.9400625, 0.7438173302107729], "label": "a white bottle"}, {"bbox": [0.46778125, 0.008992974238875878, 0.643203125, 0.5797658079625293], "label": "a green bottle"}, {"bbox": [0.166421875, 0.48330210772833726, 0.514265625, 0.966440281030445], "label": "a green sandwich"}, {"bbox": [0.1364375, 0.05168618266978923, 0.301359375, 0.669672131147541], "label": "a brown wine glass"}, {"bbox": [0.47978125, 0.7528103044496487, 0.9625468749999999, 0.9865105386416863], "label": "a blue knife"}], "image_id": "89549"}, "515": {"caption": "a photo of a black orange and a white orange and a yellow orange and a blue orange and a red orange and a red orange ", "segment": [{"bbox": [0.06021875, 0.31896470588235293, 0.96684375, 0.9873411764705883], "label": "a black orange"}, {"bbox": [0.6554375, 0.35505882352941176, 0.890015625, 0.7108941176470588], "label": "a white orange"}, {"bbox": [0.36859375, 0.33089411764705884, 0.6148125, 0.6657411764705883], "label": "a yellow orange"}, {"bbox": [0.065375, 0.3008235294117647, 0.311390625, 0.5857882352941176], "label": "a blue orange"}, {"bbox": [0.691203125, 0.039411764705882354, 0.8942499999999999, 0.3171294117647059], "label": "a red orange"}, {"bbox": [0.24320312500000002, 0.24155294117647058, 0.42603125000000003, 0.5039058823529412], "label": "a red orange"}], "image_id": "262113"}, "516": {"caption": "a photo of a blue sandwich and a yellow cup and a red sandwich ", "segment": [{"bbox": [0.019453124999999998, 0.36277777777777775, 0.43534375000000003, 0.860111111111111], "label": "a blue sandwich"}, {"bbox": [0.84784375, 0.0047777777777777775, 0.9973593749999999, 0.38366666666666666], "label": "a yellow cup"}, {"bbox": [0.32778125, 0.16297222222222224, 0.59721875, 0.4864166666666667], "label": "a red sandwich"}], "image_id": "92634"}, "517": {"caption": "a photo of a red tv and a blue couch and a brown chair and a brown chair ", "segment": [{"bbox": [0.30339062499999997, 0.251875, 0.49589062500000003, 0.4161458333333333], "label": "a red tv"}, {"bbox": [0.292921875, 0.6352708333333333, 0.9254374999999999, 0.9985416666666667], "label": "a blue couch"}, {"bbox": [0.10325, 0.5714375, 0.38765625000000004, 0.8233750000000001], "label": "a brown chair"}, {"bbox": [0.560015625, 0.4595208333333333, 0.762109375, 0.6281041666666667], "label": "a brown chair"}], "image_id": "548962"}, "518": {"caption": "a photo of a brown spoon and a brown bowl and a brown broccoli and a white broccoli and a red dining table ", "segment": [{"bbox": [0.09936329588014982, 0.7934574468085106, 1.0, 0.9987765957446808], "label": "a brown spoon"}, {"bbox": [0.011235955056179775, 0.04175531914893617, 0.900749063670412, 0.8795212765957446], "label": "a brown bowl"}, {"bbox": [0.49426966292134833, 0.2321276595744681, 0.6522097378277153, 0.5708510638297872], "label": "a brown broccoli"}, {"bbox": [0.2699625468164794, 0.2447872340425532, 0.42205992509363294, 0.4402659574468086], "label": "a white broccoli"}, {"bbox": [0.0, 0.0, 1.0, 1.0], "label": "a red dining table"}], "image_id": "484069"}, "519": {"caption": "a photo of a green microwave and a black oven and a yellow oven ", "segment": [{"bbox": [0.28909375000000004, 0.2753521126760563, 0.494234375, 0.45474178403755866], "label": "a green microwave"}, {"bbox": [0.29440625, 0.5578873239436619, 0.514671875, 0.7347417840375586], "label": "a black oven"}, {"bbox": [0.292328125, 0.7241079812206573, 0.517203125, 0.8614788732394366], "label": "a yellow oven"}], "image_id": "207196"}, "520": {"caption": "a photo of a brown giraffe and a brown giraffe and a blue giraffe ", "segment": [{"bbox": [0.18951562500000002, 0.46318750000000003, 0.36871875000000004, 0.6940833333333334], "label": "a brown giraffe"}, {"bbox": [0.446484375, 0.43314583333333334, 0.6892968749999999, 0.6894166666666667], "label": "a brown giraffe"}, {"bbox": [0.6073906250000001, 0.28881249999999997, 0.73609375, 0.6599999999999999], "label": "a blue giraffe"}], "image_id": "155035"}, "521": {"caption": "a photo of a white bowl and a yellow banana and a yellow cup and a yellow bowl and a black dining table ", "segment": [{"bbox": [0.42303125, 0.13483333333333333, 0.6438125, 0.4471875], "label": "a white bowl"}, {"bbox": [0.5039374999999999, 0.5011249999999999, 0.9, 0.6831458333333332], "label": "a yellow banana"}, {"bbox": [0.13634375, 0.2728541666666667, 0.35809375, 0.5786874999999999], "label": "a yellow cup"}, {"bbox": [0.7033125, 0.22597916666666668, 0.8963906250000001, 0.4570625], "label": "a yellow bowl"}, {"bbox": [0.01640625, 0.3157083333333333, 1.0, 1.0], "label": "a black dining table"}], "image_id": "347568"}, "522": {"caption": "a photo of a white car and a blue fire hydrant and a white truck and a yellow truck ", "segment": [{"bbox": [0.0020496894409937887, 0.32228124999999996, 0.2613664596273292, 0.45275], "label": "a white car"}, {"bbox": [0.18126293995859213, 0.557625, 0.31552795031055897, 0.7865624999999999], "label": "a blue fire hydrant"}, {"bbox": [0.15296066252587992, 0.2501875, 0.4043892339544513, 0.39396875], "label": "a white truck"}, {"bbox": [0.4347412008281573, 0.026968750000000003, 1.0, 0.62696875], "label": "a yellow truck"}], "image_id": "229478"}, "523": {"caption": "a photo of a green teddy bear and a blue teddy bear and a yellow chair ", "segment": [{"bbox": [0.5494375, 0.199625, 0.9960625000000001, 0.9906458333333333], "label": "a green teddy bear"}, {"bbox": [0.00671875, 0.008958333333333334, 0.655828125, 0.9865416666666668], "label": "a blue teddy bear"}, {"bbox": [0.0, 0.0026041666666666665, 1.0, 0.9870208333333333], "label": "a yellow chair"}], "image_id": "432234"}, "524": {"caption": "a photo of a white hot dog and a blue cup and a red dining table ", "segment": [{"bbox": [0.10228124999999999, 0.4516393442622951, 0.8811875, 0.9893911007025762], "label": "a white hot dog"}, {"bbox": [0.794625, 0.004496487119437939, 1.0, 0.530327868852459], "label": "a blue cup"}, {"bbox": [0.0, 0.0, 0.39642187500000003, 0.3152459016393443], "label": "a red dining table"}], "image_id": "350340"}, "525": {"caption": "a photo of a yellow elephant and a white elephant and a yellow elephant ", "segment": [{"bbox": [0.583484375, 0.5213411764705882, 0.83865625, 0.7123529411764706], "label": "a yellow elephant"}, {"bbox": [0.41626562500000003, 0.5879294117647059, 0.587015625, 0.7567764705882353], "label": "a white elephant"}, {"bbox": [0.089390625, 0.5928470588235294, 0.2665625, 0.790635294117647], "label": "a yellow elephant"}], "image_id": "540483"}, "526": {"caption": "a photo of a white teddy bear and a red teddy bear and a blue teddy bear and a green bed ", "segment": [{"bbox": [0.38796875000000003, 0.21505543237250555, 0.7094375, 0.7386474501108647], "label": "a white teddy bear"}, {"bbox": [0.074421875, 0.21798226164079823, 0.454484375, 0.696629711751663], "label": "a red teddy bear"}, {"bbox": [0.661140625, 0.3449667405764967, 0.882875, 0.7563414634146342], "label": "a blue teddy bear"}, {"bbox": [0.0, 0.0, 0.9975468749999999, 0.9792239467849224], "label": "a green bed"}], "image_id": "113403"}, "527": {"caption": "a photo of a blue cake and a green cake and a blue cake and a red cake and a red cake and a white cake ", "segment": [{"bbox": [0.16362745098039216, 0.8266013071895425, 0.4072385620915033, 0.9770261437908497], "label": "a blue cake"}, {"bbox": [0.5959313725490196, 0.6966993464052288, 0.8295915032679738, 0.8228431372549019], "label": "a green cake"}, {"bbox": [0.6824346405228758, 0.823202614379085, 0.9391830065359477, 0.9628431372549019], "label": "a blue cake"}, {"bbox": [0.41784313725490196, 0.8108823529411765, 0.6881209150326797, 0.9820098039215687], "label": "a red cake"}, {"bbox": [0.0, 0.7426470588235294, 0.20184640522875819, 0.8692320261437909], "label": "a red cake"}, {"bbox": [0.23480392156862742, 0.7248366013071896, 0.4304575163398693, 0.8513398692810458], "label": "a white cake"}], "image_id": "503424"}, "528": {"caption": "a photo of a brown bird and a blue bird and a yellow bird and a blue bird and a green bear ", "segment": [{"bbox": [0.344015625, 0.09480093676814988, 0.49640625, 0.3054332552693208], "label": "a brown bird"}, {"bbox": [0.426875, 0.6825058548009367, 0.5983124999999999, 0.948384074941452], "label": "a blue bird"}, {"bbox": [0.65, 0.7244730679156909, 0.873359375, 0.9133021077283373], "label": "a yellow bird"}, {"bbox": [0.0, 0.6091334894613584, 0.15065625, 0.8285011709601875], "label": "a blue bird"}, {"bbox": [0.30678125, 0.2716393442622951, 0.672875, 0.7177517564402811], "label": "a green bear"}], "image_id": "229997"}, "529": {"caption": "a photo of a green dog and a red cow and a brown cow and a black cow ", "segment": [{"bbox": [0.303828125, 0.50725, 0.4850312499999999, 0.7185208333333333], "label": "a green dog"}, {"bbox": [0.188765625, 0.31460416666666663, 0.32865625, 0.6741666666666667], "label": "a red cow"}, {"bbox": [0.5444375, 0.35475, 0.86403125, 0.6952083333333333], "label": "a brown cow"}, {"bbox": [0.830953125, 0.3813333333333333, 0.9778437499999999, 0.744], "label": "a black cow"}], "image_id": "398440"}, "530": {"caption": "a photo of a brown car and a yellow car and a brown bus ", "segment": [{"bbox": [0.002421875, 0.43427777777777776, 0.23396875, 0.8157222222222221], "label": "a brown car"}, {"bbox": [0.0666875, 0.3940555555555556, 0.246640625, 0.555138888888889], "label": "a yellow car"}, {"bbox": [0.24539062500000003, 0.1277222222222222, 0.8682812500000001, 0.9263888888888889], "label": "a brown bus"}], "image_id": "147223"}, "531": {"caption": "a photo of a blue tv and a white cat and a yellow laptop and a black keyboard ", "segment": [{"bbox": [0.5154375, 0.15847916666666664, 0.954484375, 0.6253958333333334], "label": "a blue tv"}, {"bbox": [0.616125, 0.0, 0.9919375, 0.9763541666666666], "label": "a white cat"}, {"bbox": [0.0016718750000000002, 0.15458333333333335, 0.40604687500000003, 0.9688958333333333], "label": "a yellow laptop"}, {"bbox": [0.0, 0.605375, 0.307734375, 0.7623333333333332], "label": "a black keyboard"}], "image_id": "375509"}, "532": {"caption": "a photo of a blue umbrella and a green chair and a brown chair and a green chair and a white chair and a yellow umbrella ", "segment": [{"bbox": [0.3161875, 0.273140625, 0.9932916666666666, 0.602], "label": "a blue umbrella"}, {"bbox": [0.21272916666666666, 0.5955, 0.8808958333333334, 0.92809375], "label": "a green chair"}, {"bbox": [0.23520833333333335, 0.57125, 0.8086874999999999, 0.759421875], "label": "a brown chair"}, {"bbox": [0.26960416666666664, 0.5539531249999999, 0.7316666666666667, 0.717859375], "label": "a green chair"}, {"bbox": [0.2858541666666667, 0.529125, 0.7059791666666667, 0.678640625], "label": "a white chair"}, {"bbox": [0.2700208333333334, 0.41353125, 0.5695, 0.5391562500000001], "label": "a yellow umbrella"}], "image_id": "481130"}, "533": {"caption": "a photo of a white dog and a green bus and a black stop sign and a black dog ", "segment": [{"bbox": [0.51818, 0.26061333333333336, 0.71666, 0.44445333333333337], "label": "a white dog"}, {"bbox": [0.0033599999999999997, 0.00021333333333333333, 1.0, 0.9442933333333332], "label": "a green bus"}, {"bbox": [0.07736, 0.52904, 0.38172, 0.9079466666666667], "label": "a black stop sign"}, {"bbox": [0.80064, 0.11949333333333334, 1.0, 0.44154666666666664], "label": "a black dog"}], "image_id": "70493"}, "534": {"caption": "a photo of a black sandwich and a black fork and a red bowl and a blue dining table ", "segment": [{"bbox": [0.131453125, 0.18389583333333331, 0.798875, 0.7726666666666666], "label": "a black sandwich"}, {"bbox": [0.3471875, 0.15212499999999998, 0.9994375, 0.28470833333333334], "label": "a black fork"}, {"bbox": [0.0, 0.04272916666666667, 0.9983281249999999, 0.9599375], "label": "a red bowl"}, {"bbox": [0.001953125, 0.0026041666666666665, 1.0, 0.9870208333333333], "label": "a blue dining table"}], "image_id": "77951"}, "535": {"caption": "a photo of a brown dining table and a blue donut and a black donut ", "segment": [{"bbox": [0.00354, 0.0011733333333333333, 1.0, 1.0], "label": "a brown dining table"}, {"bbox": [0.5129600000000001, 0.19344000000000003, 0.66062, 0.6468], "label": "a blue donut"}, {"bbox": [0.014960000000000001, 0.6573066666666667, 0.21532, 0.9183466666666666], "label": "a black donut"}], "image_id": "405432"}, "536": {"caption": "a photo of a yellow cat and a yellow car and a green car ", "segment": [{"bbox": [0.3164166666666667, 0.1819375, 0.5601458333333333, 0.3888125], "label": "a yellow cat"}, {"bbox": [0.0, 0.360515625, 0.9985625, 0.989265625], "label": "a yellow car"}, {"bbox": [0.0027500000000000003, 0.31843750000000004, 0.1837083333333333, 0.46228125000000003], "label": "a green car"}], "image_id": "395290"}, "537": {"caption": "a photo of a brown donut and a brown donut and a red donut ", "segment": [{"bbox": [0.04925, 0.401109375, 1.0, 1.0], "label": "a brown donut"}, {"bbox": [0.20420833333333333, 0.030406250000000003, 0.991, 0.456078125], "label": "a brown donut"}, {"bbox": [0.0, 0.20379687500000002, 0.26845833333333335, 0.637796875], "label": "a red donut"}], "image_id": "206878"}, "538": {"caption": "a photo of a red toilet and a brown sink and a yellow sink and a red toilet ", "segment": [{"bbox": [0.20245833333333335, 0.5526718749999999, 0.7430625000000001, 0.8764062499999999], "label": "a red toilet"}, {"bbox": [0.3793125, 0.42670312499999996, 0.6661458333333333, 0.5581093749999999], "label": "a brown sink"}, {"bbox": [0.3343541666666667, 0.793109375, 0.7996666666666667, 0.9784374999999998], "label": "a yellow sink"}, {"bbox": [0.32208333333333333, 0.7896093750000001, 0.8069166666666666, 0.984421875], "label": "a red toilet"}], "image_id": "275929"}, "539": {"caption": "a photo of a yellow dining table and a green cup and a black spoon and a green apple and a yellow cup and a yellow cup ", "segment": [{"bbox": [0.00176, 0.004853333333333334, 0.99706, 0.9813333333333333], "label": "a yellow dining table"}, {"bbox": [0.22078, 0.03370666666666667, 0.40618, 0.3370666666666667], "label": "a green cup"}, {"bbox": [0.46868, 0.23256, 0.8098, 0.37535999999999997], "label": "a black spoon"}, {"bbox": [0.75352, 0.004693333333333333, 0.9507000000000001, 0.24882666666666667], "label": "a green apple"}, {"bbox": [0.35394, 0.040453333333333334, 0.5039399999999999, 0.30562666666666666], "label": "a yellow cup"}, {"bbox": [0.0, 0.05677333333333333, 0.14393999999999998, 0.3012533333333333], "label": "a yellow cup"}], "image_id": "440377"}, "540": {"caption": "a photo of a white vase and a white vase and a blue scissors and a green clock ", "segment": [{"bbox": [0.6073906250000001, 0.12975, 0.748234375, 0.6165], "label": "a white vase"}, {"bbox": [0.744515625, 0.1488888888888889, 0.8949374999999999, 0.6455], "label": "a white vase"}, {"bbox": [0.5018906249999999, 0.5906388888888888, 0.677984375, 0.7962777777777776], "label": "a blue scissors"}, {"bbox": [0.0, 0.47191666666666665, 0.15042187499999998, 0.6876388888888888], "label": "a green clock"}], "image_id": "382758"}, "541": {"caption": "a photo of a black refrigerator and a yellow chair and a green dining table and a brown oven ", "segment": [{"bbox": [0.20090625, 0.3528103044496487, 0.4512812500000001, 0.9330210772833724], "label": "a black refrigerator"}, {"bbox": [0.22690625, 0.6497658079625293, 0.40121874999999996, 0.9876112412177985], "label": "a yellow chair"}, {"bbox": [0.0015, 0.6967681498829039, 0.31784375000000004, 0.9484543325526932], "label": "a green dining table"}, {"bbox": [0.776640625, 0.7033723653395784, 0.9355625, 0.9887587822014051], "label": "a brown oven"}], "image_id": "221753"}, "542": {"caption": "a photo of a green dining table and a brown cup and a black bowl ", "segment": [{"bbox": [0.0, 0.045109375, 1.0, 0.554078125], "label": "a green dining table"}, {"bbox": [0.0, 0.0, 0.15804166666666666, 0.151203125], "label": "a brown cup"}, {"bbox": [0.6568124999999999, 0.23403125, 0.8496458333333333, 0.35964062500000005], "label": "a black bowl"}], "image_id": "292103"}, "543": {"caption": "a photo of a yellow chair and a brown chair and a white chair and a brown chair ", "segment": [{"bbox": [0.0, 0.43819672131147547, 0.26387499999999997, 0.9887587822014052], "label": "a yellow chair"}, {"bbox": [0.21789062499999998, 0.35023419203747075, 0.7393124999999999, 0.9876112412177986], "label": "a brown chair"}, {"bbox": [0.58621875, 0.3101170960187353, 1.0, 0.8921311475409835], "label": "a white chair"}, {"bbox": [0.01953125, 0.3434660421545667, 0.5529843750000001, 0.9876112412177986], "label": "a brown chair"}], "image_id": "292616"}, "544": {"caption": "a photo of a black chair and a green oven and a white chair ", "segment": [{"bbox": [0.1375, 0.6923333333333334, 0.35684375, 1.0], "label": "a black chair"}, {"bbox": [0.563984375, 0.6138333333333333, 0.704375, 0.8879791666666667], "label": "a green oven"}, {"bbox": [0.001953125, 0.6857083333333333, 0.15, 0.9870208333333333], "label": "a white chair"}], "image_id": "512576"}, "545": {"caption": "a photo of a blue spoon and a red cake and a yellow dining table and a black cake and a red cup ", "segment": [{"bbox": [0.435328125, 0.5672599531615925, 0.750421875, 0.8107025761124123], "label": "a blue spoon"}, {"bbox": [0.20390625, 0.28501170960187355, 0.43479687499999997, 0.7636768149882903], "label": "a red cake"}, {"bbox": [0.002078125, 0.006838407494145199, 1.0, 0.9818266978922717], "label": "a yellow dining table"}, {"bbox": [0.45590624999999996, 0.2339344262295082, 0.706890625, 0.6808899297423888], "label": "a black cake"}, {"bbox": [0.852875, 0.11627634660421546, 1.0, 0.4583606557377049], "label": "a red cup"}], "image_id": "323291"}, "546": {"caption": "a photo of a blue car and a white bus and a brown bus ", "segment": [{"bbox": [0.18160937500000002, 0.5955208333333334, 0.31446874999999996, 0.7434999999999999], "label": "a blue car"}, {"bbox": [0.3, 0.12360416666666667, 0.691015625, 0.8561875], "label": "a white bus"}, {"bbox": [0.008421874999999999, 0.4516875, 0.261234375, 0.6786458333333333], "label": "a brown bus"}], "image_id": "550691"}, "547": {"caption": "a photo of a black sheep and a brown sheep and a red sheep and a brown sheep and a black cow and a white sheep ", "segment": [{"bbox": [0.2540625, 0.372859375, 0.6325625, 0.96425], "label": "a black sheep"}, {"bbox": [0.14622916666666666, 0.266671875, 0.7770625, 0.7311875000000001], "label": "a brown sheep"}, {"bbox": [0.1923125, 0.139765625, 0.7639166666666667, 0.38648437500000005], "label": "a red sheep"}, {"bbox": [0.24627083333333333, 0.0828125, 0.5263333333333333, 0.24134374999999997], "label": "a brown sheep"}, {"bbox": [0.25364583333333335, 0.37560937499999997, 0.6305833333333334, 0.9692343749999999], "label": "a black cow"}, {"bbox": [0.6652083333333334, 0.09096875, 0.9357291666666666, 0.2535625], "label": "a white sheep"}], "image_id": "233567"}, "548": {"caption": "a photo of a green potted plant and a red cat and a green chair ", "segment": [{"bbox": [0.42699999999999994, 0.04533957845433255, 0.9216093749999998, 0.9866744730679157], "label": "a green potted plant"}, {"bbox": [0.200875, 0.30967213114754094, 0.526578125, 0.7118266978922716], "label": "a red cat"}, {"bbox": [0.0214375, 0.0003044496487119438, 0.524328125, 0.9232084309133489], "label": "a green chair"}], "image_id": "317480"}, "549": {"caption": "a photo of a yellow hot dog and a yellow cup and a brown bowl and a yellow carrot and a black carrot and a red cup ", "segment": [{"bbox": [0.1003, 0.10132132132132132, 0.59234, 0.7130930930930931], "label": "a yellow hot dog"}, {"bbox": [0.08231999999999999, 0.02921921921921922, 0.23645999999999998, 0.20972972972972975], "label": "a yellow cup"}, {"bbox": [0.0, 0.07546546546546547, 0.9975, 0.9876276276276276], "label": "a brown bowl"}, {"bbox": [0.50436, 0.6994294294294294, 0.68696, 0.8365165165165165], "label": "a yellow carrot"}, {"bbox": [0.5762, 0.5819519519519519, 0.8144000000000001, 0.8023123123123121], "label": "a black carrot"}, {"bbox": [0.0, 0.13504504504504505, 0.17266, 0.29306306306306307], "label": "a red cup"}], "image_id": "518889"}, "550": {"caption": "a photo of a red horse and a yellow horse and a white cow and a brown horse and a white horse ", "segment": [{"bbox": [0.435953125, 0.34993920972644377, 0.718484375, 0.727629179331307], "label": "a red horse"}, {"bbox": [0.2426875, 0.27887537993920974, 0.44518749999999996, 0.6658054711246201], "label": "a yellow horse"}, {"bbox": [0.13282812500000002, 0.48641337386018235, 0.345109375, 0.7137082066869301], "label": "a white cow"}, {"bbox": [0.61190625, 0.10541033434650456, 0.769703125, 0.32209726443769], "label": "a brown horse"}, {"bbox": [0.40774999999999995, 0.0841337386018237, 0.5871875, 0.3074468085106383], "label": "a white horse"}], "image_id": "71209"}, "551": {"caption": "a photo of a blue refrigerator and a red car and a black car ", "segment": [{"bbox": [0.0994375, 0.23145833333333332, 0.37078125, 0.9370833333333333], "label": "a blue refrigerator"}, {"bbox": [0.6455, 0.26083333333333336, 1.0, 0.9866666666666666], "label": "a red car"}, {"bbox": [0.543171875, 0.319, 0.68225, 0.5598541666666667], "label": "a black car"}], "image_id": "51025"}, "552": {"caption": "a photo of a brown cell phone and a yellow mouse and a green keyboard and a red handbag ", "segment": [{"bbox": [0.28514062500000004, 0.16329166666666667, 0.5154687499999999, 0.3265], "label": "a brown cell phone"}, {"bbox": [0.63471875, 0.4469375, 0.78359375, 0.7614375], "label": "a yellow mouse"}, {"bbox": [0.7853749999999999, 0.222, 1.0, 0.6019791666666666], "label": "a green keyboard"}, {"bbox": [0.048578125, 0.5820416666666667, 0.37889062500000004, 0.9887708333333334], "label": "a red handbag"}], "image_id": "459440"}, "553": {"caption": "a photo of a brown car and a blue car and a white car and a yellow car and a black car and a white car ", "segment": [{"bbox": [0.188234375, 0.6157065217391304, 0.335203125, 0.8130163043478261], "label": "a brown car"}, {"bbox": [0.618546875, 0.60375, 0.764296875, 0.8169565217391304], "label": "a blue car"}, {"bbox": [0.015140625, 0.669375, 0.17040625, 0.8007608695652174], "label": "a white car"}, {"bbox": [0.39668749999999997, 0.6266032608695652, 0.536234375, 0.8086141304347826], "label": "a yellow car"}, {"bbox": [0.7984843749999999, 0.6275, 0.953375, 0.8190217391304347], "label": "a black car"}, {"bbox": [0.070890625, 0.6304891304347826, 0.19856249999999998, 0.7621467391304348], "label": "a white car"}], "image_id": "555763"}, "554": {"caption": "a photo of a white bird and a white bird and a brown bird and a red bird and a brown bird and a yellow bird ", "segment": [{"bbox": [0.383703125, 0.32618266978922716, 0.72159375, 0.6588056206088994], "label": "a white bird"}, {"bbox": [0.678515625, 0.32925058548009367, 0.9254843749999999, 0.6078922716627635], "label": "a white bird"}, {"bbox": [0.154765625, 0.174519906323185, 0.34853125, 0.51096018735363], "label": "a brown bird"}, {"bbox": [0.0, 0.21555035128805622, 0.18715625, 0.5538875878220141], "label": "a red bird"}, {"bbox": [0.43239062500000003, 0.14292740046838406, 0.6371249999999999, 0.39829039812646366], "label": "a brown bird"}, {"bbox": [0.8609843749999999, 0.21271662763466043, 0.9880156249999998, 0.3765573770491803], "label": "a yellow bird"}], "image_id": "367876"}, "555": {"caption": "a photo of a red chair and a black couch and a blue couch and a yellow dining table and a red couch ", "segment": [{"bbox": [0.0234375, 0.3196724890829694, 0.1584375, 0.5410043668122271], "label": "a red chair"}, {"bbox": [0.15326562500000002, 0.2993886462882096, 0.574640625, 0.7051528384279476], "label": "a black couch"}, {"bbox": [0.506140625, 0.512882096069869, 0.9503125000000001, 0.9522925764192139], "label": "a blue couch"}, {"bbox": [0.631984375, 0.47272925764192136, 1.0, 0.984410480349345], "label": "a yellow dining table"}, {"bbox": [0.7193906250000001, 0.4022489082969432, 1.0, 0.6253930131004367], "label": "a red couch"}], "image_id": "196311"}, "556": {"caption": "a photo of a green sandwich and a yellow sandwich and a red bowl and a red cup and a blue hot dog ", "segment": [{"bbox": [0.24943749999999998, 0.2939110070257611, 0.51090625, 0.6182435597189696], "label": "a green sandwich"}, {"bbox": [0.46882812500000004, 0.34121779859484774, 0.671703125, 0.7196018735362997], "label": "a yellow sandwich"}, {"bbox": [0.040390625, 0.3455269320843091, 0.27675, 0.6123419203747074], "label": "a red bowl"}, {"bbox": [0.6096874999999999, 0.45887587822014053, 0.79190625, 0.7168149882903981], "label": "a red cup"}, {"bbox": [0.23742187499999998, 0.2883138173302108, 0.6671875, 0.5974004683840749], "label": "a blue hot dog"}], "image_id": "50829"}, "557": {"caption": "a photo of a yellow suitcase and a white suitcase and a yellow backpack and a blue suitcase and a black suitcase ", "segment": [{"bbox": [0.72978125, 0.0, 1.0, 0.4449375], "label": "a yellow suitcase"}, {"bbox": [0.667296875, 0.5306458333333334, 0.917921875, 0.7301666666666667], "label": "a white suitcase"}, {"bbox": [0.0915625, 0.0, 0.71103125, 0.9870208333333333], "label": "a yellow backpack"}, {"bbox": [0.0390625, 0.006520833333333333, 0.6953125, 0.9856874999999999], "label": "a blue suitcase"}, {"bbox": [0.58809375, 0.6533333333333334, 1.0, 0.9994999999999999], "label": "a black suitcase"}], "image_id": "370116"}, "558": {"caption": "a photo of a black broccoli and a black broccoli and a white broccoli and a brown broccoli and a red broccoli and a white broccoli ", "segment": [{"bbox": [0.07940625, 0.054125, 0.34412499999999996, 0.7129375000000001], "label": "a black broccoli"}, {"bbox": [0.31059375, 0.0, 0.8911718750000001, 0.41575], "label": "a black broccoli"}, {"bbox": [0.43059375, 0.34752083333333333, 0.8858750000000001, 0.9851666666666666], "label": "a white broccoli"}, {"bbox": [0.0035312499999999997, 0.1482291666666667, 0.16059375, 0.47293750000000007], "label": "a brown broccoli"}, {"bbox": [0.0052812499999999995, 0.03075, 0.154921875, 0.26314583333333336], "label": "a red broccoli"}, {"bbox": [0.0016875000000000002, 0.5668541666666667, 0.564609375, 0.9848333333333332], "label": "a white broccoli"}], "image_id": "282328"}, "559": {"caption": "a photo of a red suitcase and a green suitcase and a white suitcase and a green suitcase ", "segment": [{"bbox": [0.015312500000000001, 0.26077083333333334, 0.33673437500000003, 0.5895625], "label": "a red suitcase"}, {"bbox": [0.645515625, 0.1930625, 0.98871875, 0.6687291666666667], "label": "a green suitcase"}, {"bbox": [0.7735937500000001, 0.1460625, 1.0, 0.44718749999999996], "label": "a white suitcase"}, {"bbox": [0.682984375, 0.017083333333333332, 0.821078125, 0.2241041666666667], "label": "a green suitcase"}], "image_id": "270274"}, "560": {"caption": "a photo of a blue sandwich and a brown sandwich and a yellow wine glass and a green dining table ", "segment": [{"bbox": [0.182890625, 0.4655416666666667, 0.5536875, 0.8950625], "label": "a blue sandwich"}, {"bbox": [0.259546875, 0.38839583333333333, 0.657296875, 0.7367083333333333], "label": "a brown sandwich"}, {"bbox": [0.61825, 0.0033750000000000004, 0.8513437500000001, 0.375], "label": "a yellow wine glass"}, {"bbox": [0.001953125, 0.0051875, 0.9993437500000001, 0.9870208333333333], "label": "a green dining table"}], "image_id": "361901"}, "561": {"caption": "a photo of a green orange and a red wine glass and a white spoon and a green dining table ", "segment": [{"bbox": [0.35238493723849373, 0.548921875, 0.5602510460251047, 0.7065625], "label": "a green orange"}, {"bbox": [0.005230125523012552, 0.00153125, 0.2666317991631799, 0.2589375], "label": "a red wine glass"}, {"bbox": [0.1342050209205021, 0.006828125, 0.28328451882845196, 0.1411875], "label": "a white spoon"}, {"bbox": [0.0, 0.00225, 0.9989121338912135, 0.986515625], "label": "a green dining table"}], "image_id": "209431"}, "562": {"caption": "a photo of a red teddy bear and a brown teddy bear and a black teddy bear and a black teddy bear and a yellow teddy bear and a brown teddy bear ", "segment": [{"bbox": [0.6243529411764707, 0.37378125, 0.8261647058823529, 0.55278125], "label": "a red teddy bear"}, {"bbox": [0.38915294117647053, 0.365921875, 0.5786588235294118, 0.5546875], "label": "a brown teddy bear"}, {"bbox": [0.4406117647058823, 0.58915625, 0.6013176470588235, 0.754734375], "label": "a black teddy bear"}, {"bbox": [0.8288941176470588, 0.5951875, 0.9904705882352941, 0.75228125], "label": "a black teddy bear"}, {"bbox": [0.5369882352941177, 0.491296875, 0.6887058823529412, 0.652703125], "label": "a yellow teddy bear"}, {"bbox": [0.5984235294117647, 0.5986875, 0.7834823529411765, 0.7280468750000001], "label": "a brown teddy bear"}], "image_id": "580284"}, "563": {"caption": "a photo of a black bed and a white suitcase and a blue suitcase and a brown suitcase ", "segment": [{"bbox": [0.7980769230769231, 0.34932, 1.0, 0.9745999999999999], "label": "a black bed"}, {"bbox": [0.19153846153846152, 0.6858, 0.7310650887573965, 0.82664], "label": "a white suitcase"}, {"bbox": [0.23724852071005917, 0.59014, 0.6990532544378698, 0.72466], "label": "a blue suitcase"}, {"bbox": [0.15588757396449704, 0.8094199999999999, 0.7562426035502958, 0.9461799999999999], "label": "a brown suitcase"}], "image_id": "49567"}, "564": {"caption": "a photo of a red potted plant and a blue cat and a blue laptop and a green mouse ", "segment": [{"bbox": [0.0168125, 0.0035833333333333333, 0.248875, 0.35335416666666664], "label": "a red potted plant"}, {"bbox": [0.04203125, 0.10883333333333334, 0.984375, 0.7489166666666667], "label": "a blue cat"}, {"bbox": [0.0, 0.48539583333333336, 0.43314062499999995, 0.9213541666666667], "label": "a blue laptop"}, {"bbox": [0.44387499999999996, 0.5922291666666666, 0.8246249999999999, 0.8230833333333333], "label": "a green mouse"}], "image_id": "493295"}, "565": {"caption": "a photo of a black banana and a yellow orange and a black orange and a yellow broccoli and a blue orange ", "segment": [{"bbox": [0.6076235294117647, 0.4403900709219858, 0.775364705882353, 0.662304964539007], "label": "a black banana"}, {"bbox": [0.6056235294117647, 0.728758865248227, 0.7511764705882353, 0.9693262411347519], "label": "a yellow orange"}, {"bbox": [0.4636941176470588, 0.7764539007092199, 0.6213647058823529, 0.985886524822695], "label": "a black orange"}, {"bbox": [0.43268235294117646, 0.4271631205673759, 0.6616941176470588, 0.7013829787234043], "label": "a yellow broccoli"}, {"bbox": [0.3326352941176471, 0.7071276595744681, 0.49463529411764706, 0.9149290780141843], "label": "a blue orange"}], "image_id": "90724"}, "566": {"caption": "a photo of a blue sandwich and a yellow dining table and a white cup and a white bowl and a blue cup and a black sandwich ", "segment": [{"bbox": [0.315171875, 0.4330208333333333, 0.9572968749999999, 0.842], "label": "a blue sandwich"}, {"bbox": [0.0, 0.003958333333333333, 1.0, 0.983625], "label": "a yellow dining table"}, {"bbox": [0.763484375, 0.0, 1.0, 0.298875], "label": "a white cup"}, {"bbox": [0.08595312499999999, 0.2471875, 0.43314062499999995, 0.6539375], "label": "a white bowl"}, {"bbox": [0.007921875, 0.0, 0.23859375, 0.23814583333333333], "label": "a blue cup"}, {"bbox": [0.397640625, 0.16839583333333333, 0.8064843750000001, 0.47462499999999996], "label": "a black sandwich"}], "image_id": "441672"}, "567": {"caption": "a photo of a black horse and a red horse and a blue horse and a brown horse and a green vase ", "segment": [{"bbox": [0.05645312500000001, 0.21685416666666668, 0.57903125, 0.8017916666666667], "label": "a black horse"}, {"bbox": [0.412171875, 0.17350000000000002, 0.65625, 0.8071041666666666], "label": "a red horse"}, {"bbox": [0.288203125, 0.18427083333333333, 0.8662968750000001, 0.9617916666666666], "label": "a blue horse"}, {"bbox": [0.6929531250000001, 0.20379166666666665, 0.9161093749999999, 0.6109583333333333], "label": "a brown horse"}, {"bbox": [0.006734374999999999, 0.0, 0.9522499999999999, 0.9662916666666667], "label": "a green vase"}], "image_id": "348488"}, "568": {"caption": "a photo of a red carrot and a red carrot and a brown carrot and a red carrot and a black carrot ", "segment": [{"bbox": [0.168671875, 0.3952916666666667, 0.301828125, 0.5212291666666666], "label": "a red carrot"}, {"bbox": [0.60046875, 0.5046666666666667, 0.8577031250000001, 0.7493958333333334], "label": "a red carrot"}, {"bbox": [0.5, 0.2669375, 0.7265625, 0.3971458333333333], "label": "a brown carrot"}, {"bbox": [0.15, 0.5082916666666667, 0.40325000000000005, 0.8615416666666665], "label": "a red carrot"}, {"bbox": [0.20806249999999998, 0.8496041666666667, 0.39940625, 1.0], "label": "a black carrot"}], "image_id": "130171"}, "569": {"caption": "a photo of a brown cat and a yellow cat and a yellow bed and a black suitcase ", "segment": [{"bbox": [0.45976, 0.27312312312312315, 0.7261599999999999, 0.6774174174174173], "label": "a brown cat"}, {"bbox": [0.24348, 0.24087087087087086, 0.56574, 0.6881681681681681], "label": "a yellow cat"}, {"bbox": [0.0044800000000000005, 0.006366366366366367, 0.5148400000000001, 0.9861561561561561], "label": "a yellow bed"}, {"bbox": [0.19008, 0.23594594594594592, 0.8201600000000001, 0.8247147147147147], "label": "a black suitcase"}], "image_id": "220292"}, "570": {"caption": "a photo of a blue bird and a red bird and a red bird and a blue giraffe ", "segment": [{"bbox": [0.3607764705882353, 0.43745312500000005, 0.5096705882352941, 0.672953125], "label": "a blue bird"}, {"bbox": [0.5003294117647058, 0.6192968750000001, 0.6603999999999999, 0.8471875000000001], "label": "a red bird"}, {"bbox": [0.5358352941176471, 0.040984375, 0.756235294117647, 0.25917187499999994], "label": "a red bird"}, {"bbox": [0.09936470588235294, 0.0, 0.8889176470588236, 1.0], "label": "a blue giraffe"}], "image_id": "40926"}, "571": {"caption": "a photo of a green chair and a green umbrella and a red umbrella and a blue umbrella and a black chair ", "segment": [{"bbox": [0.780453125, 0.48472916666666666, 0.97171875, 0.6481458333333333], "label": "a green chair"}, {"bbox": [0.514453125, 0.3288125, 0.810359375, 0.7045625000000001], "label": "a green umbrella"}, {"bbox": [0.20964062499999997, 0.3271875, 0.540578125, 0.7013958333333333], "label": "a red umbrella"}, {"bbox": [0.7284843750000001, 0.34143749999999995, 0.9497656250000001, 0.5949583333333333], "label": "a blue umbrella"}, {"bbox": [0.262453125, 0.4722708333333333, 0.42996875, 0.6130208333333333], "label": "a black chair"}], "image_id": "66038"}, "572": {"caption": "a photo of a blue fork and a green sandwich and a blue bowl and a brown bowl and a brown bowl and a red cake ", "segment": [{"bbox": [0.0016875000000000002, 0.32066666666666666, 0.288203125, 0.749875], "label": "a blue fork"}, {"bbox": [0.5022031250000001, 0.0734375, 0.7625468750000001, 0.47295833333333337], "label": "a green sandwich"}, {"bbox": [0.25193750000000004, 0.18735416666666668, 0.5302187500000001, 0.4813125], "label": "a blue bowl"}, {"bbox": [0.755046875, 0.17039583333333336, 0.97196875, 0.4305], "label": "a brown bowl"}, {"bbox": [0.3818125, 0.5212916666666667, 0.55909375, 0.770625], "label": "a brown bowl"}, {"bbox": [0.625328125, 0.43816666666666665, 0.9448124999999999, 0.5732291666666666], "label": "a red cake"}], "image_id": "104589"}, "573": {"caption": "a photo of a brown chair and a blue chair and a red couch and a brown dining table and a green potted plant ", "segment": [{"bbox": [0.591, 0.4992266666666667, 0.7219, 0.75744], "label": "a brown chair"}, {"bbox": [0.74514, 0.5026933333333333, 0.87312, 0.7575466666666666], "label": "a blue chair"}, {"bbox": [0.0048200000000000005, 0.7094400000000001, 0.32671999999999995, 0.9884000000000001], "label": "a red couch"}, {"bbox": [0.6329, 0.5342133333333333, 0.9999199999999999, 0.75792], "label": "a brown dining table"}, {"bbox": [0.16219999999999998, 0.47533333333333333, 0.30804, 0.6163466666666667], "label": "a green potted plant"}], "image_id": "56108"}, "574": {"caption": "a photo of a brown orange and a white orange and a yellow orange and a white orange ", "segment": [{"bbox": [0.46686, 0.5782300884955752, 0.6776, 0.774646017699115], "label": "a brown orange"}, {"bbox": [0.35116, 0.30254424778761063, 0.55744, 0.498141592920354], "label": "a white orange"}, {"bbox": [0.29431999999999997, 0.4840929203539823, 0.50914, 0.7328097345132744], "label": "a yellow orange"}, {"bbox": [0.50354, 0.37369469026548674, 0.68818, 0.5912389380530974], "label": "a white orange"}], "image_id": "462639"}, "575": {"caption": "a photo of a blue cat and a yellow laptop and a red cat and a blue bed ", "segment": [{"bbox": [0.025656250000000002, 0.5086284289276808, 0.24576562500000004, 0.9073316708229427], "label": "a blue cat"}, {"bbox": [0.156640625, 0.061945137157107234, 0.9229062500000002, 0.9673316708229426], "label": "a yellow laptop"}, {"bbox": [0.8241250000000001, 0.05967581047381546, 0.9680625, 0.7060847880299251], "label": "a red cat"}, {"bbox": [0.0, 0.427930174563591, 1.0, 1.0], "label": "a blue bed"}], "image_id": "423742"}, "576": {"caption": "a photo of a white giraffe and a blue giraffe and a yellow giraffe and a blue giraffe ", "segment": [{"bbox": [0.48790625, 0.24644859813084113, 0.7954375, 0.6836915887850468], "label": "a white giraffe"}, {"bbox": [0.3744375, 0.3322196261682243, 0.5646718749999999, 0.6092289719626168], "label": "a blue giraffe"}, {"bbox": [0.187015625, 0.25759345794392524, 0.43984375, 0.6535747663551402], "label": "a yellow giraffe"}, {"bbox": [0.270984375, 0.3289252336448598, 0.470734375, 0.6138084112149533], "label": "a blue giraffe"}], "image_id": "482626"}, "577": {"caption": "a photo of a black airplane and a green airplane and a red truck and a yellow truck ", "segment": [{"bbox": [0.013203125, 0.0988755980861244, 0.8380625, 0.4449521531100479], "label": "a black airplane"}, {"bbox": [0.71075, 0.13964114832535884, 1.0, 0.293133971291866], "label": "a green airplane"}, {"bbox": [0.3685, 0.5106937799043062, 0.60225, 0.6654545454545454], "label": "a red truck"}, {"bbox": [0.12553125, 0.4930622009569378, 0.58865625, 0.8333253588516746], "label": "a yellow truck"}], "image_id": "8180"}, "578": {"caption": "a photo of a yellow dining table and a black wine glass and a brown wine glass and a blue wine glass and a red fork ", "segment": [{"bbox": [0.0, 0.26689999999999997, 1.0, 0.98536], "label": "a yellow dining table"}, {"bbox": [0.40327999999999997, 0.0869, 0.6402666666666667, 0.48754], "label": "a black wine glass"}, {"bbox": [0.011653333333333333, 0.08562, 0.3012, 0.57498], "label": "a brown wine glass"}, {"bbox": [0.7238133333333333, 0.08052, 0.9697066666666666, 0.47012], "label": "a blue wine glass"}, {"bbox": [0.31293333333333334, 0.47062, 0.8592266666666668, 0.65058], "label": "a red fork"}], "image_id": "450202"}, "579": {"caption": "a photo of a white bowl and a yellow broccoli and a blue broccoli and a yellow broccoli and a red broccoli and a yellow broccoli ", "segment": [{"bbox": [0.037828125000000004, 0.0, 1.0, 0.9841217798594848], "label": "a white bowl"}, {"bbox": [0.24876562500000002, 0.6661592505854801, 0.406625, 0.8580562060889929], "label": "a yellow broccoli"}, {"bbox": [0.515171875, 0.7882903981264637, 0.7702031249999999, 0.9638407494145199], "label": "a blue broccoli"}, {"bbox": [0.717421875, 0.21646370023419206, 0.9748749999999999, 0.5811709601873536], "label": "a yellow broccoli"}, {"bbox": [0.803890625, 0.6744964871194379, 0.949921875, 0.8491803278688526], "label": "a red broccoli"}, {"bbox": [0.128125, 0.0234192037470726, 0.9984375, 0.9437939110070258], "label": "a yellow broccoli"}], "image_id": "298691"}, "580": {"caption": "a photo of a green dining table and a yellow cup and a blue cup and a red fork and a green carrot and a green bowl ", "segment": [{"bbox": [0.0, 0.01038, 1.0, 0.98702], "label": "a green dining table"}, {"bbox": [0.0, 0.13912, 0.24757333333333334, 0.47022], "label": "a yellow cup"}, {"bbox": [0.049626666666666666, 0.020579999999999998, 0.3073066666666667, 0.29474], "label": "a blue cup"}, {"bbox": [0.44144, 0.6520199999999999, 0.6066133333333333, 0.9898599999999999], "label": "a red fork"}, {"bbox": [0.25434666666666667, 0.6162000000000001, 0.4808533333333333, 0.75944], "label": "a green carrot"}, {"bbox": [0.84128, 0.0005600000000000001, 0.9997066666666666, 0.17518], "label": "a green bowl"}], "image_id": "419312"}, "581": {"caption": "a photo of a yellow dining table and a green laptop and a yellow banana and a green banana and a yellow banana and a brown cell phone ", "segment": [{"bbox": [0.0015, 0.004637002341920374, 0.9985312500000001, 0.9821779859484778], "label": "a yellow dining table"}, {"bbox": [0.0, 0.0022482435597189696, 0.4078125, 0.8808899297423888], "label": "a green laptop"}, {"bbox": [0.456265625, 0.09192037470725996, 0.7614375, 0.8766744730679157], "label": "a yellow banana"}, {"bbox": [0.3958125, 0.15730679156908667, 0.622203125, 0.9078688524590165], "label": "a green banana"}, {"bbox": [0.284859375, 0.16629976580796255, 0.500765625, 0.9033723653395784], "label": "a yellow banana"}, {"bbox": [0.778390625, 0.578688524590164, 0.924140625, 0.9029976580796253], "label": "a brown cell phone"}], "image_id": "427666"}, "582": {"caption": "a photo of a yellow cat and a green bed and a red teddy bear and a black teddy bear and a red teddy bear ", "segment": [{"bbox": [0.34194, 0.30751999999999996, 0.6548399999999999, 0.6516], "label": "a yellow cat"}, {"bbox": [0.0016799999999999999, 0.00224, 1.0, 0.9887733333333333], "label": "a green bed"}, {"bbox": [0.58784, 0.26576, 0.83108, 0.5090133333333333], "label": "a red teddy bear"}, {"bbox": [0.22053999999999999, 0.18450666666666665, 0.63786, 0.4176266666666667], "label": "a black teddy bear"}, {"bbox": [0.1354, 0.28914666666666666, 0.45384, 0.7943999999999999], "label": "a red teddy bear"}], "image_id": "434996"}, "583": {"caption": "a photo of a white laptop and a brown cup and a brown cup and a green laptop and a black donut and a yellow donut ", "segment": [{"bbox": [0.0016875000000000002, 0.0022500000000000003, 0.47528125, 0.43820833333333337], "label": "a white laptop"}, {"bbox": [0.0, 0.3524791666666667, 0.34965625, 0.8344583333333333], "label": "a brown cup"}, {"bbox": [0.655671875, 0.29083333333333333, 1.0, 0.724875], "label": "a brown cup"}, {"bbox": [0.625, 0.0045000000000000005, 1.0, 0.28379166666666666], "label": "a green laptop"}, {"bbox": [0.3970625, 0.7526666666666666, 0.7399687500000001, 0.9879583333333333], "label": "a black donut"}, {"bbox": [0.36067187500000003, 0.21572916666666667, 0.57303125, 0.4561875], "label": "a yellow donut"}], "image_id": "487548"}, "584": {"caption": "a photo of a brown tv and a blue chair and a black chair and a green couch and a white couch and a brown dining table ", "segment": [{"bbox": [0.2465, 0.11218750000000001, 0.423546875, 0.27077083333333335], "label": "a brown tv"}, {"bbox": [0.132265625, 0.4516041666666667, 0.3419375, 0.7290416666666667], "label": "a blue chair"}, {"bbox": [0.801796875, 0.5420208333333334, 1.0, 0.8222083333333334], "label": "a black chair"}, {"bbox": [0.34826562499999997, 0.4931041666666667, 0.770296875, 0.8586874999999999], "label": "a green couch"}, {"bbox": [0.45931249999999996, 0.3471041666666667, 0.7178749999999999, 0.5419583333333333], "label": "a white couch"}, {"bbox": [0.586875, 0.7961041666666666, 1.0, 0.9852291666666666], "label": "a brown dining table"}], "image_id": "104801"}, "585": {"caption": "a photo of a white sheep and a green sheep and a brown sheep and a yellow sheep and a green sheep ", "segment": [{"bbox": [0.577015625, 0.2638679245283019, 1.0, 0.6359198113207547], "label": "a white sheep"}, {"bbox": [0.418875, 0.2860141509433962, 0.59553125, 0.7225707547169812], "label": "a green sheep"}, {"bbox": [0.05840625000000001, 0.3953301886792453, 0.44309374999999995, 0.6641509433962265], "label": "a brown sheep"}, {"bbox": [0.5404687499999999, 0.32334905660377355, 0.713421875, 0.6383254716981132], "label": "a yellow sheep"}, {"bbox": [0.0, 0.1957547169811321, 0.9984375, 0.7429245283018868], "label": "a green sheep"}], "image_id": "468933"}, "586": {"caption": "a photo of a yellow car and a blue bus and a brown car and a brown truck ", "segment": [{"bbox": [0.585359375, 0.604192037470726, 0.7957656249999999, 0.7740749414519907], "label": "a yellow car"}, {"bbox": [0.396703125, 0.4650819672131148, 0.6266093749999999, 0.7128337236533958], "label": "a blue bus"}, {"bbox": [0.25579687500000003, 0.567400468384075, 0.455703125, 0.7775409836065573], "label": "a brown car"}, {"bbox": [0.67284375, 0.5754332552693209, 0.817796875, 0.7131147540983607], "label": "a brown truck"}], "image_id": "26204"}, "587": {"caption": "a photo of a white sandwich and a black sandwich and a black bottle and a green sandwich and a black sandwich and a blue cup ", "segment": [{"bbox": [0.042140625, 0.38202083333333337, 0.364046875, 0.7887708333333333], "label": "a white sandwich"}, {"bbox": [0.58184375, 0.31077083333333333, 0.9417031250000001, 0.6695], "label": "a black sandwich"}, {"bbox": [0.764546875, 0.0, 1.0, 0.33847916666666666], "label": "a black bottle"}, {"bbox": [0.173171875, 0.26485416666666667, 0.4363125, 0.5121249999999999], "label": "a green sandwich"}, {"bbox": [0.5099843749999999, 0.21041666666666667, 0.73784375, 0.4414375], "label": "a black sandwich"}, {"bbox": [0.136109375, 0.0003958333333333333, 0.297109375, 0.1711458333333333], "label": "a blue cup"}], "image_id": "43944"}, "588": {"caption": "a photo of a yellow bottle and a black spoon and a blue carrot and a black carrot ", "segment": [{"bbox": [0.1224381625441696, 0.22794811320754718, 0.6444169611307421, 0.6602122641509434], "label": "a yellow bottle"}, {"bbox": [0.5959363957597174, 0.2876415094339623, 0.9191519434628975, 0.7595518867924529], "label": "a black spoon"}, {"bbox": [0.07597173144876325, 0.01813679245283019, 1.0, 0.6416981132075471], "label": "a blue carrot"}, {"bbox": [0.0, 0.5012971698113208, 0.83886925795053, 0.9518160377358492], "label": "a black carrot"}], "image_id": "531875"}, "589": {"caption": "a photo of a black broccoli and a black broccoli and a black broccoli and a green broccoli and a black broccoli and a blue broccoli ", "segment": [{"bbox": [0.24470833333333333, 0.64940625, 0.5772499999999999, 0.9764687500000001], "label": "a black broccoli"}, {"bbox": [0.041937499999999996, 0.63109375, 0.32658333333333334, 0.9906406249999999], "label": "a black broccoli"}, {"bbox": [0.6964791666666666, 0.601640625, 1.0, 0.9239843750000001], "label": "a black broccoli"}, {"bbox": [0.34160416666666665, 0.808578125, 0.733375, 1.0], "label": "a green broccoli"}, {"bbox": [0.7652916666666666, 0.4094375, 1.0, 0.6894843749999999], "label": "a black broccoli"}, {"bbox": [0.6726666666666666, 0.820953125, 0.9038958333333333, 0.9876093749999999], "label": "a blue broccoli"}], "image_id": "38294"}, "590": {"caption": "a photo of a white cat and a blue couch and a blue remote and a red remote ", "segment": [{"bbox": [0.14371875, 0.06788659793814433, 0.716, 0.5808247422680413], "label": "a white cat"}, {"bbox": [0.0026093749999999997, 0.004304123711340206, 0.999984375, 0.9892525773195877], "label": "a blue couch"}, {"bbox": [0.546921875, 0.43175257731958766, 0.91290625, 0.7571907216494846], "label": "a blue remote"}, {"bbox": [0.41371874999999997, 0.793917525773196, 0.890265625, 0.9876030927835053], "label": "a red remote"}], "image_id": "499226"}, "591": {"caption": "a photo of a white cup and a red fork and a yellow dining table and a brown fork and a yellow knife and a yellow spoon ", "segment": [{"bbox": [0.241796875, 0.3760655737704918, 0.37165625, 0.6131850117096019], "label": "a white cup"}, {"bbox": [0.0, 0.6381967213114754, 0.33584375, 0.7820140515222481], "label": "a red fork"}, {"bbox": [0.0, 0.30269320843091335, 1.0, 0.9887822014051522], "label": "a yellow dining table"}, {"bbox": [0.784390625, 0.39711943793911003, 0.9106406249999999, 0.5796487119437939], "label": "a brown fork"}, {"bbox": [0.34075, 0.6699765807962529, 0.560640625, 0.8702576112412177], "label": "a yellow knife"}, {"bbox": [0.342703125, 0.6740046838407494, 0.562625, 0.8732552693208431], "label": "a yellow spoon"}], "image_id": "158005"}, "592": {"caption": "a photo of a brown dog and a yellow dog and a red dog and a brown frisbee and a green dog ", "segment": [{"bbox": [0.0, 0.27239583333333334, 0.5136406250000001, 0.9855208333333334], "label": "a brown dog"}, {"bbox": [0.543546875, 0.20429166666666668, 1.0, 0.7871041666666667], "label": "a yellow dog"}, {"bbox": [0.854328125, 0.0, 1.0, 0.2232916666666667], "label": "a red dog"}, {"bbox": [0.4455, 0.23791666666666667, 0.5962500000000001, 0.37654166666666666], "label": "a brown frisbee"}, {"bbox": [0.44973437499999996, 0.0, 0.6131249999999999, 0.27318749999999997], "label": "a green dog"}], "image_id": "161220"}, "593": {"caption": "a photo of a blue umbrella and a yellow chair and a red chair and a brown chair ", "segment": [{"bbox": [0.43757812500000004, 0.5729791666666666, 0.607703125, 0.7108541666666667], "label": "a blue umbrella"}, {"bbox": [0.1295625, 0.7054166666666667, 0.320953125, 0.8543333333333334], "label": "a yellow chair"}, {"bbox": [0.2765, 0.7359166666666667, 0.451328125, 0.8622916666666666], "label": "a red chair"}, {"bbox": [0.41293749999999996, 0.7076041666666666, 0.5568124999999999, 0.8731458333333333], "label": "a brown chair"}], "image_id": "360494"}, "594": {"caption": "a photo of a green cow and a yellow cow and a green cow and a red cow and a blue cow and a yellow cow ", "segment": [{"bbox": [0.6535624999999999, 0.35279166666666667, 0.8494375, 0.71275], "label": "a green cow"}, {"bbox": [0.8733124999999999, 0.055187499999999994, 1.0, 0.9853541666666668], "label": "a yellow cow"}, {"bbox": [0.100359375, 0.2842083333333333, 0.282484375, 0.5065833333333333], "label": "a green cow"}, {"bbox": [0.411546875, 0.4525416666666667, 0.65821875, 0.6887083333333333], "label": "a red cow"}, {"bbox": [0.21795312500000003, 0.4427083333333333, 0.4800625, 0.6737708333333333], "label": "a blue cow"}, {"bbox": [0.076890625, 0.43233333333333335, 0.32534375, 0.6731458333333333], "label": "a yellow cow"}], "image_id": "231758"}, "595": {"caption": "a photo of a blue chair and a red skis and a white skis and a blue skis and a brown skis and a yellow skis ", "segment": [{"bbox": [0.26966666666666667, 0.084703125, 0.8749166666666667, 0.9723437500000001], "label": "a blue chair"}, {"bbox": [0.6406875, 0.142859375, 0.8623333333333333, 0.66234375], "label": "a red skis"}, {"bbox": [0.4017291666666667, 0.096109375, 0.5645000000000001, 0.789609375], "label": "a white skis"}, {"bbox": [0.5386875, 0.07809374999999999, 0.7073333333333333, 0.644421875], "label": "a blue skis"}, {"bbox": [0.122625, 0.108375, 0.2981666666666667, 0.5246406250000001], "label": "a brown skis"}, {"bbox": [0.35783333333333334, 0.141078125, 0.4907708333333333, 0.64228125], "label": "a yellow skis"}], "image_id": "233430"}, "596": {"caption": "a photo of a green dining table and a red bowl and a brown bowl and a yellow bowl and a white bowl and a white cup ", "segment": [{"bbox": [0.0016875000000000002, 0.0, 0.9943750000000001, 0.9617916666666667], "label": "a green dining table"}, {"bbox": [0.532015625, 0.5924999999999999, 0.75953125, 0.8563749999999999], "label": "a red bowl"}, {"bbox": [0.199671875, 0.12102083333333334, 0.382546875, 0.35368750000000004], "label": "a brown bowl"}, {"bbox": [0.0, 0.13497916666666668, 0.192140625, 0.3574583333333334], "label": "a yellow bowl"}, {"bbox": [0.777203125, 0.05508333333333334, 1.0, 0.31445833333333334], "label": "a white bowl"}, {"bbox": [0.682359375, 0.0, 0.8210625, 0.1615625], "label": "a white cup"}], "image_id": "211177"}, "597": {"caption": "a photo of a blue giraffe and a yellow giraffe and a green giraffe and a green giraffe ", "segment": [{"bbox": [0.336375, 0.2387291666666667, 0.466296875, 0.494], "label": "a blue giraffe"}, {"bbox": [0.51290625, 0.24187499999999998, 0.693, 0.4983541666666666], "label": "a yellow giraffe"}, {"bbox": [0.78184375, 0.26091666666666663, 0.92775, 0.49804166666666666], "label": "a green giraffe"}, {"bbox": [0.383234375, 0.2904791666666667, 0.5469062499999999, 0.49295833333333333], "label": "a green giraffe"}], "image_id": "406189"}, "598": {"caption": "a photo of a white couch and a white teddy bear and a green teddy bear and a brown teddy bear and a white teddy bear ", "segment": [{"bbox": [0.0, 0.005375375375375376, 0.9975599999999999, 1.0], "label": "a white couch"}, {"bbox": [0.2895, 0.32096096096096094, 0.6885, 0.9268168168168168], "label": "a white teddy bear"}, {"bbox": [0.58608, 0.14897897897897897, 0.9125, 0.857057057057057], "label": "a green teddy bear"}, {"bbox": [0.06916, 0.27213213213213217, 0.39103999999999994, 0.8903603603603604], "label": "a brown teddy bear"}, {"bbox": [0.31018, 0.02051051051051051, 0.6397200000000001, 0.5373573573573575], "label": "a white teddy bear"}], "image_id": "418578"}, "599": {"caption": "a photo of a green dog and a white bed and a brown teddy bear and a red teddy bear ", "segment": [{"bbox": [0.0143125, 0.13736951983298537, 0.831265625, 0.9172025052192068], "label": "a green dog"}, {"bbox": [0.0, 0.18805845511482255, 1.0, 0.9853653444676409], "label": "a white bed"}, {"bbox": [0.02003125, 0.33906054279749476, 0.15545312500000003, 0.5027766179540709], "label": "a brown teddy bear"}, {"bbox": [0.6631875, 0.18043841336116911, 0.999875, 0.4923590814196242], "label": "a red teddy bear"}], "image_id": "215744"}, "600": {"caption": "a photo of a yellow banana and a white banana and a red banana and a brown banana and a green banana and a green banana ", "segment": [{"bbox": [0.345078125, 0.479672131147541, 0.57903125, 1.0], "label": "a yellow banana"}, {"bbox": [0.21056249999999999, 0.15587822014051522, 0.48187499999999994, 0.5287822014051522], "label": "a white banana"}, {"bbox": [0.1214375, 0.57807962529274, 0.352328125, 0.9758313817330211], "label": "a red banana"}, {"bbox": [0.7258281249999999, 0.20234192037470727, 0.8784374999999999, 0.4322248243559719], "label": "a brown banana"}, {"bbox": [0.539734375, 0.5864871194379391, 0.757515625, 0.7444262295081967], "label": "a green banana"}, {"bbox": [0.4269375, 0.4233489461358314, 0.631734375, 0.5666042154566745], "label": "a green banana"}], "image_id": "473427"}, "601": {"caption": "a photo of a red cat and a green laptop and a blue chair and a blue dining table and a white laptop ", "segment": [{"bbox": [0.40878125, 0.20608333333333334, 0.8108125000000002, 0.9662083333333334], "label": "a red cat"}, {"bbox": [0.08595312499999999, 0.22022916666666664, 0.47021875, 0.8584166666666666], "label": "a green laptop"}, {"bbox": [0.547640625, 0.17029166666666665, 0.8833593750000001, 0.7599374999999999], "label": "a blue chair"}, {"bbox": [0.0, 0.5495208333333333, 0.7053125, 0.9899374999999999], "label": "a blue dining table"}, {"bbox": [0.00046875, 0.1858125, 0.26959375, 0.5674791666666666], "label": "a white laptop"}], "image_id": "55466"}, "602": {"caption": "a photo of a blue backpack and a red suitcase and a green suitcase and a blue dining table ", "segment": [{"bbox": [0.44104687499999995, 0.5796250000000001, 0.8196875, 0.9809791666666666], "label": "a blue backpack"}, {"bbox": [0.47245312500000003, 0.3127083333333333, 0.7071875000000001, 0.7334791666666667], "label": "a red suitcase"}, {"bbox": [0.0016875000000000002, 0.29662499999999997, 0.237640625, 0.7168541666666667], "label": "a green suitcase"}, {"bbox": [0.412984375, 0.16883333333333334, 1.0, 0.42597916666666674], "label": "a blue dining table"}], "image_id": "378506"}, "603": {"caption": "a photo of a blue fork and a yellow broccoli and a white broccoli and a white broccoli and a brown fork and a red dining table ", "segment": [{"bbox": [0.78703125, 0.0024791666666666664, 0.970265625, 0.14697916666666666], "label": "a blue fork"}, {"bbox": [0.181984375, 0.41006250000000005, 0.412515625, 0.6724166666666667], "label": "a yellow broccoli"}, {"bbox": [0.397328125, 0.3269375, 0.5509375000000001, 0.6595], "label": "a white broccoli"}, {"bbox": [0.5170625, 0.44470833333333337, 0.78, 0.64], "label": "a white broccoli"}, {"bbox": [0.5460625, 0.1528125, 0.86965625, 0.4134791666666667], "label": "a brown fork"}, {"bbox": [0.001484375, 0.003916666666666666, 1.0, 0.9995208333333333], "label": "a red dining table"}], "image_id": "231097"}, "604": {"caption": "a photo of a green car and a black truck and a yellow truck and a white truck ", "segment": [{"bbox": [0.79553125, 0.7550521920668058, 1.0, 0.9820250521920668], "label": "a green car"}, {"bbox": [0.66534375, 0.6674739039665971, 0.920703125, 0.8321085594989562], "label": "a black truck"}, {"bbox": [0.00678125, 0.4580584551148225, 0.497265625, 0.8299373695198329], "label": "a yellow truck"}, {"bbox": [0.56278125, 0.5723590814196242, 0.88946875, 0.8232985386221294], "label": "a white truck"}], "image_id": "223574"}, "605": {"caption": "a photo of a white dining table and a blue book and a red book and a brown book and a green book and a white book ", "segment": [{"bbox": [0.0, 0.274625, 0.5543125, 1.0], "label": "a white dining table"}, {"bbox": [0.0, 0.07128124999999999, 0.41466666666666663, 0.36128125], "label": "a blue book"}, {"bbox": [0.22670833333333332, 0.6837187499999999, 0.45558333333333334, 0.8573124999999999], "label": "a red book"}, {"bbox": [0.8599166666666667, 0.112359375, 0.9917499999999999, 0.406734375], "label": "a brown book"}, {"bbox": [0.755375, 0.44684375000000004, 0.9954166666666666, 0.5856562500000001], "label": "a green book"}, {"bbox": [0.6486458333333334, 0.0731875, 0.8169375, 0.213296875], "label": "a white book"}], "image_id": "343680"}, "606": {"caption": "a photo of a blue chair and a brown chair and a red chair and a white dining table and a brown chair and a blue refrigerator ", "segment": [{"bbox": [0.49800000000000005, 0.7061041666666666, 0.6385937500000001, 1.0], "label": "a blue chair"}, {"bbox": [0.648421875, 0.6718125, 0.78296875, 1.0], "label": "a brown chair"}, {"bbox": [0.7735937500000001, 0.6224791666666667, 0.913484375, 0.9662916666666668], "label": "a red chair"}, {"bbox": [0.0, 0.4856458333333334, 0.9652499999999999, 1.0], "label": "a white dining table"}, {"bbox": [0.34375, 0.7487083333333333, 0.5, 0.9882916666666667], "label": "a brown chair"}, {"bbox": [0.0038906250000000004, 0.20260416666666667, 0.17921874999999998, 0.5428541666666666], "label": "a blue refrigerator"}], "image_id": "74209"}, "607": {"caption": "a photo of a brown laptop and a white keyboard and a blue book and a black book ", "segment": [{"bbox": [0.67759375, 0.0022535211267605635, 1.0, 0.7887558685446009], "label": "a brown laptop"}, {"bbox": [0.691109375, 0.00676056338028169, 0.9954375000000001, 0.770281690140845], "label": "a white keyboard"}, {"bbox": [0.28718750000000004, 0.18875586854460094, 0.8002500000000001, 0.9752816901408451], "label": "a blue book"}, {"bbox": [0.002984375, 0.004483568075117371, 0.36198437499999997, 0.8584272300469483], "label": "a black book"}], "image_id": "344831"}, "608": {"caption": "a photo of a yellow dining table and a red cup and a blue knife and a green cup and a yellow cup and a black cup ", "segment": [{"bbox": [0.0015937500000000001, 0.0, 1.0, 0.9887610619469027], "label": "a yellow dining table"}, {"bbox": [0.40787500000000004, 0.09212389380530973, 0.5840468750000001, 0.3280973451327434], "label": "a red cup"}, {"bbox": [0.289546875, 0.5513274336283186, 0.41684374999999996, 0.8416592920353981], "label": "a blue knife"}, {"bbox": [0.337453125, 0.21783185840707964, 0.47828125000000005, 0.41013274336283184], "label": "a green cup"}, {"bbox": [0.03653125, 0.5692477876106194, 0.16699999999999998, 0.7761504424778761], "label": "a yellow cup"}, {"bbox": [0.66340625, 0.0, 0.81734375, 0.12515486725663716], "label": "a black cup"}], "image_id": "384040"}, "609": {"caption": "a photo of a green bottle and a blue refrigerator and a yellow microwave and a black microwave ", "segment": [{"bbox": [0.12143999999999999, 0.08082666666666666, 0.53952, 0.6356533333333333], "label": "a green bottle"}, {"bbox": [0.04014, 0.37829333333333337, 0.32382, 1.0], "label": "a blue refrigerator"}, {"bbox": [0.31998000000000004, 0.47850666666666664, 0.4835, 0.6078666666666667], "label": "a yellow microwave"}, {"bbox": [0.08556, 0.22690666666666667, 0.277, 0.3791466666666667], "label": "a black microwave"}], "image_id": "453302"}, "610": {"caption": "a photo of a brown chair and a blue laptop and a yellow oven and a brown book and a white dining table ", "segment": [{"bbox": [0.13758, 0.7116266666666667, 0.53524, 0.9890399999999999], "label": "a brown chair"}, {"bbox": [0.45, 0.28314666666666666, 0.6893199999999999, 0.5325866666666668], "label": "a blue laptop"}, {"bbox": [0.08262, 0.06232, 0.26165999999999995, 0.35733333333333334], "label": "a yellow oven"}, {"bbox": [0.30384, 0.48618666666666666, 0.61664, 0.66416], "label": "a brown book"}, {"bbox": [0.20063999999999999, 0.28570666666666666, 0.78116, 0.9818133333333333], "label": "a white dining table"}], "image_id": "291981"}, "611": {"caption": "a photo of a red couch and a black chair and a red chair and a green chair and a yellow dining table and a red chair ", "segment": [{"bbox": [0.46596875000000004, 0.3980841121495327, 0.7449687500000001, 0.6088317757009345], "label": "a red couch"}, {"bbox": [0.14650000000000002, 0.43221962616822435, 0.44709374999999996, 1.0], "label": "a black chair"}, {"bbox": [0.42018750000000005, 0.41427570093457944, 0.6388125, 1.0], "label": "a red chair"}, {"bbox": [0.057359375000000004, 0.38317757009345793, 0.21134375, 0.5750467289719626], "label": "a green chair"}, {"bbox": [0.005984375, 0.4811915887850467, 0.53559375, 0.7026869158878505], "label": "a yellow dining table"}, {"bbox": [0.802796875, 0.4036214953271028, 0.9762812499999999, 0.6189252336448597], "label": "a red chair"}], "image_id": "498738"}, "612": {"caption": "a photo of a black spoon and a red broccoli and a black broccoli and a white broccoli and a white broccoli and a red dining table ", "segment": [{"bbox": [0.28796875, 0.06325, 1.0, 0.257625], "label": "a black spoon"}, {"bbox": [0.541984375, 0.4656875, 0.7885625, 0.8597916666666666], "label": "a red broccoli"}, {"bbox": [0.451359375, 0.2109375, 0.7093281250000001, 0.5356041666666668], "label": "a black broccoli"}, {"bbox": [0.1938125, 0.305625, 0.365734375, 0.496625], "label": "a white broccoli"}, {"bbox": [0.297640625, 0.642, 0.490921875, 0.8768125], "label": "a white broccoli"}, {"bbox": [0.0, 0.0, 1.0, 0.9820625], "label": "a red dining table"}], "image_id": "311385"}, "613": {"caption": "a photo of a yellow zebra and a brown zebra and a red zebra and a yellow zebra and a yellow zebra ", "segment": [{"bbox": [0.1449375, 0.19325, 0.8020625000000001, 0.9452291666666667], "label": "a yellow zebra"}, {"bbox": [0.08240625, 0.17264583333333333, 0.35314062500000004, 0.5874375000000001], "label": "a brown zebra"}, {"bbox": [0.0, 0.20135416666666667, 0.14965625, 0.6699583333333334], "label": "a red zebra"}, {"bbox": [0.17281249999999998, 0.009166666666666667, 0.384234375, 0.19485416666666666], "label": "a yellow zebra"}, {"bbox": [0.635390625, 0.098875, 0.918546875, 0.5617916666666666], "label": "a yellow zebra"}], "image_id": "559294"}, "614": {"caption": "a photo of a green bowl and a yellow broccoli and a black broccoli and a brown broccoli and a red broccoli and a green broccoli ", "segment": [{"bbox": [0.0, 0.019741176470588238, 0.9975781250000001, 0.9973176470588235], "label": "a green bowl"}, {"bbox": [0.053000000000000005, 0.09647058823529411, 0.819953125, 0.821835294117647], "label": "a yellow broccoli"}, {"bbox": [0.11690624999999999, 0.7068, 0.562734375, 0.9861411764705883], "label": "a black broccoli"}, {"bbox": [0.6734218750000001, 0.5049411764705882, 0.96646875, 0.8124470588235293], "label": "a brown broccoli"}, {"bbox": [0.5325, 0.5448, 0.8034531250000001, 0.8679294117647058], "label": "a red broccoli"}, {"bbox": [0.771875, 0.7800235294117647, 0.9587031249999999, 1.0], "label": "a green broccoli"}], "image_id": "284681"}, "615": {"caption": "a photo of a black dining table and a yellow bottle and a white bowl and a white sandwich and a brown wine glass ", "segment": [{"bbox": [0.012296875, 0.0025625, 1.0, 0.9838333333333333], "label": "a black dining table"}, {"bbox": [0.73246875, 0.0051875, 0.8649374999999999, 0.18960416666666666], "label": "a yellow bottle"}, {"bbox": [0.49632812499999995, 0.3394375, 0.9954062499999999, 0.9796458333333333], "label": "a white bowl"}, {"bbox": [0.003078125, 0.39931249999999996, 0.41950000000000004, 0.8869583333333334], "label": "a white sandwich"}, {"bbox": [0.361953125, 0.0, 0.567390625, 0.16570833333333335], "label": "a brown wine glass"}], "image_id": "18575"}, "616": {"caption": "a photo of a yellow chair and a green bowl and a white wine glass and a white spoon and a yellow carrot and a green fork ", "segment": [{"bbox": [0.3555439330543933, 0.00225, 0.988765690376569, 0.154953125], "label": "a yellow chair"}, {"bbox": [0.3550418410041841, 0.791015625, 0.7702510460251046, 0.9887656249999999], "label": "a green bowl"}, {"bbox": [0.7043305439330544, 0.430984375, 0.9797698744769875, 0.7096406249999999], "label": "a white wine glass"}, {"bbox": [0.0, 0.7230624999999999, 0.4479288702928871, 0.86303125], "label": "a white spoon"}, {"bbox": [0.091255230125523, 0.55771875, 0.4217364016736402, 0.701828125], "label": "a yellow carrot"}, {"bbox": [0.14738493723849372, 0.8366093749999999, 0.30947698744769875, 0.9995937500000001], "label": "a green fork"}], "image_id": "550702"}, "617": {"caption": "a photo of a white umbrella and a black umbrella and a brown umbrella and a yellow umbrella and a yellow umbrella ", "segment": [{"bbox": [0.789640625, 0.5615420560747664, 0.927609375, 0.8630607476635513], "label": "a white umbrella"}, {"bbox": [0.7440625, 0.07771028037383178, 0.870578125, 0.47408878504672897], "label": "a black umbrella"}, {"bbox": [0.66521875, 0.33116822429906545, 0.7947656249999999, 0.8659579439252336], "label": "a brown umbrella"}, {"bbox": [0.566328125, 0.33897196261682244, 0.741046875, 0.8659813084112149], "label": "a yellow umbrella"}, {"bbox": [0.5015625, 0.16016355140186916, 0.67396875, 0.3580841121495327], "label": "a yellow umbrella"}], "image_id": "288000"}, "618": {"caption": "a photo of a yellow banana and a white bowl and a red apple and a white pizza and a brown pizza and a white apple ", "segment": [{"bbox": [0.57640625, 0.1415833333333333, 0.994375, 0.7550625], "label": "a yellow banana"}, {"bbox": [0.572265625, 0.3945416666666667, 0.888671875, 0.9570416666666667], "label": "a white bowl"}, {"bbox": [0.5882968749999999, 0.5509583333333333, 0.849546875, 0.9419583333333333], "label": "a red apple"}, {"bbox": [0.12809375, 0.2674166666666667, 0.461796875, 0.5191041666666667], "label": "a white pizza"}, {"bbox": [0.1938125, 0.16629166666666664, 0.510671875, 0.4134791666666667], "label": "a brown pizza"}, {"bbox": [0.611375, 0.4325833333333333, 0.8213593749999999, 0.5771666666666666], "label": "a white apple"}], "image_id": "113589"}, "619": {"caption": "a photo of a green chair and a blue chair and a white chair and a blue dining table and a yellow chair ", "segment": [{"bbox": [0.1313, 0.47855, 0.29525999999999997, 0.6853999999999999], "label": "a green chair"}, {"bbox": [0.47252, 0.41442500000000004, 0.6538399999999999, 0.5985], "label": "a blue chair"}, {"bbox": [0.04736, 0.7187, 0.26630000000000004, 0.971025], "label": "a white chair"}, {"bbox": [0.12018000000000001, 0.52045, 0.62062, 0.836575], "label": "a blue dining table"}, {"bbox": [0.6982200000000001, 0.132175, 0.9224600000000001, 0.44325000000000003], "label": "a yellow chair"}], "image_id": "549351"}, "620": {"caption": "a photo of a yellow dining table and a yellow wine glass and a blue wine glass and a black sandwich ", "segment": [{"bbox": [0.0, 0.024354166666666666, 1.0, 0.9883958333333334], "label": "a yellow dining table"}, {"bbox": [0.68075, 0.07770833333333332, 0.9391875000000001, 0.8186875], "label": "a yellow wine glass"}, {"bbox": [0.5965625, 0.0019166666666666668, 0.75503125, 0.42916666666666664], "label": "a blue wine glass"}, {"bbox": [0.23595312499999999, 0.43145833333333333, 0.6825781249999999, 0.8516875], "label": "a black sandwich"}], "image_id": "163589"}, "621": {"caption": "a photo of a black knife and a yellow knife and a red knife and a yellow knife and a black knife and a black broccoli ", "segment": [{"bbox": [0.0015, 0.5, 0.612, 0.9819819819819819], "label": "a black knife"}, {"bbox": [0.40876, 0.5370570570570571, 0.67658, 0.9867867867867869], "label": "a yellow knife"}, {"bbox": [0.6974199999999999, 0.5640540540540541, 0.99974, 0.9887687687687687], "label": "a red knife"}, {"bbox": [0.7281599999999999, 0.5226726726726727, 1.0, 0.816006006006006], "label": "a yellow knife"}, {"bbox": [0.7263200000000001, 0.26255255255255255, 1.0, 0.49930930930930933], "label": "a black knife"}, {"bbox": [0.41931999999999997, 0.05546546546546546, 0.68542, 0.5047747747747748], "label": "a black broccoli"}], "image_id": "543322"}, "622": {"caption": "a photo of a black boat and a blue boat and a green boat and a green boat and a black boat ", "segment": [{"bbox": [0.067578125, 0.504978448275862, 0.333671875, 1.0], "label": "a black boat"}, {"bbox": [0.32984375, 0.5337931034482759, 1.0, 0.9301724137931034], "label": "a blue boat"}, {"bbox": [0.318609375, 0.7103232758620689, 0.702234375, 0.9950646551724137], "label": "a green boat"}, {"bbox": [0.524546875, 0.41620689655172416, 0.7352187499999999, 0.5522198275862069], "label": "a green boat"}, {"bbox": [0.312984375, 0.37103448275862067, 0.4815781250000001, 0.49734913793103447], "label": "a black boat"}], "image_id": "419281"}, "623": {"caption": "a photo of a blue hot dog and a green cup and a green hot dog and a white hot dog and a green hot dog and a yellow cup ", "segment": [{"bbox": [0.044765624999999996, 0.6449411764705882, 0.6043749999999999, 0.9415764705882353], "label": "a blue hot dog"}, {"bbox": [0.1343125, 0.0015529411764705883, 0.414859375, 0.5543764705882352], "label": "a green cup"}, {"bbox": [0.5303125, 0.3304470588235294, 0.9688749999999999, 0.651270588235294], "label": "a green hot dog"}, {"bbox": [0.4525625, 0.35150588235294117, 0.85534375, 0.693435294117647], "label": "a white hot dog"}, {"bbox": [0.0984375, 0.5154588235294117, 0.6203125, 0.7554588235294117], "label": "a green hot dog"}, {"bbox": [0.5387187499999999, 0.0, 0.7998593749999999, 0.36628235294117645], "label": "a yellow cup"}], "image_id": "413971"}, "624": {"caption": "a photo of a brown bowl and a green cup and a brown sandwich and a yellow spoon and a green sandwich and a black sandwich ", "segment": [{"bbox": [0.3955, 0.00225, 0.9108541666666667, 0.26965625], "label": "a brown bowl"}, {"bbox": [0.010687499999999999, 0.0, 0.31372916666666667, 0.288765625], "label": "a green cup"}, {"bbox": [0.4086458333333333, 0.539359375, 0.7248333333333333, 0.798875], "label": "a brown sandwich"}, {"bbox": [0.30979166666666663, 0.22215625, 0.6553958333333333, 0.394046875], "label": "a yellow spoon"}, {"bbox": [0.7072291666666667, 0.353109375, 0.9450416666666667, 0.595515625], "label": "a green sandwich"}, {"bbox": [0.15031250000000002, 0.32820312500000004, 0.48462500000000003, 0.48520312500000007], "label": "a black sandwich"}], "image_id": "338949"}, "625": {"caption": "a photo of a red banana and a white banana and a brown banana and a red banana and a blue banana and a white banana ", "segment": [{"bbox": [0.0283125, 0.5041666666666667, 0.22321874999999997, 0.8016875], "label": "a red banana"}, {"bbox": [0.23040625, 0.5930625, 0.4760625, 0.7989999999999999], "label": "a white banana"}, {"bbox": [0.383890625, 0.5094166666666667, 0.5489531249999999, 0.7791458333333333], "label": "a brown banana"}, {"bbox": [0.28509375000000003, 0.6183125, 0.4894375, 0.7520416666666667], "label": "a red banana"}, {"bbox": [0.371609375, 0.36285416666666664, 0.517890625, 0.5297916666666667], "label": "a blue banana"}, {"bbox": [0.236625, 0.33531249999999996, 0.3705625, 0.5022083333333334], "label": "a white banana"}], "image_id": "497006"}, "626": {"caption": "a photo of a brown laptop and a blue laptop and a brown mouse and a brown chair and a blue bottle ", "segment": [{"bbox": [0.42174, 0.2575, 0.7793199999999999, 0.6976041666666667], "label": "a brown laptop"}, {"bbox": [0.0, 0.09864583333333334, 0.61724, 0.8413888888888889], "label": "a blue laptop"}, {"bbox": [0.09572, 0.7659027777777778, 0.3425, 0.9319444444444446], "label": "a brown mouse"}, {"bbox": [0.22236, 0.42614583333333333, 0.5335, 0.5771527777777777], "label": "a brown chair"}, {"bbox": [0.77446, 0.4665972222222222, 0.93712, 0.9588194444444444], "label": "a blue bottle"}], "image_id": "223444"}, "627": {"caption": "a photo of a red cup and a brown orange and a red cup and a blue dining table ", "segment": [{"bbox": [0.05168300653594771, 0.13034313725490196, 0.746062091503268, 0.9662908496732027], "label": "a red cup"}, {"bbox": [0.3435294117647059, 0.17898692810457517, 0.9788235294117646, 0.7107516339869281], "label": "a brown orange"}, {"bbox": [0.8207843137254902, 0.0025980392156862747, 0.9818137254901961, 0.22338235294117648], "label": "a red cup"}, {"bbox": [0.0, 0.0, 1.0, 0.9862418300653596], "label": "a blue dining table"}], "image_id": "463283"}, "628": {"caption": "a photo of a white bowl and a yellow bowl and a red bowl and a red broccoli and a black dining table ", "segment": [{"bbox": [0.21356250000000002, 0.16293749999999999, 1.0, 0.9857916666666667], "label": "a white bowl"}, {"bbox": [0.37134375, 0.000375, 0.8305781250000001, 0.22277083333333333], "label": "a yellow bowl"}, {"bbox": [0.011796875, 0.0, 0.22584375000000004, 0.20897916666666666], "label": "a red bowl"}, {"bbox": [0.0, 0.18310416666666668, 0.39525, 0.5812083333333333], "label": "a red broccoli"}, {"bbox": [0.0033750000000000004, 0.0, 0.9994375, 0.9370833333333334], "label": "a black dining table"}], "image_id": "134016"}, "629": {"caption": "a photo of a black horse and a yellow car and a blue truck and a black truck ", "segment": [{"bbox": [0.5689375, 0.25578823529411765, 0.69559375, 0.7101647058823529], "label": "a black horse"}, {"bbox": [0.45292187500000003, 0.36421176470588235, 0.57921875, 0.5181411764705882], "label": "a yellow car"}, {"bbox": [0.8659375, 0.26952941176470585, 0.9998281250000002, 0.44896470588235293], "label": "a blue truck"}, {"bbox": [0.0017187500000000002, 0.3246823529411765, 0.34496875, 0.7168941176470588], "label": "a black truck"}], "image_id": "362293"}, "630": {"caption": "a photo of a yellow tv and a yellow laptop and a red dining table and a brown tv ", "segment": [{"bbox": [0.737390625, 0.23402083333333332, 0.98321875, 0.4860833333333333], "label": "a yellow tv"}, {"bbox": [0.06490625, 0.3151875, 0.22057812499999999, 0.49147916666666663], "label": "a yellow laptop"}, {"bbox": [0.342859375, 0.4, 0.748046875, 0.7558541666666667], "label": "a red dining table"}, {"bbox": [0.47850000000000004, 0.23304166666666667, 0.6285937500000001, 0.36695833333333333], "label": "a brown tv"}], "image_id": "495680"}, "631": {"caption": "a photo of a yellow cow and a blue cow and a white cow and a brown cow ", "segment": [{"bbox": [0.05159375000000001, 0.36972916666666666, 0.289625, 0.8656458333333333], "label": "a yellow cow"}, {"bbox": [0.609671875, 0.3630833333333333, 0.932265625, 0.9845833333333334], "label": "a blue cow"}, {"bbox": [0.23181250000000003, 0.3565, 0.510390625, 0.8422083333333333], "label": "a white cow"}, {"bbox": [0.46484375, 0.3697916666666667, 0.716796875, 0.8307291666666666], "label": "a brown cow"}], "image_id": "116095"}, "632": {"caption": "a photo of a yellow banana and a blue banana and a brown orange and a blue orange ", "segment": [{"bbox": [0.054453125000000005, 0.0, 1.0, 1.0], "label": "a yellow banana"}, {"bbox": [0.342359375, 0.0020833333333333333, 0.5329375000000001, 0.277375], "label": "a blue banana"}, {"bbox": [0.0017656249999999998, 0.3811666666666667, 0.48882812500000006, 0.9858750000000001], "label": "a brown orange"}, {"bbox": [0.76059375, 0.13810416666666667, 1.0, 0.8510416666666667], "label": "a blue orange"}], "image_id": "119452"}, "633": {"caption": "a photo of a green tv and a yellow chair and a yellow chair and a blue bed ", "segment": [{"bbox": [0.8172656249999999, 0.277125, 0.99046875, 0.4340833333333334], "label": "a green tv"}, {"bbox": [0.27903125, 0.5827916666666667, 0.606453125, 0.9483958333333333], "label": "a yellow chair"}, {"bbox": [0.58021875, 0.6836249999999999, 0.984046875, 1.0], "label": "a yellow chair"}, {"bbox": [0.26749999999999996, 0.132625, 0.47573437500000004, 0.55475], "label": "a blue bed"}], "image_id": "570022"}, "634": {"caption": "a photo of a yellow potted plant and a black car and a yellow bench and a green potted plant ", "segment": [{"bbox": [0.3953125, 0.19126463700234192, 0.5328125, 0.41374707259953164], "label": "a yellow potted plant"}, {"bbox": [0.056843750000000005, 0.0021311475409836068, 0.279734375, 0.47747072599531615], "label": "a black car"}, {"bbox": [0.6876249999999999, 0.171615925058548, 0.96521875, 0.7199063231850117], "label": "a yellow bench"}, {"bbox": [0.0015, 0.004496487119437939, 0.1439375, 0.734824355971897], "label": "a green potted plant"}], "image_id": "543112"}, "635": {"caption": "a photo of a green chair and a blue chair and a black dining table and a brown chair and a green chair and a yellow chair ", "segment": [{"bbox": [0.29356, 0.407725, 0.53906, 0.9077250000000001], "label": "a green chair"}, {"bbox": [0.48516000000000004, 0.548375, 0.8653800000000001, 0.98925], "label": "a blue chair"}, {"bbox": [0.46982, 0.5059, 0.95094, 0.6780750000000001], "label": "a black dining table"}, {"bbox": [0.23312, 0.371875, 0.36568, 0.6698999999999999], "label": "a brown chair"}, {"bbox": [0.75326, 0.451825, 0.9995599999999999, 0.7271500000000001], "label": "a green chair"}, {"bbox": [0.00098, 0.395875, 0.13648, 0.807275], "label": "a yellow chair"}], "image_id": "485994"}, "636": {"caption": "a photo of a brown surfboard and a red surfboard and a red surfboard and a red surfboard and a brown surfboard and a red surfboard ", "segment": [{"bbox": [0.59828125, 0.6281455399061032, 0.848609375, 0.8934272300469482], "label": "a brown surfboard"}, {"bbox": [0.393765625, 0.588075117370892, 0.6210625000000001, 0.8212206572769953], "label": "a red surfboard"}, {"bbox": [0.32965625, 0.5815962441314554, 0.577796875, 0.780281690140845], "label": "a red surfboard"}, {"bbox": [0.563828125, 0.6188262910798122, 0.753328125, 0.8658920187793427], "label": "a red surfboard"}, {"bbox": [0.48428125, 0.6095539906103287, 0.66684375, 0.8352582159624414], "label": "a brown surfboard"}, {"bbox": [0.311671875, 0.5717605633802817, 0.5074375, 0.7764788732394365], "label": "a red surfboard"}], "image_id": "281508"}, "637": {"caption": "a photo of a green dining table and a yellow wine glass and a green donut and a green cup and a blue potted plant and a blue donut ", "segment": [{"bbox": [0.0, 0.24270312500000002, 0.992907949790795, 0.9887656250000001], "label": "a green dining table"}, {"bbox": [0.2617573221757322, 0.01984375, 0.5626359832635983, 0.52996875], "label": "a yellow wine glass"}, {"bbox": [0.19531380753138075, 0.545875, 0.6206276150627615, 0.8894062500000001], "label": "a green donut"}, {"bbox": [0.5796234309623431, 0.141765625, 0.9016527196652719, 0.5164531250000001], "label": "a green cup"}, {"bbox": [0.04861924686192468, 0.0, 0.29822175732217576, 0.22540624999999997], "label": "a blue potted plant"}, {"bbox": [0.5405857740585773, 0.5494687500000001, 0.7625313807531381, 0.784765625], "label": "a blue donut"}], "image_id": "176696"}, "638": {"caption": "a photo of a red pizza and a blue pizza and a red pizza and a black pizza and a black pizza and a green pizza ", "segment": [{"bbox": [0.175152224824356, 0.501125, 0.778032786885246, 0.896625], "label": "a red pizza"}, {"bbox": [0.508360655737705, 0.534828125, 1.0, 0.9994687500000001], "label": "a blue pizza"}, {"bbox": [0.0673536299765808, 0.37490625, 0.7443559718969555, 0.604125], "label": "a red pizza"}, {"bbox": [0.12798594847775174, 0.4994375, 0.6500468384074941, 0.735390625], "label": "a black pizza"}, {"bbox": [0.32334894613583137, 0.311984375, 0.7746838407494144, 0.45804687499999996], "label": "a black pizza"}, {"bbox": [0.6914285714285715, 0.265171875, 0.8420374707259953, 0.4494375], "label": "a green pizza"}], "image_id": "197262"}, "639": {"caption": "a photo of a brown umbrella and a red dining table and a green dining table and a brown cup and a red cup and a green dining table ", "segment": [{"bbox": [0.0, 0.02315625, 0.3215, 0.293828125], "label": "a brown umbrella"}, {"bbox": [0.0, 0.5979687499999999, 1.0, 0.9876093749999999], "label": "a red dining table"}, {"bbox": [0.414625, 0.530421875, 0.9753958333333335, 0.6870156250000001], "label": "a green dining table"}, {"bbox": [0.6322083333333333, 0.67415625, 1.0, 0.9820156250000001], "label": "a brown cup"}, {"bbox": [0.2529375, 0.59134375, 0.43985416666666666, 0.7727031249999999], "label": "a red cup"}, {"bbox": [0.000625, 0.34375, 0.6331875, 0.52165625], "label": "a green dining table"}], "image_id": "485483"}, "640": {"caption": "a photo of a blue umbrella and a white umbrella and a yellow dining table and a yellow dining table and a white chair and a brown chair ", "segment": [{"bbox": [0.0016799999999999999, 0.0, 0.8747199999999999, 0.8382133333333333], "label": "a blue umbrella"}, {"bbox": [0.62528, 0.13909333333333332, 1.0, 0.7147466666666666], "label": "a white umbrella"}, {"bbox": [0.2556, 0.8354133333333332, 0.64742, 0.9923733333333333], "label": "a yellow dining table"}, {"bbox": [0.16396, 0.6983999999999999, 0.37422000000000005, 0.8901333333333332], "label": "a yellow dining table"}, {"bbox": [0.10582, 0.7642399999999999, 0.25134, 1.0], "label": "a white chair"}, {"bbox": [0.7028, 0.8179733333333333, 0.8376399999999999, 0.9820266666666666], "label": "a brown chair"}], "image_id": "29709"}, "641": {"caption": "a photo of a brown chair and a blue chair and a brown couch and a black couch and a blue chair and a brown chair ", "segment": [{"bbox": [0.85471875, 0.47454332552693207, 1.0, 0.7669789227166276], "label": "a brown chair"}, {"bbox": [0.0008125000000000001, 0.5000936768149883, 0.21376562500000001, 0.9325995316159251], "label": "a blue chair"}, {"bbox": [0.08325, 0.45779859484777513, 0.2961875, 0.7431147540983607], "label": "a brown couch"}, {"bbox": [0.56840625, 0.8233723653395785, 0.9999218750000001, 0.9870023419203747], "label": "a black couch"}, {"bbox": [0.085265625, 0.46070257611241217, 0.29798437499999997, 0.7614285714285715], "label": "a blue chair"}, {"bbox": [0.6752343749999999, 0.4492505854800937, 0.818953125, 0.6924121779859486], "label": "a brown chair"}], "image_id": "492758"}, "642": {"caption": "a photo of a green motorcycle and a black motorcycle and a yellow motorcycle and a red motorcycle and a yellow motorcycle and a blue motorcycle ", "segment": [{"bbox": [0.1221875, 0.146075, 1.0, 0.9910000000000001], "label": "a green motorcycle"}, {"bbox": [0.0028125, 0.267425, 0.82584375, 0.988775], "label": "a black motorcycle"}, {"bbox": [0.14125000000000001, 0.019525, 0.5822499999999999, 0.30425], "label": "a yellow motorcycle"}, {"bbox": [0.242875, 0.11197499999999999, 0.6875312499999999, 0.3003], "label": "a red motorcycle"}, {"bbox": [0.00421875, 0.011225, 0.18960937500000002, 0.3618], "label": "a yellow motorcycle"}, {"bbox": [0.8637656249999999, 0.0837, 0.994375, 0.3736], "label": "a blue motorcycle"}], "image_id": "524108"}, "643": {"caption": "a photo of a white chair and a black dining table and a yellow laptop and a red cat ", "segment": [{"bbox": [0.00059375, 0.4512291666666667, 0.46290624999999996, 1.0], "label": "a white chair"}, {"bbox": [0.383046875, 0.1064375, 1.0, 0.9862708333333333], "label": "a black dining table"}, {"bbox": [0.33971874999999996, 0.0211875, 0.6544375, 0.21975], "label": "a yellow laptop"}, {"bbox": [0.1385, 0.35908333333333337, 0.36796875, 0.8715208333333334], "label": "a red cat"}], "image_id": "451440"}, "644": {"caption": "a photo of a brown giraffe and a brown giraffe and a green giraffe and a red giraffe and a brown giraffe and a white giraffe ", "segment": [{"bbox": [0.2128125, 0.5229166666666667, 0.525390625, 1.0], "label": "a brown giraffe"}, {"bbox": [0.515515625, 0.6868333333333333, 0.8208437500000001, 0.999625], "label": "a brown giraffe"}, {"bbox": [0.5460625, 0.2629166666666667, 1.0, 0.892125], "label": "a green giraffe"}, {"bbox": [0.566296875, 0.008604166666666666, 1.0, 0.9838958333333333], "label": "a red giraffe"}, {"bbox": [0.55746875, 0.5038125, 0.8152968749999999, 0.9845625000000001], "label": "a brown giraffe"}, {"bbox": [0.475109375, 0.4942708333333333, 0.6383593750000001, 0.6814583333333334], "label": "a white giraffe"}], "image_id": "522665"}, "645": {"caption": "a photo of a green dining table and a brown refrigerator and a green bottle and a brown pizza and a brown chair and a white cup ", "segment": [{"bbox": [0.0016875000000000002, 0.24097916666666666, 1.0, 0.9858958333333334], "label": "a green dining table"}, {"bbox": [0.15878125, 0.0011250000000000001, 0.603046875, 0.28491666666666665], "label": "a brown refrigerator"}, {"bbox": [0.653578125, 0.000625, 0.814265625, 0.5387708333333333], "label": "a green bottle"}, {"bbox": [0.443265625, 0.703375, 0.7466250000000001, 0.9460625], "label": "a brown pizza"}, {"bbox": [0.798875, 0.08764583333333334, 0.9977499999999999, 0.29662499999999997], "label": "a brown chair"}, {"bbox": [0.804328125, 0.277125, 0.951953125, 0.5464166666666667], "label": "a white cup"}], "image_id": "194724"}, "646": {"caption": "a photo of a brown broccoli and a yellow broccoli and a brown broccoli and a yellow dining table ", "segment": [{"bbox": [0.29021875, 0.37735981308411215, 0.61196875, 0.7287850467289718], "label": "a brown broccoli"}, {"bbox": [0.5695, 0.6927803738317757, 0.760359375, 0.9045093457943925], "label": "a yellow broccoli"}, {"bbox": [0.5428437500000001, 0.48261682242990656, 0.77478125, 0.731892523364486], "label": "a brown broccoli"}, {"bbox": [0.0015, 0.0022429906542056075, 1.0, 0.9887616822429907], "label": "a yellow dining table"}], "image_id": "96440"}, "647": {"caption": "a photo of a green horse and a blue horse and a white horse and a blue horse ", "segment": [{"bbox": [0.2993139293139293, 0.6749375, 0.5732224532224532, 0.902921875], "label": "a green horse"}, {"bbox": [0.5464241164241164, 0.672765625, 0.7708316008316007, 0.858046875], "label": "a blue horse"}, {"bbox": [0.18837837837837837, 0.67246875, 0.3827234927234927, 0.9106718749999999], "label": "a white horse"}, {"bbox": [0.4801871101871102, 0.67409375, 0.6074844074844075, 0.8030156250000001], "label": "a blue horse"}], "image_id": "71027"}, "648": {"caption": "a photo of a blue zebra and a black zebra and a blue zebra and a blue zebra ", "segment": [{"bbox": [0.150890625, 0.3810538641686183, 0.358328125, 0.6475644028103045], "label": "a blue zebra"}, {"bbox": [0.59934375, 0.3613817330210773, 0.8107031250000001, 0.6741217798594848], "label": "a black zebra"}, {"bbox": [0.4038125, 0.40501170960187355, 0.635375, 0.654519906323185], "label": "a blue zebra"}, {"bbox": [0.362265625, 0.4105152224824356, 0.5717187499999999, 0.676744730679157], "label": "a blue zebra"}], "image_id": "423810"}, "649": {"caption": "a photo of a black broccoli and a white spoon and a black carrot and a black broccoli and a green carrot and a white carrot ", "segment": [{"bbox": [0.0, 0.17230046948356809, 0.39578125000000003, 0.9403051643192489], "label": "a black broccoli"}, {"bbox": [0.557921875, 0.04044600938967136, 1.0, 0.5078638497652582], "label": "a white spoon"}, {"bbox": [0.446875, 0.7032863849765258, 0.609375, 1.0], "label": "a black carrot"}, {"bbox": [0.3045, 0.30145539906103286, 0.47642187499999994, 0.5406338028169014], "label": "a black broccoli"}, {"bbox": [0.524671875, 0.5788262910798122, 0.726703125, 0.7505868544600939], "label": "a green carrot"}, {"bbox": [0.660859375, 0.6066197183098592, 0.79584375, 0.7489671361502348], "label": "a white carrot"}], "image_id": "482730"}, "650": {"caption": "a photo of a yellow cup and a green knife and a brown dining table and a brown cup and a brown cup ", "segment": [{"bbox": [0.46895312499999997, 0.0921388888888889, 0.605484375, 0.39099999999999996], "label": "a yellow cup"}, {"bbox": [0.001265625, 0.4802222222222222, 0.1744375, 0.7251666666666666], "label": "a green knife"}, {"bbox": [0.0, 0.0, 1.0, 0.9865277777777777], "label": "a brown dining table"}, {"bbox": [0.164328125, 0.22022222222222224, 0.30590625, 0.505611111111111], "label": "a brown cup"}, {"bbox": [0.7849375000000001, 0.11688888888888889, 0.9641718750000001, 0.43641666666666673], "label": "a brown cup"}], "image_id": "541562"}, "651": {"caption": "a photo of a brown potted plant and a red dining table and a blue cup and a yellow knife and a blue bowl and a brown sandwich ", "segment": [{"bbox": [0.8539999999999999, 0.0013333333333333333, 0.9989687499999998, 0.3647083333333333], "label": "a brown potted plant"}, {"bbox": [0.0, 0.11764583333333332, 0.998828125, 0.9788333333333334], "label": "a red dining table"}, {"bbox": [0.772296875, 0.3422916666666667, 0.982109375, 0.5447708333333333], "label": "a blue cup"}, {"bbox": [0.0, 0.4741458333333333, 0.215109375, 0.6730833333333333], "label": "a yellow knife"}, {"bbox": [0.35896875, 0.3784166666666666, 0.653671875, 0.6432916666666666], "label": "a blue bowl"}, {"bbox": [0.071859375, 0.3393333333333333, 0.30965625, 0.5617916666666666], "label": "a brown sandwich"}], "image_id": "76384"}, "652": {"caption": "a photo of a red cup and a black fork and a red bowl and a blue dining table ", "segment": [{"bbox": [0.6406535947712418, 0.2902777777777778, 0.8261437908496732, 0.6758169934640523], "label": "a red cup"}, {"bbox": [0.5741666666666666, 0.70890522875817, 1.0, 0.8657352941176472], "label": "a black fork"}, {"bbox": [0.040539215686274506, 0.6385130718954248, 0.37387254901960787, 0.8952777777777777], "label": "a red bowl"}, {"bbox": [0.004493464052287581, 0.2675653594771242, 1.0, 0.9844117647058824], "label": "a blue dining table"}], "image_id": "32625"}, "653": {"caption": "a photo of a white cat and a black laptop and a white bed and a green book ", "segment": [{"bbox": [0.17454, 0.12085333333333334, 0.65108, 0.65928], "label": "a white cat"}, {"bbox": [0.18719999999999998, 0.17642666666666665, 1.0, 0.8802933333333334], "label": "a black laptop"}, {"bbox": [0.0, 0.08221333333333333, 1.0, 1.0], "label": "a white bed"}, {"bbox": [0.57426, 0.3003733333333333, 0.79096, 0.5037866666666667], "label": "a green book"}], "image_id": "488563"}, "654": {"caption": "a photo of a brown cell phone and a green cup and a red book and a yellow book ", "segment": [{"bbox": [0.13474999999999998, 0.12326968973747017, 0.470140625, 0.9868019093078758], "label": "a brown cell phone"}, {"bbox": [0.30159375, 0.004486873508353222, 0.662046875, 0.7842720763723151], "label": "a green cup"}, {"bbox": [0.45824999999999994, 0.8420763723150357, 0.620296875, 0.997780429594272], "label": "a red book"}, {"bbox": [0.0, 0.6610262529832936, 0.13565624999999998, 1.0], "label": "a yellow book"}], "image_id": "440937"}, "655": {"caption": "a photo of a yellow zebra and a black zebra and a blue zebra and a white zebra ", "segment": [{"bbox": [0.03796875, 0.2861111111111111, 0.39279687500000005, 0.7037198067632849], "label": "a yellow zebra"}, {"bbox": [0.353234375, 0.3640338164251208, 0.864921875, 0.9865217391304347], "label": "a black zebra"}, {"bbox": [0.45601562500000004, 0.4065217391304348, 0.9717656250000001, 0.9515700483091789], "label": "a blue zebra"}, {"bbox": [0.015062500000000001, 0.27292270531400964, 0.3405, 0.6751449275362319], "label": "a white zebra"}], "image_id": "465835"}, "656": {"caption": "a photo of a green motorcycle and a blue motorcycle and a brown motorcycle and a white truck ", "segment": [{"bbox": [0.061750000000000006, 0.265807962529274, 0.329828125, 0.5976346604215457], "label": "a green motorcycle"}, {"bbox": [0.010499999999999999, 0.25234192037470726, 0.15904687499999998, 0.5581264637002342], "label": "a blue motorcycle"}, {"bbox": [0.160421875, 0.20187353629976582, 0.8036249999999999, 0.9277049180327869], "label": "a brown motorcycle"}, {"bbox": [0.044984375, 0.1911709601873536, 0.26237499999999997, 0.32824355971896957], "label": "a white truck"}], "image_id": "422326"}, "657": {"caption": "a photo of a white couch and a blue chair and a yellow dining table and a red chair and a brown chair ", "segment": [{"bbox": [0.450671875, 0.5281341719077568, 0.890234375, 0.8570230607966456], "label": "a white couch"}, {"bbox": [0.49743750000000003, 0.7842767295597485, 0.927875, 0.9887631027253669], "label": "a blue chair"}, {"bbox": [0.29309375000000004, 0.680482180293501, 0.5231250000000001, 0.8830607966457023], "label": "a yellow dining table"}, {"bbox": [0.10453125, 0.8571488469601678, 0.5342968750000001, 0.9870230607966457], "label": "a red chair"}, {"bbox": [0.833, 0.5049685534591195, 1.0, 0.6936687631027254], "label": "a brown chair"}], "image_id": "290771"}, "658": {"caption": "a photo of a yellow suitcase and a white suitcase and a black backpack and a green backpack and a red suitcase and a black chair ", "segment": [{"bbox": [0.41557189542483663, 0.27263071895424834, 0.9233496732026144, 0.9624999999999999], "label": "a yellow suitcase"}, {"bbox": [0.3528104575163398, 0.3415686274509804, 0.5595424836601307, 0.7977450980392158], "label": "a white suitcase"}, {"bbox": [0.1511437908496732, 0.23401960784313725, 0.3587091503267974, 0.505343137254902], "label": "a black backpack"}, {"bbox": [0.5749836601307189, 0.22369281045751635, 0.8141176470588235, 0.3623039215686275], "label": "a green backpack"}, {"bbox": [0.06292483660130718, 0.1116830065359477, 0.20898692810457517, 0.29820261437908496], "label": "a red suitcase"}, {"bbox": [0.7623366013071896, 0.1633169934640523, 0.9284803921568627, 0.31004901960784315], "label": "a black chair"}], "image_id": "115245"}, "659": {"caption": "a photo of a yellow refrigerator and a black bottle and a brown bottle and a green bottle and a green bottle and a blue bottle ", "segment": [{"bbox": [0.0029791666666666664, 0.002453125, 0.9903125, 0.9823125000000001], "label": "a yellow refrigerator"}, {"bbox": [0.17527083333333332, 0.307390625, 0.45695833333333336, 0.9740624999999999], "label": "a black bottle"}, {"bbox": [0.41904166666666665, 0.27273437500000003, 0.6614791666666666, 0.9688281249999999], "label": "a brown bottle"}, {"bbox": [0.6718541666666666, 0.29090625000000003, 0.9142916666666667, 0.963640625], "label": "a green bottle"}, {"bbox": [0.023020833333333334, 0.303875, 0.2138125, 0.86353125], "label": "a green bottle"}, {"bbox": [0.6301041666666667, 0.26284375, 0.7719166666666666, 0.546109375], "label": "a blue bottle"}], "image_id": "298290"}, "660": {"caption": "a photo of a red spoon and a blue broccoli and a black spoon and a yellow broccoli and a white bowl ", "segment": [{"bbox": [0.6946875, 0.47470833333333334, 0.9531562499999999, 0.6205833333333334], "label": "a red spoon"}, {"bbox": [0.576765625, 0.26739583333333333, 0.800171875, 0.42135416666666664], "label": "a blue broccoli"}, {"bbox": [0.0, 0.01883333333333333, 0.1900625, 0.21062499999999998], "label": "a black spoon"}, {"bbox": [0.55784375, 0.36414583333333334, 0.88815625, 0.5703333333333334], "label": "a yellow broccoli"}, {"bbox": [0.534375, 0.2577083333333333, 0.9995, 0.6444375], "label": "a white bowl"}], "image_id": "475248"}, "661": {"caption": "a photo of a blue cup and a yellow bowl and a brown cup and a black knife and a red hot dog and a red dining table ", "segment": [{"bbox": [0.5640522875816993, 0.1123529411764706, 0.8089869281045752, 0.4898856209150327], "label": "a blue cup"}, {"bbox": [0.4554248366013072, 0.7663562091503268, 0.8291503267973858, 1.0], "label": "a yellow bowl"}, {"bbox": [0.21383986928104576, 0.009183006535947712, 0.5339705882352941, 0.48276143790849674], "label": "a brown cup"}, {"bbox": [0.18727124183006535, 0.7891339869281045, 0.4066830065359477, 1.0], "label": "a black knife"}, {"bbox": [0.22119281045751635, 0.5058333333333334, 0.5710294117647059, 0.8182679738562091], "label": "a red hot dog"}, {"bbox": [0.0, 0.0, 1.0, 1.0], "label": "a red dining table"}], "image_id": "66360"}, "662": {"caption": "a photo of a blue bottle and a brown bowl and a brown bowl and a black broccoli and a black bottle and a red bottle ", "segment": [{"bbox": [0.165546875, 0.005625000000000001, 0.35979687499999996, 0.20833333333333334], "label": "a blue bottle"}, {"bbox": [0.459359375, 0.35179166666666667, 0.8650625, 0.8061875000000001], "label": "a brown bowl"}, {"bbox": [0.064171875, 0.2828125, 0.425296875, 0.6736041666666668], "label": "a brown bowl"}, {"bbox": [0.514578125, 0.5864166666666667, 0.71503125, 0.7657916666666668], "label": "a black broccoli"}, {"bbox": [0.0, 0.007791666666666667, 0.19675, 0.2649375], "label": "a black bottle"}, {"bbox": [0.34675, 0.0026041666666666665, 0.51234375, 0.16883333333333334], "label": "a red bottle"}], "image_id": "294297"}, "663": {"caption": "a photo of a black bottle and a blue fork and a black bowl and a blue orange and a yellow cake and a red cake ", "segment": [{"bbox": [0.603328125, 0.0, 0.835921875, 0.3830208333333333], "label": "a black bottle"}, {"bbox": [0.0, 0.38725, 0.360734375, 1.0], "label": "a blue fork"}, {"bbox": [0.738078125, 0.1448125, 1.0, 0.6831041666666666], "label": "a black bowl"}, {"bbox": [0.7729375, 0.17177083333333334, 1.0, 0.52], "label": "a blue orange"}, {"bbox": [0.258328125, 0.40850000000000003, 0.66584375, 0.8666458333333333], "label": "a yellow cake"}, {"bbox": [0.00671875, 0.00020833333333333335, 0.5771875000000001, 0.27091666666666664], "label": "a red cake"}], "image_id": "496954"}, "664": {"caption": "a photo of a black couch and a blue couch and a yellow dining table and a black couch and a red couch ", "segment": [{"bbox": [0.22147999999999998, 0.40206989247311825, 0.5054399999999999, 0.7269892473118279], "label": "a black couch"}, {"bbox": [0.07981999999999999, 0.40516129032258064, 0.23788, 0.6497849462365591], "label": "a blue couch"}, {"bbox": [0.39214, 0.5599999999999999, 0.7790199999999999, 0.88], "label": "a yellow dining table"}, {"bbox": [0.49672000000000005, 0.4042204301075269, 0.80942, 0.709758064516129], "label": "a black couch"}, {"bbox": [0.83978, 0.48653225806451617, 1.0, 0.8428225806451612], "label": "a red couch"}], "image_id": "415949"}, "665": {"caption": "a photo of a black book and a red book and a black book and a black handbag ", "segment": [{"bbox": [0.34334375, 0.27454732510288066, 0.526078125, 0.5503703703703704], "label": "a black book"}, {"bbox": [0.5017031249999999, 0.5707818930041152, 0.67746875, 0.8921399176954732], "label": "a red book"}, {"bbox": [0.022234375, 0.29279835390946507, 0.34376562499999996, 0.6689094650205762], "label": "a black book"}, {"bbox": [0.543875, 0.0006995884773662552, 0.9429062500000001, 0.45973251028806583], "label": "a black handbag"}], "image_id": "19333"}, "666": {"caption": "a photo of a black bus and a red bus and a white bus and a brown truck ", "segment": [{"bbox": [0.0016875000000000002, 0.5732083333333333, 0.315875, 0.989875], "label": "a black bus"}, {"bbox": [0.47359375000000004, 0.6493333333333333, 0.649109375, 0.9363125], "label": "a red bus"}, {"bbox": [0.27746875000000004, 0.6367708333333333, 0.5700625, 1.0], "label": "a white bus"}, {"bbox": [0.806640625, 0.6575624999999999, 1.0, 0.9856874999999999], "label": "a brown truck"}], "image_id": "383112"}, "667": {"caption": "a photo of a green motorcycle and a white motorcycle and a red motorcycle and a brown motorcycle ", "segment": [{"bbox": [0.10304687500000001, 0.23310416666666667, 0.9256718750000001, 0.875], "label": "a green motorcycle"}, {"bbox": [0.36153124999999997, 0.0699375, 0.9510625000000001, 0.5406666666666666], "label": "a white motorcycle"}, {"bbox": [0.003359375, 0.07758333333333334, 0.147984375, 0.22108333333333335], "label": "a red motorcycle"}, {"bbox": [0.327375, 0.03854166666666667, 0.70634375, 0.3856875], "label": "a brown motorcycle"}], "image_id": "520326"}, "668": {"caption": "a photo of a brown dining table and a blue carrot and a yellow carrot and a white carrot and a yellow carrot and a blue knife ", "segment": [{"bbox": [0.0, 1.6339869281045753e-05, 1.0, 0.9853267973856209], "label": "a brown dining table"}, {"bbox": [0.0363562091503268, 0.012990196078431373, 0.6155882352941177, 0.8441503267973857], "label": "a blue carrot"}, {"bbox": [0.07031045751633987, 0.045571895424836605, 0.75, 0.7356699346405228], "label": "a yellow carrot"}, {"bbox": [0.10444444444444445, 0.18733660130718954, 0.6631862745098039, 0.8531372549019608], "label": "a white carrot"}, {"bbox": [0.004705882352941176, 0.07294117647058823, 0.48, 0.8541176470588235], "label": "a yellow carrot"}, {"bbox": [0.5955065359477124, 0.2067483660130719, 1.0, 0.5303431372549019], "label": "a blue knife"}], "image_id": "143998"}, "669": {"caption": "a photo of a white banana and a yellow banana and a brown banana and a black banana and a brown apple and a red apple ", "segment": [{"bbox": [0.109546875, 0.16110416666666666, 0.608421875, 0.9835833333333334], "label": "a white banana"}, {"bbox": [0.11004687500000002, 0.19808333333333333, 0.6535, 0.7353333333333333], "label": "a yellow banana"}, {"bbox": [0.522609375, 0.2760208333333333, 0.851734375, 0.890375], "label": "a brown banana"}, {"bbox": [0.5858749999999999, 0.36941666666666667, 0.8364687499999999, 0.9764791666666667], "label": "a black banana"}, {"bbox": [0.0, 0.5181041666666667, 0.272609375, 1.0], "label": "a brown apple"}, {"bbox": [0.024703125, 0.6564791666666667, 0.22764062499999999, 0.9105833333333334], "label": "a red apple"}], "image_id": "240273"}, "670": {"caption": "a photo of a blue tv and a black tv and a black tv and a blue chair ", "segment": [{"bbox": [0.0173125, 0.12060416666666667, 0.352171875, 0.457], "label": "a blue tv"}, {"bbox": [0.86134375, 0.3340208333333334, 0.9865937499999999, 0.6020625000000001], "label": "a black tv"}, {"bbox": [0.70215625, 0.29422916666666665, 0.8827187500000001, 0.5205833333333333], "label": "a black tv"}, {"bbox": [0.0, 0.5420208333333334, 0.371765625, 0.9881458333333334], "label": "a blue chair"}], "image_id": "578343"}, "671": {"caption": "a photo of a brown dining table and a green cup and a blue fork and a blue cake ", "segment": [{"bbox": [0.0013281249999999999, 0.0, 1.0, 0.9881548974943053], "label": "a brown dining table"}, {"bbox": [0.630296875, 2.2779043280182233e-05, 0.773171875, 0.29947608200455583], "label": "a green cup"}, {"bbox": [0.20192187499999997, 0.37977220956719815, 0.38998437499999994, 0.9123690205011389], "label": "a blue fork"}, {"bbox": [0.362328125, 0.2862414578587699, 0.6409687500000001, 0.7644191343963553], "label": "a blue cake"}], "image_id": "115776"}, "672": {"caption": "a photo of a blue dining table and a brown bowl and a red sandwich and a brown cup and a brown fork and a yellow fork ", "segment": [{"bbox": [0.0, 0.0, 1.0, 0.98352], "label": "a blue dining table"}, {"bbox": [0.12444, 0.44832, 0.5129, 0.9864266666666666], "label": "a brown bowl"}, {"bbox": [0.42978, 0.24682666666666667, 0.7145999999999999, 0.7029866666666666], "label": "a red sandwich"}, {"bbox": [0.03034, 0.0, 0.32021999999999995, 0.41797333333333336], "label": "a brown cup"}, {"bbox": [0.53292, 0.10373333333333333, 0.76308, 0.41952], "label": "a brown fork"}, {"bbox": [0.5095, 0.10941333333333333, 0.86114, 0.25925333333333334], "label": "a yellow fork"}], "image_id": "72811"}, "673": {"caption": "a photo of a blue sheep and a black sheep and a white sheep and a red sheep and a white sheep and a black sheep ", "segment": [{"bbox": [0.0028571428571428567, 0.617203125, 0.9346583850931677, 1.0], "label": "a blue sheep"}, {"bbox": [0.0, 0.48171875000000003, 0.9061697722567288, 0.77634375], "label": "a black sheep"}, {"bbox": [0.21755693581780539, 0.23539062500000002, 1.0, 0.43084375], "label": "a white sheep"}, {"bbox": [0.23662525879917184, 0.5836875, 0.6170600414078675, 0.87078125], "label": "a red sheep"}, {"bbox": [0.10828157349896479, 0.5548437500000001, 0.48443064182194623, 0.7354843750000001], "label": "a white sheep"}, {"bbox": [0.22530020703933745, 0.43587499999999996, 0.5205175983436853, 0.5753593749999999], "label": "a black sheep"}], "image_id": "335631"}, "674": {"caption": "a photo of a blue bowl and a brown carrot and a black carrot and a brown broccoli ", "segment": [{"bbox": [0.11251948051948052, 0.2664359861591695, 0.8245454545454545, 0.8369204152249136], "label": "a blue bowl"}, {"bbox": [0.2101818181818182, 0.11529411764705882, 0.4097662337662337, 0.24941176470588236], "label": "a brown carrot"}, {"bbox": [0.06005194805194806, 0.21411764705882355, 0.19075324675324676, 0.3788235294117647], "label": "a black carrot"}, {"bbox": [0.39205194805194804, 0.12532871972318338, 0.7503116883116884, 0.44847750865051905], "label": "a brown broccoli"}], "image_id": "387906"}, "675": {"caption": "a photo of a green dog and a brown dog and a green dog and a blue couch and a yellow couch ", "segment": [{"bbox": [0.27653125, 0.20403397027600848, 0.7508125, 0.5575796178343949], "label": "a green dog"}, {"bbox": [0.0044375, 0.250828025477707, 0.4086875, 0.7458174097664543], "label": "a brown dog"}, {"bbox": [0.6899375, 0.21229299363057325, 0.99446875, 0.7122929936305733], "label": "a green dog"}, {"bbox": [0.001578125, 0.0021443736730360936, 0.997078125, 0.9892569002123143], "label": "a blue couch"}, {"bbox": [0.038234375, 0.3992144373673036, 1.0, 0.9784288747346073], "label": "a yellow couch"}], "image_id": "330037"}, "676": {"caption": "a photo of a yellow couch and a green couch and a brown couch and a blue chair and a brown chair ", "segment": [{"bbox": [0.573390625, 0.5075316455696203, 0.83884375, 0.9053797468354431], "label": "a yellow couch"}, {"bbox": [0.173078125, 0.5118354430379747, 0.36739062499999997, 0.7677531645569621], "label": "a green couch"}, {"bbox": [0.035046875, 0.6430063291139241, 0.3939375, 0.989240506329114], "label": "a brown couch"}, {"bbox": [0.1716875, 0.5067405063291139, 0.364609375, 0.7746835443037975], "label": "a blue chair"}, {"bbox": [0.034640625, 0.645, 0.39746875, 1.0], "label": "a brown chair"}], "image_id": "436470"}, "677": {"caption": "a photo of a brown spoon and a brown bowl and a brown carrot and a brown carrot and a brown carrot ", "segment": [{"bbox": [0.71346, 0.296, 0.99894, 0.5265599999999999], "label": "a brown spoon"}, {"bbox": [0.0, 0.00112, 1.0, 0.9898666666666667], "label": "a brown bowl"}, {"bbox": [0.16558, 0.27271999999999996, 0.38766, 0.5194933333333334], "label": "a brown carrot"}, {"bbox": [0.17488, 0.3111733333333333, 0.7519399999999999, 0.9122133333333333], "label": "a brown carrot"}, {"bbox": [0.25034, 0.16981333333333334, 0.56524, 0.37381333333333333], "label": "a brown carrot"}], "image_id": "368291"}, "678": {"caption": "a photo of a brown broccoli and a blue carrot and a red carrot and a green dining table ", "segment": [{"bbox": [0.35702, 0.40477477477477475, 0.5795799999999999, 0.8638138138138137], "label": "a brown broccoli"}, {"bbox": [0.06409999999999999, 0.29600600600600596, 0.27984000000000003, 0.5401501501501501], "label": "a blue carrot"}, {"bbox": [0.08807999999999999, 0.18672672672672672, 0.36397999999999997, 0.5366966966966967], "label": "a red carrot"}, {"bbox": [0.00174, 0.002612612612612613, 1.0, 0.9869669669669671], "label": "a green dining table"}], "image_id": "538888"}, "679": {"caption": "a photo of a brown cow and a white cow and a red cow and a black cow ", "segment": [{"bbox": [0.2587668593448941, 0.42418750000000005, 0.48849710982658967, 0.64903125], "label": "a brown cow"}, {"bbox": [0.0, 0.263671875, 0.4810982658959538, 0.550671875], "label": "a white cow"}, {"bbox": [0.0026396917148362236, 0.51415625, 0.23551059730250481, 0.79528125], "label": "a red cow"}, {"bbox": [0.6762620423892101, 0.240171875, 0.8515799614643546, 0.39256250000000004], "label": "a black cow"}], "image_id": "464286"}, "680": {"caption": "a photo of a white oven and a red oven and a blue oven and a black car and a blue oven ", "segment": [{"bbox": [0.27471875, 0.48314583333333333, 0.52246875, 0.7550625], "label": "a white oven"}, {"bbox": [0.3745625, 0.4704583333333333, 0.641828125, 0.7066041666666666], "label": "a red oven"}, {"bbox": [0.148390625, 0.44277083333333334, 0.3121875, 0.6814166666666667], "label": "a blue oven"}, {"bbox": [0.0, 0.381125, 0.13940625, 0.6305833333333334], "label": "a black car"}, {"bbox": [0.486828125, 0.38829166666666665, 0.66934375, 0.5905], "label": "a blue oven"}], "image_id": "170425"}, "681": {"caption": "a photo of a black banana and a red dining table and a yellow dining table and a white cup ", "segment": [{"bbox": [0.035958333333333335, 0.12809375, 0.9587916666666666, 0.898875], "label": "a black banana"}, {"bbox": [0.81175, 0.278515625, 1.0, 0.63253125], "label": "a red dining table"}, {"bbox": [0.0, 0.41039062499999995, 0.9627708333333334, 0.9974062499999998], "label": "a yellow dining table"}, {"bbox": [0.023291666666666665, 0.0005625, 0.32262500000000005, 0.34684375], "label": "a white cup"}], "image_id": "257328"}, "682": {"caption": "a photo of a black cup and a yellow cup and a brown dining table and a red bowl and a red donut and a green donut ", "segment": [{"bbox": [0.160390625, 0.00046875, 0.41004687500000003, 0.163875], "label": "a black cup"}, {"bbox": [0.47121874999999996, 0.003453125, 0.6736875, 0.14137499999999997], "label": "a yellow cup"}, {"bbox": [0.00225, 0.011390625, 0.993265625, 0.984421875], "label": "a brown dining table"}, {"bbox": [0.503890625, 0.376625, 0.8883125, 0.633765625], "label": "a red bowl"}, {"bbox": [0.17340625, 0.27531249999999996, 0.40121875000000007, 0.43637499999999996], "label": "a red donut"}, {"bbox": [0.05746875, 0.4635625, 0.321375, 0.641578125], "label": "a green donut"}], "image_id": "484641"}, "683": {"caption": "a photo of a black chair and a red couch and a green laptop and a yellow backpack ", "segment": [{"bbox": [0.10484374999999999, 0.5913958333333333, 0.34515625, 1.0], "label": "a black chair"}, {"bbox": [0.712984375, 0.6300416666666667, 1.0, 0.9862708333333334], "label": "a red couch"}, {"bbox": [0.037921875, 0.5142291666666667, 0.226765625, 0.6684375], "label": "a green laptop"}, {"bbox": [0.8123125, 0.6292083333333333, 0.9516875, 0.8414791666666666], "label": "a yellow backpack"}], "image_id": "24610"}, "684": {"caption": "a photo of a red couch and a green chair and a brown chair and a black clock ", "segment": [{"bbox": [0.771921875, 0.5182903981264637, 1.0, 0.9978454332552694], "label": "a red couch"}, {"bbox": [0.10818749999999999, 0.5056206088992974, 0.305046875, 0.8975175644028103], "label": "a green chair"}, {"bbox": [0.58290625, 0.5179391100702576, 0.773546875, 0.9101405152224824], "label": "a brown chair"}, {"bbox": [0.670640625, 0.004309133489461358, 0.999046875, 0.28929742388758783], "label": "a black clock"}], "image_id": "533129"}, "685": {"caption": "a photo of a yellow boat and a black boat and a brown boat and a blue boat and a green boat and a black boat ", "segment": [{"bbox": [0.038703125, 0.6066388888888888, 0.22549999999999998, 0.7815833333333333], "label": "a yellow boat"}, {"bbox": [0.41587500000000005, 0.7569166666666667, 0.5751406250000001, 0.9411944444444446], "label": "a black boat"}, {"bbox": [0.19375, 0.6871666666666667, 0.369265625, 0.8266111111111111], "label": "a brown boat"}, {"bbox": [0.8159218750000001, 0.7949444444444445, 0.9735312500000001, 0.9372777777777779], "label": "a blue boat"}, {"bbox": [0.32878124999999997, 0.7594722222222223, 0.474140625, 0.8898055555555556], "label": "a green boat"}, {"bbox": [0.256828125, 0.7239166666666667, 0.384984375, 0.8617222222222223], "label": "a black boat"}], "image_id": "183997"}, "686": {"caption": "a photo of a red banana and a black banana and a red banana and a green banana and a green banana ", "segment": [{"bbox": [0.00674, 0.7573066666666667, 0.30338, 1.0], "label": "a red banana"}, {"bbox": [0.47046, 0.6081333333333334, 0.7071799999999999, 1.0], "label": "a black banana"}, {"bbox": [0.0, 0.62824, 0.18882, 0.97176], "label": "a red banana"}, {"bbox": [0.65992, 0.7973066666666667, 0.84204, 1.0], "label": "a green banana"}, {"bbox": [0.79852, 0.7944533333333333, 0.98764, 1.0], "label": "a green banana"}], "image_id": "68380"}, "687": {"caption": "a photo of a white fork and a brown knife and a red knife and a white cake and a brown fork and a white spoon ", "segment": [{"bbox": [0.20451764705882353, 0.608453125, 0.40543529411764706, 0.848640625], "label": "a white fork"}, {"bbox": [0.07275294117647059, 0.438171875, 0.5207999999999999, 0.8298593750000001], "label": "a brown knife"}, {"bbox": [0.013529411764705882, 0.43820312499999997, 0.29103529411764706, 0.9483125000000001], "label": "a red knife"}, {"bbox": [0.5053411764705883, 0.0045, 1.0, 0.3108125], "label": "a white cake"}, {"bbox": [0.1988235294117647, 0.5096406250000001, 0.5843294117647059, 0.777671875], "label": "a brown fork"}, {"bbox": [0.19741176470588237, 0.493359375, 0.5819764705882353, 0.7705], "label": "a white spoon"}], "image_id": "19226"}, "688": {"caption": "a photo of a white bowl and a blue banana and a white banana and a blue banana ", "segment": [{"bbox": [0.171171875, 0.3022409638554217, 0.635375, 0.937566265060241], "label": "a white bowl"}, {"bbox": [0.0043749999999999995, 0.21959036144578312, 0.23951562500000004, 0.5394216867469879], "label": "a blue banana"}, {"bbox": [0.09909375000000001, 0.002240963855421687, 0.25792187499999997, 0.24269879518072293], "label": "a white banana"}, {"bbox": [0.0, 0.0, 0.150890625, 0.1453734939759036], "label": "a blue banana"}], "image_id": "34121"}, "689": {"caption": "a photo of a black cake and a white cake and a yellow cake and a brown cake ", "segment": [{"bbox": [0.144703125, 0.25651053864168616, 0.325890625, 0.41], "label": "a black cake"}, {"bbox": [0.22789062499999999, 0.5164871194379391, 0.373328125, 0.7254566744730678], "label": "a white cake"}, {"bbox": [0.33214062499999997, 0.26208430913348946, 0.461890625, 0.43053864168618267], "label": "a yellow cake"}, {"bbox": [0.296875, 0.2716627634660422, 0.9984375, 0.9625292740046838], "label": "a brown cake"}], "image_id": "442809"}, "690": {"caption": "a photo of a green refrigerator and a white refrigerator and a black refrigerator and a red refrigerator and a yellow refrigerator and a brown refrigerator ", "segment": [{"bbox": [0.680578125, 0.35281690140845073, 0.8570781249999999, 0.8449530516431926], "label": "a green refrigerator"}, {"bbox": [0.360359375, 0.3178873239436619, 0.51671875, 0.8525586854460094], "label": "a white refrigerator"}, {"bbox": [0.236328125, 0.35281690140845073, 0.369453125, 0.8516901408450706], "label": "a black refrigerator"}, {"bbox": [0.731296875, 0.27568075117370894, 0.88053125, 0.6097417840375586], "label": "a red refrigerator"}, {"bbox": [0.106203125, 0.26291079812206575, 0.249796875, 0.5550469483568075], "label": "a yellow refrigerator"}, {"bbox": [0.16821875, 0.23492957746478874, 0.335375, 0.3609389671361502], "label": "a brown refrigerator"}], "image_id": "462629"}, "691": {"caption": "a photo of a brown tv and a red chair and a yellow laptop and a black chair ", "segment": [{"bbox": [0.19628125000000002, 0.04109302325581396, 0.44334375000000004, 0.32279069767441865], "label": "a brown tv"}, {"bbox": [0.588484375, 0.09567441860465116, 0.9849375, 1.0], "label": "a red chair"}, {"bbox": [0.442375, 0.1236046511627907, 0.63865625, 0.36404651162790697], "label": "a yellow laptop"}, {"bbox": [0.35728125, 0.5191162790697674, 0.50284375, 0.7053953488372093], "label": "a black chair"}], "image_id": "399164"}, "692": {"caption": "a photo of a brown potted plant and a blue tv and a red chair and a red laptop and a blue couch and a brown book ", "segment": [{"bbox": [0.699546875, 0.38564583333333335, 0.9820625, 0.7757916666666667], "label": "a brown potted plant"}, {"bbox": [0.451234375, 0.31347916666666664, 0.592921875, 0.47775], "label": "a blue tv"}, {"bbox": [0.32742187500000003, 0.4883125, 0.60321875, 0.935625], "label": "a red chair"}, {"bbox": [0.583140625, 0.38877083333333334, 0.709546875, 0.5280833333333333], "label": "a red laptop"}, {"bbox": [0.0016718750000000002, 0.6892499999999999, 0.21812499999999999, 0.9890208333333332], "label": "a blue couch"}, {"bbox": [0.5828125, 0.23958333333333334, 0.9984375, 0.53125], "label": "a brown book"}], "image_id": "37740"}, "693": {"caption": "a photo of a yellow laptop and a green laptop and a black laptop and a red keyboard and a black tv ", "segment": [{"bbox": [0.7297343749999999, 0.44933333333333336, 1.0, 0.760125], "label": "a yellow laptop"}, {"bbox": [0.268078125, 0.304375, 0.431796875, 0.5062916666666666], "label": "a green laptop"}, {"bbox": [0.0016875000000000002, 0.3595416666666667, 0.182015625, 0.5775208333333334], "label": "a black laptop"}, {"bbox": [0.40431249999999996, 0.509875, 0.66875, 0.653125], "label": "a red keyboard"}, {"bbox": [0.45701562500000004, 0.2529791666666667, 0.6888125, 0.5037083333333333], "label": "a black tv"}], "image_id": "254745"}, "694": {"caption": "a photo of a green broccoli and a yellow broccoli and a yellow broccoli and a green broccoli and a blue carrot ", "segment": [{"bbox": [0.44974000000000003, 0.20426426426426425, 0.69636, 0.6218618618618618], "label": "a green broccoli"}, {"bbox": [0.03134, 0.24234234234234234, 0.31028, 0.6635435435435435], "label": "a yellow broccoli"}, {"bbox": [0.6879400000000001, 0.10588588588588588, 0.93084, 0.3082282282282282], "label": "a yellow broccoli"}, {"bbox": [0.7367400000000001, 0.32408408408408407, 0.9817400000000001, 0.5805705705705705], "label": "a green broccoli"}, {"bbox": [0.75552, 0.4983483483483483, 1.0, 0.9680180180180181], "label": "a blue carrot"}], "image_id": "398563"}, "695": {"caption": "a photo of a blue bicycle and a green car and a red boat and a black boat and a yellow bicycle ", "segment": [{"bbox": [0.10882812500000001, 0.5288125, 0.25153125000000004, 0.6677083333333333], "label": "a blue bicycle"}, {"bbox": [0.362765625, 0.499875, 0.6644687499999999, 0.664], "label": "a green car"}, {"bbox": [0.48657812500000003, 0.7675625, 1.0, 0.930875], "label": "a red boat"}, {"bbox": [0.008421874999999999, 0.7280833333333334, 0.458421875, 0.9101041666666667], "label": "a black boat"}, {"bbox": [0.03371875, 0.5378541666666667, 0.159640625, 0.6642708333333334], "label": "a yellow bicycle"}], "image_id": "147576"}, "696": {"caption": "a photo of a brown suitcase and a green suitcase and a white suitcase and a brown train ", "segment": [{"bbox": [0.3034, 0.3049866666666667, 0.6185799999999999, 0.7075733333333334], "label": "a brown suitcase"}, {"bbox": [0.61656, 0.11712, 0.9375, 0.69144], "label": "a green suitcase"}, {"bbox": [0.01686, 0.30112, 0.30674, 0.7123466666666667], "label": "a white suitcase"}, {"bbox": [0.0033799999999999998, 0.004506666666666667, 0.99776, 0.4876533333333333], "label": "a brown train"}], "image_id": "282741"}, "697": {"caption": "a photo of a white horse and a white horse and a black horse and a yellow horse and a black horse ", "segment": [{"bbox": [0.069984375, 0.6386150234741784, 0.20426562499999998, 0.8789671361502347], "label": "a white horse"}, {"bbox": [0.589765625, 0.6322535211267605, 0.71571875, 0.8666666666666666], "label": "a white horse"}, {"bbox": [0.193859375, 0.6195070422535212, 0.35259375, 0.8777699530516432], "label": "a black horse"}, {"bbox": [0.315125, 0.6118544600938967, 0.46746875, 0.8826995305164319], "label": "a yellow horse"}, {"bbox": [0.722609375, 0.645962441314554, 0.8848437500000002, 0.8646009389671361], "label": "a black horse"}], "image_id": "183155"}, "698": {"caption": "a photo of a blue cow and a red cow and a white sheep and a brown sheep ", "segment": [{"bbox": [0.158546875, 0.20448356807511736, 0.6731093749999999, 0.7640375586854461], "label": "a blue cow"}, {"bbox": [0.315203125, 0.24631455399061034, 0.6763125000000001, 0.6129342723004695], "label": "a red cow"}, {"bbox": [0.15559375, 0.20779342723004693, 0.68290625, 0.7584507042253522], "label": "a white sheep"}, {"bbox": [0.44615625000000003, 0.23753521126760563, 0.679875, 0.5392488262910798], "label": "a brown sheep"}], "image_id": "551533"}, "699": {"caption": "a photo of a red cat and a brown bed and a black suitcase and a brown suitcase ", "segment": [{"bbox": [0.43790625, 0.36922437673130193, 0.6089374999999999, 0.6294459833795013], "label": "a red cat"}, {"bbox": [0.26110937500000003, 0.05130193905817174, 0.9975625000000001, 0.988393351800554], "label": "a brown bed"}, {"bbox": [0.00253125, 0.1273961218836565, 0.684484375, 0.9835734072022161], "label": "a black suitcase"}, {"bbox": [0.41576562499999997, 0.008975069252077562, 0.785890625, 0.36404432132963993], "label": "a brown suitcase"}], "image_id": "229139"}, "700": {"caption": "a photo of a yellow zebra and a green car and a yellow car and a red car and a yellow car ", "segment": [{"bbox": [0.54228125, 0.6300833333333333, 0.9266875000000001, 0.9652916666666668], "label": "a yellow zebra"}, {"bbox": [0.44584375, 0.161375, 0.7463593749999999, 0.29825], "label": "a green car"}, {"bbox": [0.06118749999999999, 0.16368749999999999, 0.36059375, 0.30025], "label": "a yellow car"}, {"bbox": [0.757375, 0.22360416666666666, 0.9037812500000001, 0.36904166666666666], "label": "a red car"}, {"bbox": [0.121875, 0.08125, 0.9984375, 0.2125], "label": "a yellow car"}], "image_id": "118911"}, "701": {"caption": "a photo of a white car and a white zebra and a white zebra and a white zebra and a yellow giraffe ", "segment": [{"bbox": [0.30536, 0.6534666666666668, 0.48658000000000007, 0.7832266666666667], "label": "a white car"}, {"bbox": [0.04582, 0.62056, 0.38271999999999995, 1.0], "label": "a white zebra"}, {"bbox": [0.5270199999999999, 0.6205066666666667, 0.87162, 0.9876], "label": "a white zebra"}, {"bbox": [0.8005599999999999, 0.6487466666666667, 1.0, 1.0], "label": "a white zebra"}, {"bbox": [0.09079999999999999, 0.0021333333333333334, 0.81726, 0.9886666666666667], "label": "a yellow giraffe"}], "image_id": "188173"}, "702": {"caption": "a photo of a white boat and a red boat and a yellow umbrella and a white boat and a blue boat and a red umbrella ", "segment": [{"bbox": [0.0, 0.5685416666666666, 0.9977499999999999, 0.9865208333333333], "label": "a white boat"}, {"bbox": [0.267984375, 0.5303333333333333, 0.9977499999999999, 0.7910208333333333], "label": "a red boat"}, {"bbox": [0.0375, 0.3645833333333333, 0.9953125, 0.5125], "label": "a yellow umbrella"}, {"bbox": [0.35167187499999997, 0.36835416666666665, 0.7718906249999999, 0.5469375], "label": "a white boat"}, {"bbox": [0.0016875000000000002, 0.8382083333333333, 0.281453125, 0.9887708333333333], "label": "a blue boat"}, {"bbox": [0.788765625, 0.2814583333333333, 0.932015625, 0.4410208333333333], "label": "a red umbrella"}], "image_id": "287663"}, "703": {"caption": "a photo of a brown potted plant and a red dining table and a white chair and a red couch ", "segment": [{"bbox": [0.0390625, 0.08587822014051523, 0.2359375, 0.3622248243559719], "label": "a brown potted plant"}, {"bbox": [0.368921875, 0.6335362997658079, 0.626375, 0.8758782201405152], "label": "a red dining table"}, {"bbox": [0.66353125, 0.5119906323185012, 0.8123125, 0.7682669789227167], "label": "a white chair"}, {"bbox": [0.57965625, 0.5783372365339579, 0.9377656250000002, 0.9962060889929742], "label": "a red couch"}], "image_id": "471287"}, "704": {"caption": "a photo of a blue bowl and a black broccoli and a red cake and a black cake ", "segment": [{"bbox": [0.0, 0.0919375, 0.6778593749999999, 0.9890208333333333], "label": "a blue bowl"}, {"bbox": [0.0, 0.23145833333333332, 0.6091562500000001, 1.0], "label": "a black broccoli"}, {"bbox": [0.6891875, 0.6542708333333334, 1.0, 0.989875], "label": "a red cake"}, {"bbox": [0.660625, 0.23575, 0.9948125000000001, 0.7901458333333333], "label": "a black cake"}], "image_id": "379716"}, "705": {"caption": "a photo of a yellow potted plant and a black couch and a blue couch and a brown chair and a yellow dining table and a white chair ", "segment": [{"bbox": [0.150703125, 0.00234192037470726, 0.4274375, 0.16704918032786883], "label": "a yellow potted plant"}, {"bbox": [0.8264531249999999, 0.12042154566744731, 1.0, 0.9892505854800937], "label": "a black couch"}, {"bbox": [0.45814062499999997, 0.08395784543325527, 1.0, 0.5191569086651054], "label": "a blue couch"}, {"bbox": [0.0, 0.2614519906323185, 0.274296875, 0.7710772833723654], "label": "a brown chair"}, {"bbox": [0.0015625, 0.28295081967213115, 0.26373437499999997, 0.7841217798594847], "label": "a yellow dining table"}, {"bbox": [0.0, 0.04995316159250585, 0.16853125, 0.26756440281030447], "label": "a white chair"}], "image_id": "309044"}, "706": {"caption": "a photo of a blue giraffe and a red giraffe and a white giraffe and a blue giraffe and a black giraffe ", "segment": [{"bbox": [0.02378125, 0.31347417840375585, 0.5006875000000001, 1.0], "label": "a blue giraffe"}, {"bbox": [0.83315625, 0.8269718309859155, 1.0, 0.9887558685446011], "label": "a red giraffe"}, {"bbox": [0.45471874999999995, 0.417981220657277, 0.671609375, 0.9955164319248827], "label": "a white giraffe"}, {"bbox": [0.339546875, 0.3618075117370892, 0.5534375, 0.9865258215962441], "label": "a blue giraffe"}, {"bbox": [0.8481093749999999, 0.6406103286384977, 1.0, 0.8765492957746478], "label": "a black giraffe"}], "image_id": "172265"}, "707": {"caption": "a photo of a green broccoli and a blue pizza and a white dining table and a brown oven and a yellow broccoli and a white broccoli ", "segment": [{"bbox": [0.35052, 0.36413333333333336, 0.48202, 0.49965333333333334], "label": "a green broccoli"}, {"bbox": [0.00674, 0.05842666666666667, 0.9741599999999999, 0.97528], "label": "a blue pizza"}, {"bbox": [0.0016799999999999999, 0.0, 1.0, 0.98456], "label": "a white dining table"}, {"bbox": [0.0, 0.004773333333333333, 1.0, 0.9891733333333333], "label": "a brown oven"}, {"bbox": [0.62386, 0.22991999999999999, 0.75726, 0.40952], "label": "a yellow broccoli"}, {"bbox": [0.5225599999999999, 0.41832, 0.7345799999999999, 0.5898933333333334], "label": "a white broccoli"}], "image_id": "87414"}, "708": {"caption": "a photo of a blue book and a brown pizza and a white book and a black book and a green book and a green book ", "segment": [{"bbox": [0.511828125, 0.3070563674321503, 0.88771875, 0.5873277661795407], "label": "a blue book"}, {"bbox": [0.3010625, 0.588768267223382, 0.6340625, 0.8898956158663883], "label": "a brown pizza"}, {"bbox": [0.201078125, 0.21075156576200418, 0.4760625, 0.4058872651356994], "label": "a white book"}, {"bbox": [0.0018124999999999999, 0.4868475991649269, 0.25434375, 0.6713152400835073], "label": "a black book"}, {"bbox": [0.0, 0.5657620041753654, 0.24225, 0.7398538622129436], "label": "a green book"}, {"bbox": [0.445703125, 0.15281837160751566, 0.713125, 0.2808977035490606], "label": "a green book"}], "image_id": "371822"}, "709": {"caption": "a photo of a blue banana and a white banana and a brown banana and a yellow banana and a yellow banana and a black banana ", "segment": [{"bbox": [0.15709375, 0.19256250000000003, 0.40203125, 0.6632916666666666], "label": "a blue banana"}, {"bbox": [0.0, 0.33197916666666666, 0.2571875, 0.7335833333333334], "label": "a white banana"}, {"bbox": [0.638390625, 0.18562499999999998, 0.8852968750000001, 0.5864791666666667], "label": "a brown banana"}, {"bbox": [0.488765625, 0.20954166666666665, 0.6505625, 0.7713541666666667], "label": "a yellow banana"}, {"bbox": [0.36903125000000003, 0.2582916666666667, 0.51371875, 0.6476041666666668], "label": "a yellow banana"}, {"bbox": [0.6622656250000001, 0.55675, 0.8244687500000001, 0.7229583333333333], "label": "a black banana"}], "image_id": "349402"}, "710": {"caption": "a photo of a green banana and a brown banana and a white banana and a black cake ", "segment": [{"bbox": [0.30065624999999996, 0.5168544600938967, 0.502578125, 0.8651643192488263], "label": "a green banana"}, {"bbox": [0.12021875, 0.3442018779342723, 0.283578125, 0.6008450704225352], "label": "a brown banana"}, {"bbox": [0.47325, 0.2705868544600939, 0.628109375, 0.5505633802816902], "label": "a white banana"}, {"bbox": [0.0, 0.0018779342723004697, 0.9258906250000001, 0.9883802816901409], "label": "a black cake"}], "image_id": "321079"}, "711": {"caption": "a photo of a black dining table and a black wine glass and a white knife and a blue sandwich and a black wine glass and a yellow spoon ", "segment": [{"bbox": [0.0, 0.2798598130841122, 0.9978906249999999, 0.9444859813084112], "label": "a black dining table"}, {"bbox": [0.736609375, 0.07735981308411215, 0.936890625, 0.544392523364486], "label": "a black wine glass"}, {"bbox": [0.69434375, 0.46572429906542057, 0.919609375, 0.8189953271028036], "label": "a white knife"}, {"bbox": [0.061328125, 0.465303738317757, 0.33378125000000003, 0.6885981308411215], "label": "a blue sandwich"}, {"bbox": [0.58790625, 0.09822429906542056, 0.7165781250000001, 0.47460280373831776], "label": "a black wine glass"}, {"bbox": [0.0, 0.4292757009345794, 0.135421875, 0.6040420560747662], "label": "a yellow spoon"}], "image_id": "396224"}, "712": {"caption": "a photo of a blue broccoli and a brown carrot and a brown carrot and a blue carrot and a black carrot and a white carrot ", "segment": [{"bbox": [0.03764583333333334, 0.05575, 1.0, 0.403984375], "label": "a blue broccoli"}, {"bbox": [0.4874583333333333, 0.692265625, 0.7999791666666667, 0.9018125000000001], "label": "a brown carrot"}, {"bbox": [0.7335208333333333, 0.72775, 0.9483333333333334, 0.8663125], "label": "a brown carrot"}, {"bbox": [0.6497291666666667, 0.59878125, 0.8717083333333334, 0.729640625], "label": "a blue carrot"}, {"bbox": [0.26666666666666666, 0.6494375, 0.4015, 0.8427031249999999], "label": "a black carrot"}, {"bbox": [0.0006875000000000001, 0.7402656249999999, 0.16410416666666666, 0.88734375], "label": "a white carrot"}], "image_id": "557059"}, "713": {"caption": "a photo of a white vase and a red bird and a white potted plant and a blue bird ", "segment": [{"bbox": [0.34598240469208213, 0.41776562500000003, 0.5853958944281525, 0.6803125], "label": "a white vase"}, {"bbox": [0.09155425219941349, 0.48503125, 0.379208211143695, 0.617515625], "label": "a red bird"}, {"bbox": [0.09049853372434018, 0.024484375, 0.9140762463343108, 0.680640625], "label": "a white potted plant"}, {"bbox": [0.5398826979472141, 0.392390625, 0.9740762463343108, 0.63059375], "label": "a blue bird"}], "image_id": "567609"}, "714": {"caption": "a photo of a red horse and a white horse and a white cake and a blue horse and a blue horse ", "segment": [{"bbox": [0.22206, 0.5035542168674699, 0.35253999999999996, 0.6990361445783133], "label": "a red horse"}, {"bbox": [0.33127999999999996, 0.7311746987951807, 0.50122, 0.9483734939759036], "label": "a white horse"}, {"bbox": [0.00298, 0.06518072289156626, 1.0, 0.9887650602409638], "label": "a white cake"}, {"bbox": [0.25312, 0.3776807228915663, 0.3841, 0.5514156626506024], "label": "a blue horse"}, {"bbox": [0.24938, 0.3627710843373494, 0.37674, 0.4979819277108433], "label": "a blue horse"}], "image_id": "13605"}, "715": {"caption": "a photo of a blue car and a brown car and a brown motorcycle and a black truck ", "segment": [{"bbox": [0.0, 0.14945812807881773, 0.348, 0.3720689655172414], "label": "a blue car"}, {"bbox": [0.43284374999999997, 0.2466502463054187, 0.572078125, 0.3817980295566502], "label": "a brown car"}, {"bbox": [0.07112500000000001, 0.048423645320197044, 0.8804375, 0.9766748768472907], "label": "a brown motorcycle"}, {"bbox": [0.818984375, 0.2231527093596059, 0.997625, 0.584679802955665], "label": "a black truck"}], "image_id": "308276"}, "716": {"caption": "a photo of a black bowl and a green cup and a green bowl and a green apple and a brown orange and a blue carrot ", "segment": [{"bbox": [0.43782, 0.4369461077844311, 0.88314, 0.925688622754491], "label": "a black bowl"}, {"bbox": [0.34376, 0.004491017964071856, 0.7430599999999999, 0.5438323353293413], "label": "a green cup"}, {"bbox": [0.00598, 0.10760479041916167, 0.34072, 0.5885928143712575], "label": "a green bowl"}, {"bbox": [0.0, 0.5234730538922155, 0.23834, 0.9272155688622754], "label": "a green apple"}, {"bbox": [0.23026, 0.6012574850299401, 0.44115999999999994, 0.8823952095808384], "label": "a brown orange"}, {"bbox": [0.17148, 0.37488023952095806, 0.3245, 0.5289221556886228], "label": "a blue carrot"}], "image_id": "437789"}, "717": {"caption": "a photo of a blue truck and a green car and a red car and a black truck ", "segment": [{"bbox": [0.388453125, 0.09641666666666666, 0.7130000000000001, 0.6008958333333333], "label": "a blue truck"}, {"bbox": [0.0, 0.3811666666666667, 0.164796875, 0.57175], "label": "a green car"}, {"bbox": [0.0989375, 0.369875, 0.238328125, 0.5361666666666667], "label": "a red car"}, {"bbox": [0.28040625, 0.2781458333333333, 0.633453125, 0.7331041666666667], "label": "a black truck"}], "image_id": "19631"}, "718": {"caption": "a photo of a blue zebra and a black zebra and a white zebra and a green zebra and a brown zebra ", "segment": [{"bbox": [0.13274999999999998, 0.597125, 0.49021875000000004, 0.9273541666666667], "label": "a blue zebra"}, {"bbox": [0.464375, 0.5963541666666666, 0.59871875, 0.7494999999999999], "label": "a black zebra"}, {"bbox": [0.63475, 0.5708749999999999, 0.8100312500000001, 0.6984375], "label": "a white zebra"}, {"bbox": [0.6462343749999999, 0.5854791666666667, 0.8342031249999999, 0.7629999999999999], "label": "a green zebra"}, {"bbox": [0.259625, 0.681125, 0.7758593749999999, 0.8425208333333333], "label": "a brown zebra"}], "image_id": "456690"}, "719": {"caption": "a photo of a blue cup and a yellow broccoli and a brown bowl and a red dining table ", "segment": [{"bbox": [0.0, 0.00224, 0.20562, 0.2921333333333333], "label": "a blue cup"}, {"bbox": [0.00352, 0.07530666666666666, 0.46412, 0.8470666666666667], "label": "a yellow broccoli"}, {"bbox": [0.0, 0.6104, 0.18312, 0.9870133333333333], "label": "a brown bowl"}, {"bbox": [0.5649400000000001, 0.5844266666666666, 1.0, 0.9844266666666666], "label": "a red dining table"}], "image_id": "314412"}, "720": {"caption": "a photo of a brown sandwich and a brown sandwich and a green sandwich and a red sandwich and a blue bowl and a black bowl ", "segment": [{"bbox": [0.006734374999999999, 0.364046875, 0.62021875, 0.9887656249999999], "label": "a brown sandwich"}, {"bbox": [0.32809374999999996, 0.16404687499999998, 0.67640625, 0.507859375], "label": "a brown sandwich"}, {"bbox": [0.19239062499999998, 0.00021875000000000003, 0.6129687500000001, 0.27314062499999997], "label": "a green sandwich"}, {"bbox": [0.1114375, 0.5156562499999999, 0.30910937499999996, 0.8175156250000001], "label": "a red sandwich"}, {"bbox": [0.621078125, 0.004703125, 1.0, 0.31637499999999996], "label": "a blue bowl"}, {"bbox": [0.566296875, 0.364046875, 1.0, 0.986515625], "label": "a black bowl"}], "image_id": "497439"}, "721": {"caption": "a photo of a yellow toothbrush and a yellow knife and a white spoon and a yellow spoon and a blue wine glass and a brown cup ", "segment": [{"bbox": [0.32336000000000004, 0.45488, 0.66304, 0.6736266666666667], "label": "a yellow toothbrush"}, {"bbox": [0.6960599999999999, 0.4202133333333334, 0.84944, 0.7505600000000001], "label": "a yellow knife"}, {"bbox": [0.7471, 0.45165333333333335, 0.8922599999999999, 0.7321333333333334], "label": "a white spoon"}, {"bbox": [0.77634, 0.42002666666666666, 0.9245399999999999, 0.6713866666666666], "label": "a yellow spoon"}, {"bbox": [0.4428, 0.13045333333333334, 0.5696, 0.40741333333333335], "label": "a blue wine glass"}, {"bbox": [0.57304, 0.20450666666666667, 0.71966, 0.39549333333333336], "label": "a brown cup"}], "image_id": "217561"}, "722": {"caption": "a photo of a green bowl and a green orange and a green bowl and a green orange and a brown bowl and a green orange ", "segment": [{"bbox": [0.27464052287581703, 0.6291176470588234, 0.9412418300653594, 1.0], "label": "a green bowl"}, {"bbox": [0.3325816993464052, 0.5903267973856209, 0.8831535947712419, 0.907173202614379], "label": "a green orange"}, {"bbox": [0.30230392156862745, 0.4454411764705883, 0.7575980392156862, 0.6641993464052288], "label": "a green bowl"}, {"bbox": [0.329640522875817, 0.4114705882352941, 0.7447549019607843, 0.5849346405228758], "label": "a green orange"}, {"bbox": [0.5821732026143791, 0.3438235294117647, 0.9140359477124183, 0.5011111111111112], "label": "a brown bowl"}, {"bbox": [0.08950980392156863, 0.310718954248366, 0.42495098039215684, 0.46477124183006535], "label": "a green orange"}], "image_id": "485724"}, "723": {"caption": "a photo of a red toilet and a brown toilet and a black toilet and a blue toilet and a yellow toilet and a blue toilet ", "segment": [{"bbox": [0.0, 0.45581632653061227, 0.1775625, 0.9906377551020409], "label": "a red toilet"}, {"bbox": [0.015171875000000001, 0.22183673469387755, 0.5173125, 0.9876020408163265], "label": "a brown toilet"}, {"bbox": [0.321796875, 0.15354591836734693, 0.6995625000000001, 0.8134438775510204], "label": "a black toilet"}, {"bbox": [0.509140625, 0.1064795918367347, 0.8195937499999999, 0.6758928571428571], "label": "a blue toilet"}, {"bbox": [0.651046875, 0.07377551020408164, 0.929078125, 0.5771428571428572], "label": "a yellow toilet"}, {"bbox": [0.744640625, 0.04494897959183674, 0.995140625, 0.4831377551020409], "label": "a blue toilet"}], "image_id": "372894"}, "724": {"caption": "a photo of a brown toilet and a blue bowl and a yellow bowl and a black sink and a yellow sink and a green sink ", "segment": [{"bbox": [0.42576562500000004, 0.4425586854460094, 0.5621875000000001, 0.7353521126760563], "label": "a brown toilet"}, {"bbox": [0.7147187500000001, 0.6279812206572769, 0.8723750000000001, 0.8003755868544601], "label": "a blue bowl"}, {"bbox": [0.5503125, 0.6195070422535212, 0.701609375, 0.7818544600938968], "label": "a yellow bowl"}, {"bbox": [0.238671875, 0.2349530516431925, 0.45387500000000003, 0.4102112676056338], "label": "a black sink"}, {"bbox": [0.5586875, 0.2775821596244131, 0.8803906250000001, 0.5044131455399061], "label": "a yellow sink"}, {"bbox": [0.028859375, 0.3473708920187793, 0.15615625, 0.5102112676056338], "label": "a green sink"}], "image_id": "571804"}, "725": {"caption": "a photo of a green laptop and a white keyboard and a black book and a blue tv and a red tv ", "segment": [{"bbox": [0.36825, 0.4831041666666666, 0.7010156249999999, 0.88175], "label": "a green laptop"}, {"bbox": [0.004015625, 0.6713541666666667, 0.34045312499999997, 0.824875], "label": "a white keyboard"}, {"bbox": [0.10785937500000001, 0.7752708333333334, 0.338765625, 0.9707916666666667], "label": "a black book"}, {"bbox": [0.0, 0.2929791666666667, 0.345703125, 0.6627708333333333], "label": "a blue tv"}, {"bbox": [0.378171875, 0.49075, 0.666578125, 0.7309375], "label": "a red tv"}], "image_id": "245664"}, "726": {"caption": "a photo of a white bowl and a yellow apple and a blue orange and a black orange and a yellow orange and a yellow banana ", "segment": [{"bbox": [0.05853125, 0.3446135831381733, 0.9487343750000001, 1.0], "label": "a white bowl"}, {"bbox": [0.22134375, 0.37800936768149884, 0.5498125, 0.8588758782201406], "label": "a yellow apple"}, {"bbox": [0.5447656249999999, 0.5756206088992974, 0.792921875, 0.9223419203747073], "label": "a blue orange"}, {"bbox": [0.597890625, 0.3886182669789227, 0.862703125, 0.7009367681498829], "label": "a black orange"}, {"bbox": [0.10882812500000001, 0.3705620608899297, 0.309140625, 0.7275409836065573], "label": "a yellow orange"}, {"bbox": [0.05546875, 0.8292037470725995, 0.19190625, 0.9752693208430914], "label": "a yellow banana"}], "image_id": "192871"}, "727": {"caption": "a photo of a brown bowl and a brown laptop and a green chair and a green book and a brown book and a black book ", "segment": [{"bbox": [0.07484375, 0.5900833333333334, 0.22303125000000001, 0.7485416666666667], "label": "a brown bowl"}, {"bbox": [0.39775, 0.2876458333333333, 0.6927031250000001, 0.6876458333333333], "label": "a brown laptop"}, {"bbox": [0.512546875, 0.8715833333333334, 0.908078125, 1.0], "label": "a green chair"}, {"bbox": [0.795015625, 0.5048333333333334, 0.99840625, 0.8205416666666667], "label": "a green book"}, {"bbox": [0.73196875, 0.5012916666666667, 0.9855, 0.6493958333333334], "label": "a brown book"}, {"bbox": [0.164609375, 0.4902916666666667, 0.427890625, 0.7607499999999999], "label": "a black book"}], "image_id": "9527"}, "728": {"caption": "a photo of a yellow bottle and a yellow sandwich and a yellow sandwich and a yellow cup and a red bowl ", "segment": [{"bbox": [0.054953125000000005, 0.2338333333333333, 0.18265625000000002, 0.4019375], "label": "a yellow bottle"}, {"bbox": [0.34515625, 0.38512500000000005, 0.611765625, 0.6849583333333332], "label": "a yellow sandwich"}, {"bbox": [0.4899375, 0.29552083333333334, 0.729859375, 0.5751666666666666], "label": "a yellow sandwich"}, {"bbox": [0.0, 0.3914375, 0.248140625, 0.7870833333333332], "label": "a yellow cup"}, {"bbox": [0.11309374999999999, 0.116875, 0.40368750000000003, 0.417], "label": "a red bowl"}], "image_id": "463527"}, "729": {"caption": "a photo of a blue umbrella and a green chair and a green chair and a white chair and a brown umbrella and a brown chair ", "segment": [{"bbox": [0.22889062500000001, 0.0, 0.793765625, 0.998], "label": "a blue umbrella"}, {"bbox": [0.5561875, 0.6337083333333333, 0.7550625, 0.9842708333333334], "label": "a green chair"}, {"bbox": [0.059250000000000004, 0.65125, 0.26242187499999997, 0.9898333333333333], "label": "a green chair"}, {"bbox": [0.839265625, 0.6331249999999999, 0.994515625, 0.9735208333333333], "label": "a white chair"}, {"bbox": [0.0, 0.03370833333333333, 0.185390625, 0.31235416666666665], "label": "a brown umbrella"}, {"bbox": [0.315171875, 0.6555, 0.466859375, 0.9723541666666667], "label": "a brown chair"}], "image_id": "429505"}, "730": {"caption": "a photo of a brown dining table and a white sandwich and a green sandwich and a white sandwich and a green cup and a blue cup ", "segment": [{"bbox": [0.006296875, 0.06352803738317757, 0.996046875, 0.9858878504672897], "label": "a brown dining table"}, {"bbox": [0.590609375, 0.2805140186915888, 0.874640625, 0.6490654205607477], "label": "a white sandwich"}, {"bbox": [0.556046875, 0.5983177570093458, 0.81603125, 0.9691121495327102], "label": "a green sandwich"}, {"bbox": [0.35465625, 0.4539252336448598, 0.6161562500000001, 0.8022429906542057], "label": "a white sandwich"}, {"bbox": [0.79259375, 0.10144859813084113, 0.99790625, 0.48936915887850463], "label": "a green cup"}, {"bbox": [0.455796875, 0.0, 0.668390625, 0.2419859813084112], "label": "a blue cup"}], "image_id": "302555"}, "731": {"caption": "a photo of a red clock and a white chair and a brown chair and a green dining table and a black chair and a red book ", "segment": [{"bbox": [0.29596100278551535, 0.270375, 0.48916434540389975, 0.399234375], "label": "a red clock"}, {"bbox": [0.003983286908077995, 0.538, 0.24381615598885795, 0.86984375], "label": "a white chair"}, {"bbox": [0.45935933147632313, 0.497640625, 0.7652924791086351, 0.76821875], "label": "a brown chair"}, {"bbox": [0.0006128133704735376, 0.5180625, 0.6993036211699165, 0.77253125], "label": "a green dining table"}, {"bbox": [0.0, 0.543828125, 0.15966573816155988, 0.737359375], "label": "a black chair"}, {"bbox": [0.6852367688022284, 0.2078125, 0.9972144846796658, 0.7], "label": "a red book"}], "image_id": "519598"}, "732": {"caption": "a photo of a blue kite and a white kite and a red kite and a blue kite and a brown kite ", "segment": [{"bbox": [0.64734375, 0.31754166666666667, 0.850625, 0.500125], "label": "a blue kite"}, {"bbox": [0.46643749999999995, 0.7439583333333334, 0.7886249999999999, 0.9220416666666668], "label": "a white kite"}, {"bbox": [0.62603125, 0.2876458333333333, 0.841359375, 0.5150208333333333], "label": "a red kite"}, {"bbox": [0.35603125, 0.6513333333333333, 0.5069531250000001, 0.8073333333333333], "label": "a blue kite"}, {"bbox": [0.040625, 0.0, 0.9984375, 0.91875], "label": "a brown kite"}], "image_id": "451859"}, "733": {"caption": "a photo of a red banana and a red banana and a blue banana and a brown orange and a yellow cup and a brown bowl ", "segment": [{"bbox": [0.5331862745098039, 0.25026143790849675, 0.6630882352941176, 0.6787581699346404], "label": "a red banana"}, {"bbox": [0.5867320261437908, 0.1934967320261438, 0.9114052287581699, 0.6693300653594771], "label": "a red banana"}, {"bbox": [0.3935294117647059, 0.6701960784313726, 0.6895261437908496, 0.8443137254901961], "label": "a blue banana"}, {"bbox": [0.6228104575163399, 0.7924019607843137, 0.8103431372549019, 0.9771241830065359], "label": "a brown orange"}, {"bbox": [0.0, 0.7053758169934641, 0.20179738562091504, 1.0], "label": "a yellow cup"}, {"bbox": [0.36936274509803924, 0.6801797385620915, 0.9954901960784314, 0.9887418300653595], "label": "a brown bowl"}], "image_id": "35368"}, "734": {"caption": "a photo of a black bench and a green bench and a white bench and a blue bench and a yellow bench and a red bench ", "segment": [{"bbox": [0.38340625, 0.43945833333333334, 0.89125, 0.9887916666666666], "label": "a black bench"}, {"bbox": [0.27134375, 0.42472916666666666, 0.707859375, 0.8404583333333334], "label": "a green bench"}, {"bbox": [0.204765625, 0.41052083333333333, 0.6555625, 0.7448541666666666], "label": "a white bench"}, {"bbox": [0.15687500000000001, 0.4005, 0.46282812500000003, 0.656375], "label": "a blue bench"}, {"bbox": [0.12253125000000001, 0.3878333333333333, 0.42992187499999995, 0.6112083333333334], "label": "a yellow bench"}, {"bbox": [0.10084375000000001, 0.38164583333333335, 0.38679687500000004, 0.5685833333333333], "label": "a red bench"}], "image_id": "455325"}, "735": {"caption": "a photo of a white apple and a green apple and a blue orange and a green apple and a white apple and a brown orange ", "segment": [{"bbox": [0.39503512880562064, 0.5671875, 0.7381967213114755, 0.76915625], "label": "a white apple"}, {"bbox": [0.36594847775175643, 0.212984375, 0.6462529274004684, 0.42078125], "label": "a green apple"}, {"bbox": [0.7459250585480094, 0.714375, 1.0, 0.932515625], "label": "a blue orange"}, {"bbox": [0.2768384074941452, 0.400359375, 0.5719906323185012, 0.5850781250000001], "label": "a green apple"}, {"bbox": [0.08133489461358313, 0.277859375, 0.37381733021077285, 0.45125000000000004], "label": "a white apple"}, {"bbox": [0.42969555035128804, 0.850984375, 0.7459016393442623, 1.0], "label": "a brown orange"}], "image_id": "177449"}, "736": {"caption": "a photo of a green couch and a red chair and a red chair and a red couch and a green dining table ", "segment": [{"bbox": [0.648625, 0.5741959798994974, 0.999015625, 0.9892462311557789], "label": "a green couch"}, {"bbox": [0.040234375, 0.6105276381909548, 0.24640625, 0.913391959798995], "label": "a red chair"}, {"bbox": [0.245796875, 0.5804522613065327, 0.37473437499999995, 0.9173869346733668], "label": "a red chair"}, {"bbox": [0.00134375, 0.8044472361809045, 0.21398437500000003, 0.985100502512563], "label": "a red couch"}, {"bbox": [0.082140625, 0.6096733668341708, 0.335875, 0.9233417085427136], "label": "a green dining table"}], "image_id": "457986"}, "737": {"caption": "a photo of a blue banana and a yellow banana and a black banana and a yellow banana and a green banana and a green banana ", "segment": [{"bbox": [0.5604375, 0.36, 1.0, 0.9882435597189696], "label": "a blue banana"}, {"bbox": [0.65371875, 0.394847775175644, 0.9439375, 0.7939578454332552], "label": "a yellow banana"}, {"bbox": [0.629515625, 0.5929508196721311, 0.965453125, 0.9058782201405152], "label": "a black banana"}, {"bbox": [0.51334375, 0.2823419203747073, 0.711140625, 0.8023419203747073], "label": "a yellow banana"}, {"bbox": [0.811125, 0.34992974238875874, 1.0, 0.6600468384074941], "label": "a green banana"}, {"bbox": [0.5290468749999999, 0.7811709601873537, 0.7221249999999999, 0.9882435597189696], "label": "a green banana"}], "image_id": "209441"}, "738": {"caption": "a photo of a red cell phone and a blue cell phone and a yellow cell phone and a red cell phone and a brown cell phone and a brown cell phone ", "segment": [{"bbox": [0.5114375, 0.4960421545667447, 0.7967187499999999, 0.7519672131147541], "label": "a red cell phone"}, {"bbox": [0.19640625, 0.07416861826697893, 0.3868125, 0.49887587822014046], "label": "a blue cell phone"}, {"bbox": [0.380953125, 0.27421545667447306, 0.585375, 0.6637939110070258], "label": "a yellow cell phone"}, {"bbox": [0.5716249999999999, 0.6549414519906324, 0.9434374999999999, 0.9752693208430915], "label": "a red cell phone"}, {"bbox": [0.051859375, 0.15833723653395784, 0.33185937499999996, 0.8111943793911007], "label": "a brown cell phone"}, {"bbox": [0.65159375, 0.018173302107728335, 0.8214218750000001, 0.5350585480093677], "label": "a brown cell phone"}], "image_id": "30210"}, "739": {"caption": "a photo of a red bowl and a black bowl and a yellow keyboard and a yellow book and a yellow tv ", "segment": [{"bbox": [0.0005468749999999999, 0.25018779342723, 0.14003125, 0.43408450704225354], "label": "a red bowl"}, {"bbox": [0.131328125, 0.11434272300469484, 0.27759375, 0.32286384976525817], "label": "a black bowl"}, {"bbox": [0.27728125000000003, 0.041056338028169014, 0.804, 0.3922065727699531], "label": "a yellow keyboard"}, {"bbox": [0.09879687499999999, 0.2174413145539906, 0.84590625, 0.9856807511737089], "label": "a yellow book"}, {"bbox": [0.731328125, 0.0, 0.999296875, 0.6], "label": "a yellow tv"}], "image_id": "381257"}, "740": {"caption": "a photo of a brown donut and a black donut and a white donut and a blue donut and a red donut and a red donut ", "segment": [{"bbox": [0.7359375, 0.4455208333333333, 0.937703125, 0.6480416666666666], "label": "a brown donut"}, {"bbox": [0.45090624999999995, 0.5574375, 0.639203125, 0.7460833333333333], "label": "a black donut"}, {"bbox": [0.309046875, 0.49324999999999997, 0.47689062499999996, 0.6918124999999999], "label": "a white donut"}, {"bbox": [0.519703125, 0.42433333333333334, 0.68928125, 0.5891458333333334], "label": "a blue donut"}, {"bbox": [0.769453125, 0.32575000000000004, 0.9467343749999999, 0.47933333333333333], "label": "a red donut"}, {"bbox": [0.58128125, 0.29791666666666666, 0.727171875, 0.43822916666666667], "label": "a red donut"}], "image_id": "394334"}, "741": {"caption": "a photo of a green dining table and a black bowl and a yellow cup and a brown knife and a black sandwich and a black cup ", "segment": [{"bbox": [0.0031406249999999998, 0.18116822429906543, 1.0, 0.9976401869158878], "label": "a green dining table"}, {"bbox": [0.573859375, 0.5305841121495327, 0.8706250000000001, 0.8301869158878504], "label": "a black bowl"}, {"bbox": [0.539515625, 0.04495327102803738, 0.710828125, 0.4696728971962617], "label": "a yellow cup"}, {"bbox": [0.124171875, 0.6937383177570093, 0.41590625000000003, 0.8659813084112149], "label": "a brown knife"}, {"bbox": [0.22440625, 0.36485981308411214, 0.40393749999999995, 0.5125233644859813], "label": "a black sandwich"}, {"bbox": [0.726265625, 0.38724299065420564, 0.8581406250000001, 0.5483644859813084], "label": "a black cup"}], "image_id": "64307"}, "742": {"caption": "a photo of a blue potted plant and a black potted plant and a yellow potted plant and a white bench and a yellow bench ", "segment": [{"bbox": [0.8217968750000001, 0.29818396226415095, 0.9974687500000001, 0.7071698113207547], "label": "a blue potted plant"}, {"bbox": [0.0059375, 0.484316037735849, 0.285203125, 0.9865566037735848], "label": "a black potted plant"}, {"bbox": [0.448265625, 0.002783018867924528, 0.6233124999999999, 0.49742924528301885], "label": "a yellow potted plant"}, {"bbox": [0.09209375, 0.29370283018867926, 0.54296875, 0.6147405660377357], "label": "a white bench"}, {"bbox": [0.2026875, 0.4593396226415094, 0.5415468750000001, 0.7290094339622643], "label": "a yellow bench"}], "image_id": "424258"}, "743": {"caption": "a photo of a green dining table and a yellow spoon and a brown pizza and a blue pizza and a red chair and a white fork ", "segment": [{"bbox": [0.0031406249999999998, 0.10741666666666667, 0.9983124999999999, 0.965625], "label": "a green dining table"}, {"bbox": [0.78834375, 0.54825, 1.0, 1.0], "label": "a yellow spoon"}, {"bbox": [0.0033750000000000004, 0.7123541666666667, 0.32021875, 0.8786458333333333], "label": "a brown pizza"}, {"bbox": [0.510671875, 0.6876458333333333, 0.7921406249999999, 0.8584166666666666], "label": "a blue pizza"}, {"bbox": [0.65940625, 0.0005833333333333334, 0.8606718749999999, 0.12808333333333335], "label": "a red chair"}, {"bbox": [0.8143437499999999, 0.48622916666666666, 0.9481562499999999, 0.6653125], "label": "a white fork"}], "image_id": "570465"}, "744": {"caption": "a photo of a blue car and a white car and a brown train and a brown truck and a brown truck ", "segment": [{"bbox": [0.23907812499999997, 0.549088785046729, 0.515265625, 0.8741355140186916], "label": "a blue car"}, {"bbox": [0.0, 0.6179672897196262, 0.23743750000000002, 0.9887616822429907], "label": "a white car"}, {"bbox": [0.33073437499999997, 0.39219626168224303, 0.9539687499999999, 0.563785046728972], "label": "a brown train"}, {"bbox": [0.392140625, 0.4075700934579439, 0.622671875, 0.7482943925233645], "label": "a brown truck"}, {"bbox": [0.0, 0.3355841121495327, 0.216890625, 0.7469626168224299], "label": "a brown truck"}], "image_id": "129957"}, "745": {"caption": "a photo of a green bottle and a blue dining table and a brown dining table and a black bowl and a white chair and a brown potted plant ", "segment": [{"bbox": [0.09697916666666666, 0.0, 0.4848541666666667, 1.0], "label": "a green bottle"}, {"bbox": [0.0, 0.593265625, 0.794, 0.986515625], "label": "a blue dining table"}, {"bbox": [0.5304583333333334, 0.36, 1.0, 0.9852343749999999], "label": "a brown dining table"}, {"bbox": [0.5567291666666667, 0.44932812499999997, 0.9969583333333334, 0.7107187500000001], "label": "a black bowl"}, {"bbox": [0.6652291666666666, 0.113984375, 1.0, 0.372046875], "label": "a white chair"}, {"bbox": [0.0, 0.095515625, 0.18235416666666668, 0.362328125], "label": "a brown potted plant"}], "image_id": "471861"}, "746": {"caption": "a photo of a red boat and a brown boat and a white boat and a red boat and a white boat and a brown boat ", "segment": [{"bbox": [0.112453125, 0.6532552693208431, 0.373328125, 0.8105620608899298], "label": "a red boat"}, {"bbox": [0.71875, 0.4570257611241218, 1.0, 0.7675644028103045], "label": "a brown boat"}, {"bbox": [0.34034375, 0.8426932084309133, 0.87559375, 0.9887587822014051], "label": "a white boat"}, {"bbox": [0.423453125, 0.434519906323185, 0.56584375, 0.5785714285714285], "label": "a red boat"}, {"bbox": [0.027125, 0.4129976580796253, 0.205265625, 0.5502810304449649], "label": "a white boat"}, {"bbox": [0.7815000000000001, 0.2781264637002342, 0.9907343750000001, 0.44971896955503515], "label": "a brown boat"}], "image_id": "544104"}, "747": {"caption": "a photo of a brown wine glass and a green wine glass and a yellow wine glass and a green wine glass and a blue wine glass ", "segment": [{"bbox": [0.217390625, 0.07818750000000001, 0.513375, 1.0], "label": "a brown wine glass"}, {"bbox": [0.4729375, 0.1501875, 0.751765625, 0.9878333333333332], "label": "a green wine glass"}, {"bbox": [0.6388281250000001, 0.18822916666666664, 0.931765625, 0.9882291666666667], "label": "a yellow wine glass"}, {"bbox": [0.8239375000000001, 0.23145833333333332, 1.0, 1.0], "label": "a green wine glass"}, {"bbox": [0.0017656249999999998, 0.0035416666666666665, 0.23348437500000002, 0.9870208333333333], "label": "a blue wine glass"}], "image_id": "48358"}, "748": {"caption": "a photo of a black potted plant and a red potted plant and a brown potted plant and a white potted plant and a black cat ", "segment": [{"bbox": [0.512984375, 0.3312708333333333, 0.887140625, 0.9881458333333334], "label": "a black potted plant"}, {"bbox": [0.701859375, 0.028833333333333332, 1.0, 0.8142708333333333], "label": "a red potted plant"}, {"bbox": [0.166859375, 0.02304166666666667, 0.38090625000000006, 0.3983125], "label": "a brown potted plant"}, {"bbox": [0.003359375, 0.12241666666666666, 0.380046875, 0.6201875], "label": "a white potted plant"}, {"bbox": [0.32832812499999997, 0.39829166666666665, 0.6019375, 0.5957083333333333], "label": "a black cat"}], "image_id": "380117"}, "749": {"caption": "a photo of a white baseball bat and a blue baseball bat and a green baseball bat and a brown baseball bat and a blue sports ball ", "segment": [{"bbox": [0.678015625, 0.28764018691588783, 0.867375, 0.4645560747663551], "label": "a white baseball bat"}, {"bbox": [0.196953125, 0.26196261682242994, 0.38703125, 0.452126168224299], "label": "a blue baseball bat"}, {"bbox": [0.23704687500000002, 0.21584112149532708, 0.40501562500000005, 0.4435514018691588], "label": "a green baseball bat"}, {"bbox": [0.2765625, 0.29205607476635514, 0.8875, 0.7780373831775701], "label": "a brown baseball bat"}, {"bbox": [0.440625, 0.4719626168224299, 0.5828125, 0.927570093457944], "label": "a blue sports ball"}], "image_id": "486788"}, "750": {"caption": "a photo of a yellow car and a blue bus and a red bicycle and a brown truck and a red cow ", "segment": [{"bbox": [0.31496875, 0.45182692307692307, 0.50603125, 0.6914663461538461], "label": "a yellow car"}, {"bbox": [0.0, 0.3125, 0.393046875, 0.5379086538461538], "label": "a blue bus"}, {"bbox": [0.7893749999999999, 0.5092067307692308, 0.960421875, 0.7947836538461538], "label": "a red bicycle"}, {"bbox": [0.4849375, 0.23819711538461538, 0.82090625, 0.7415625], "label": "a brown truck"}, {"bbox": [0.49609375, 0.4730528846153846, 0.628140625, 0.8198557692307692], "label": "a red cow"}], "image_id": "356612"}, "751": {"caption": "a photo of a green car and a blue truck and a blue truck and a white truck and a green truck ", "segment": [{"bbox": [0.3745625, 0.6269597069597069, 0.6576562499999999, 0.9046153846153845], "label": "a green car"}, {"bbox": [0.324, 0.44494505494505493, 0.6000625, 0.7528205128205128], "label": "a blue truck"}, {"bbox": [0.001921875, 0.12135531135531137, 0.321125, 0.9101098901098902], "label": "a blue truck"}, {"bbox": [0.58496875, 0.4521245421245422, 0.738609375, 0.7116117216117217], "label": "a white truck"}, {"bbox": [0.737140625, 0.08091575091575091, 0.9997812500000001, 0.9326007326007326], "label": "a green truck"}], "image_id": "306693"}, "752": {"caption": "a photo of a blue chair and a blue microwave and a brown oven and a red chair and a white dining table ", "segment": [{"bbox": [0.36646875, 0.546056338028169, 0.6461875, 0.9797652582159624], "label": "a blue chair"}, {"bbox": [0.6506093749999999, 0.20816901408450705, 0.8356562499999999, 0.377981220657277], "label": "a blue microwave"}, {"bbox": [0.6228906249999999, 0.5316197183098591, 0.8626249999999999, 0.9572535211267604], "label": "a brown oven"}, {"bbox": [0.03621875, 0.6039201877934272, 0.374203125, 0.9873474178403756], "label": "a red chair"}, {"bbox": [0.0017343750000000002, 0.5376525821596244, 0.624125, 0.7168779342723004], "label": "a white dining table"}], "image_id": "390184"}, "753": {"caption": "a photo of a green hot dog and a green knife and a black pizza and a green pizza and a white dining table ", "segment": [{"bbox": [0.224, 0.42346874999999995, 0.7946666666666666, 0.73146875], "label": "a green hot dog"}, {"bbox": [0.25814583333333335, 0.25696875, 0.39089583333333333, 0.427421875], "label": "a green knife"}, {"bbox": [0.533125, 0.57384375, 0.80575, 0.771375], "label": "a black pizza"}, {"bbox": [0.17379166666666668, 0.415046875, 0.8838958333333334, 0.788078125], "label": "a green pizza"}, {"bbox": [0.0, 0.790578125, 1.0, 0.987890625], "label": "a white dining table"}], "image_id": "157883"}, "754": {"caption": "a photo of a yellow chair and a green chair and a green chair and a black oven and a white potted plant ", "segment": [{"bbox": [0.09859375000000001, 0.6347083333333334, 0.349140625, 0.9902916666666667], "label": "a yellow chair"}, {"bbox": [0.342078125, 0.6233333333333333, 0.587796875, 0.9830833333333333], "label": "a green chair"}, {"bbox": [0.00228125, 0.6629791666666667, 0.12904687499999998, 1.0], "label": "a green chair"}, {"bbox": [0.537640625, 0.5370833333333334, 0.67753125, 0.80675], "label": "a black oven"}, {"bbox": [0.011515625, 0.5055, 0.15065625, 0.6612083333333333], "label": "a white potted plant"}], "image_id": "34445"}, "755": {"caption": "a photo of a blue chair and a green suitcase and a black suitcase and a black tv and a blue tv ", "segment": [{"bbox": [0.45731249999999996, 0.660671875, 0.86175, 0.99009375], "label": "a blue chair"}, {"bbox": [0.44525, 0.382078125, 0.8682708333333333, 0.776453125], "label": "a green suitcase"}, {"bbox": [0.4404583333333333, 0.132203125, 0.8359583333333334, 0.39064062499999996], "label": "a black suitcase"}, {"bbox": [0.00016666666666666666, 0.276421875, 0.22877083333333334, 0.47768750000000004], "label": "a black tv"}, {"bbox": [0.23070833333333332, 0.26965625000000004, 0.4644166666666667, 0.4382031250000001], "label": "a blue tv"}], "image_id": "309424"}, "756": {"caption": "a photo of a white elephant and a white elephant and a yellow elephant and a yellow elephant and a black elephant ", "segment": [{"bbox": [0.003, 0.2, 0.35682812499999994, 0.9887587822014052], "label": "a white elephant"}, {"bbox": [0.303546875, 0.23311475409836066, 0.712265625, 0.9177985948477753], "label": "a white elephant"}, {"bbox": [0.3913125, 0.13482435597189696, 0.8695937499999999, 0.33257611241217794], "label": "a yellow elephant"}, {"bbox": [0.671609375, 0.28667447306791566, 1.0, 0.6825526932084309], "label": "a yellow elephant"}, {"bbox": [0.632, 0.08206088992974239, 0.958921875, 0.29950819672131146], "label": "a black elephant"}], "image_id": "28449"}, "757": {"caption": "a photo of a black potted plant and a red giraffe and a yellow zebra and a blue zebra and a black potted plant ", "segment": [{"bbox": [0.27690625, 0.24981515711645103, 0.6070781249999999, 0.9327726432532347], "label": "a black potted plant"}, {"bbox": [0.07053125, 0.4147689463955637, 0.32310937500000003, 0.9417190388170055], "label": "a red giraffe"}, {"bbox": [0.59121875, 0.17859519408502775, 0.8432187499999999, 0.9148243992606285], "label": "a yellow zebra"}, {"bbox": [0.328625, 0.19101663585951942, 0.57746875, 0.912365988909427], "label": "a blue zebra"}, {"bbox": [0.49071875, 0.31933456561922363, 0.7255312500000001, 0.9321072088724583], "label": "a black potted plant"}], "image_id": "79469"}, "758": {"caption": "a photo of a blue sheep and a green sheep and a green sheep and a brown sheep and a green sheep ", "segment": [{"bbox": [0.21353125, 0.23429629629629628, 0.46828125, 0.8707407407407407], "label": "a blue sheep"}, {"bbox": [0.0, 0.23011111111111113, 0.2549375, 0.7978518518518518], "label": "a green sheep"}, {"bbox": [0.5506562500000001, 0.19603703703703704, 0.741609375, 0.8065925925925926], "label": "a green sheep"}, {"bbox": [0.63053125, 0.5357777777777778, 0.9041562500000001, 0.9023703703703703], "label": "a brown sheep"}, {"bbox": [0.723984375, 0.27525925925925926, 0.9807500000000001, 0.9763333333333334], "label": "a green sheep"}], "image_id": "410097"}, "759": {"caption": "a photo of a black car and a red car and a red car and a brown car and a yellow giraffe ", "segment": [{"bbox": [0.45740625, 0.32577083333333334, 1.0, 1.0], "label": "a black car"}, {"bbox": [0.0016875000000000002, 0.48764583333333333, 0.20562500000000003, 0.9842708333333333], "label": "a red car"}, {"bbox": [0.138203125, 0.6465, 0.27303125, 0.9701041666666667], "label": "a red car"}, {"bbox": [0.22985937500000003, 0.6468333333333334, 0.40707812500000007, 0.8137291666666667], "label": "a brown car"}, {"bbox": [0.23756249999999998, 0.05739583333333333, 0.6283125, 0.9988541666666666], "label": "a yellow giraffe"}], "image_id": "540694"}, "760": {"caption": "a photo of a blue dining table and a blue wine glass and a blue pizza and a blue pizza and a black pizza ", "segment": [{"bbox": [0.0, 0.0016875000000000002, 0.9923831775700935, 0.9881562500000001], "label": "a blue dining table"}, {"bbox": [0.24154205607476634, 0.00153125, 0.733714953271028, 0.34993749999999996], "label": "a blue wine glass"}, {"bbox": [0.0522196261682243, 0.540484375, 0.5266588785046729, 0.8666562500000001], "label": "a blue pizza"}, {"bbox": [0.29906542056074764, 0.32359375, 0.9980140186915887, 0.6427031249999999], "label": "a blue pizza"}, {"bbox": [0.4909813084112149, 0.6511250000000001, 0.9886214953271028, 0.967390625], "label": "a black pizza"}], "image_id": "508443"}, "761": {"caption": "a photo of a white banana and a yellow toaster and a yellow bowl and a blue bowl and a green oven ", "segment": [{"bbox": [0.63746875, 0.43964583333333335, 0.8572968750000001, 0.5857083333333333], "label": "a white banana"}, {"bbox": [0.2280625, 0.3962291666666667, 0.4606875, 0.6664375], "label": "a yellow toaster"}, {"bbox": [0.2396875, 0.6158333333333333, 0.381484375, 0.7611875], "label": "a yellow bowl"}, {"bbox": [0.662546875, 0.5129375, 0.9118749999999999, 0.6603958333333334], "label": "a blue bowl"}, {"bbox": [0.8493437500000001, 0.6675416666666667, 1.0, 1.0], "label": "a green oven"}], "image_id": "11360"}, "762": {"caption": "a photo of a green sheep and a white sheep and a yellow sheep and a brown sheep and a green sheep ", "segment": [{"bbox": [0.13284374999999998, 0.3626875, 0.286546875, 0.5953541666666666], "label": "a green sheep"}, {"bbox": [0.3041875, 0.2826875, 0.49703125000000004, 0.5684791666666666], "label": "a white sheep"}, {"bbox": [0.493546875, 0.36952083333333335, 0.62840625, 0.5096875], "label": "a yellow sheep"}, {"bbox": [0.432265625, 0.3978541666666667, 0.7645156249999999, 0.8473125], "label": "a brown sheep"}, {"bbox": [0.5580625, 0.5978541666666667, 0.8080625000000001, 0.8279583333333334], "label": "a green sheep"}], "image_id": "579885"}, "763": {"caption": "a photo of a yellow cup and a red bowl and a black bowl and a black bowl and a green dining table ", "segment": [{"bbox": [0.49271875, 0.022416666666666665, 0.6642343749999999, 0.28027083333333336], "label": "a yellow cup"}, {"bbox": [0.0016875000000000002, 0.22860416666666666, 0.33615625000000005, 0.6722916666666666], "label": "a red bowl"}, {"bbox": [0.6731874999999999, 0.18910416666666666, 0.8714375000000001, 0.3945625], "label": "a black bowl"}, {"bbox": [0.0874375, 0.0, 0.41704687499999993, 0.33541666666666664], "label": "a black bowl"}, {"bbox": [0.0, 0.0, 1.0, 1.0], "label": "a green dining table"}], "image_id": "22446"}, "764": {"caption": "a photo of a white couch and a white chair and a red dining table and a blue couch and a black chair ", "segment": [{"bbox": [0.322609375, 0.5532426778242677, 0.6525624999999999, 0.8222803347280334], "label": "a white couch"}, {"bbox": [0.51571875, 0.6602510460251046, 0.72471875, 1.0], "label": "a white chair"}, {"bbox": [0.73809375, 0.6964644351464435, 0.9981718749999999, 1.0], "label": "a red dining table"}, {"bbox": [0.00671875, 0.5691004184100418, 0.261828125, 0.8073012552301255], "label": "a blue couch"}, {"bbox": [0.711796875, 0.6729497907949791, 0.839671875, 0.9629497907949791], "label": "a black chair"}], "image_id": "556516"}, "765": {"caption": "a photo of a white chair and a white couch and a green couch and a black dining table and a blue chair ", "segment": [{"bbox": [0.74721875, 0.5957042253521126, 0.8889375000000002, 0.9591314553990611], "label": "a white chair"}, {"bbox": [0.004296875, 0.6232863849765258, 0.42084374999999996, 0.9888967136150234], "label": "a white couch"}, {"bbox": [0.04365625, 0.4913615023474178, 0.212921875, 0.7131455399061033], "label": "a green couch"}, {"bbox": [0.6979375, 0.5292957746478874, 0.9682656250000001, 0.9150469483568076], "label": "a black dining table"}, {"bbox": [0.04321875, 0.4889671361502348, 0.214390625, 0.7045539906103286], "label": "a blue chair"}], "image_id": "326082"}, "766": {"caption": "a photo of a green umbrella and a yellow umbrella and a brown umbrella and a red umbrella and a brown umbrella ", "segment": [{"bbox": [0.42932812499999995, 0.5327400468384075, 0.728515625, 0.7748946135831382], "label": "a green umbrella"}, {"bbox": [0.776453125, 0.5505854800936768, 0.9577187500000001, 0.6933489461358314], "label": "a yellow umbrella"}, {"bbox": [0.6315000000000001, 0.5396252927400468, 0.82403125, 0.6882903981264636], "label": "a brown umbrella"}, {"bbox": [0.22165625000000003, 0.540632318501171, 0.43603125, 0.6705386416861826], "label": "a red umbrella"}, {"bbox": [0.026984374999999998, 0.5393208430913349, 0.24739062500000003, 0.7393208430913348], "label": "a brown umbrella"}], "image_id": "9707"}, "767": {"caption": "a photo of a black sandwich and a blue dining table and a yellow knife and a green fork and a black cup ", "segment": [{"bbox": [0.0, 0.13034375, 0.9677916666666667, 0.9213437499999999], "label": "a black sandwich"}, {"bbox": [0.0, 0.7168593750000001, 0.99775, 0.9887656250000001], "label": "a blue dining table"}, {"bbox": [0.5372083333333334, 0.006875000000000001, 1.0, 0.41070312499999995], "label": "a yellow knife"}, {"bbox": [0.0034583333333333332, 0.018187500000000002, 0.24241666666666667, 0.322078125], "label": "a green fork"}, {"bbox": [0.7962708333333333, 0.0, 1.0, 0.211234375], "label": "a black cup"}], "image_id": "108189"}, "768": {"caption": "a photo of a black dining table and a brown cup and a black cup and a green spoon and a red chair ", "segment": [{"bbox": [0.0, 0.17566666666666667, 1.0, 0.9887291666666667], "label": "a black dining table"}, {"bbox": [0.092, 0.41325, 0.331640625, 0.6949791666666667], "label": "a brown cup"}, {"bbox": [0.43823437500000006, 0.5462708333333333, 0.738703125, 0.9496458333333333], "label": "a black cup"}, {"bbox": [0.12809375, 0.5303333333333333, 0.37753125, 0.7730416666666666], "label": "a green spoon"}, {"bbox": [0.751109375, 0.0015, 1.0, 0.37860416666666663], "label": "a red chair"}], "image_id": "434179"}, "769": {"caption": "a photo of a red spoon and a black carrot and a red bowl and a yellow oven and a blue carrot ", "segment": [{"bbox": [0.305859375, 0.2594847775175644, 0.99703125, 0.6212880562060891], "label": "a red spoon"}, {"bbox": [0.31175, 0.5824355971896955, 0.58575, 0.7278688524590164], "label": "a black carrot"}, {"bbox": [0.0015, 0.0005620608899297424, 0.9160781250000001, 0.9915690866510539], "label": "a red bowl"}, {"bbox": [0.0034687500000000005, 0.0025995316159250588, 1.0, 0.9870023419203747], "label": "a yellow oven"}, {"bbox": [0.0421875, 0.351288056206089, 0.7953125, 0.9742388758782201], "label": "a blue carrot"}], "image_id": "415768"}, "770": {"caption": "a photo of a green cell phone and a white dining table and a green fork and a blue pizza and a brown cup ", "segment": [{"bbox": [0.054921874999999995, 0.5808541666666667, 0.203375, 0.9336249999999999], "label": "a green cell phone"}, {"bbox": [0.0016875000000000002, 0.0045000000000000005, 1.0, 0.9865208333333334], "label": "a white dining table"}, {"bbox": [0.364859375, 0.6745416666666666, 0.625, 0.9876041666666666], "label": "a green fork"}, {"bbox": [0.161796875, 0.2471875, 0.9623593749999999, 0.6966249999999999], "label": "a blue pizza"}, {"bbox": [0.137890625, 0.0, 0.32454687499999996, 0.23452083333333332], "label": "a brown cup"}], "image_id": "181627"}, "771": {"caption": "a photo of a blue bench and a green suitcase and a white suitcase and a white suitcase and a brown suitcase ", "segment": [{"bbox": [0.0, 0.42247916666666663, 0.1955, 0.7460625000000001], "label": "a blue bench"}, {"bbox": [0.1836875, 0.5773958333333333, 0.45328125, 0.7745208333333333], "label": "a green suitcase"}, {"bbox": [0.5874843750000001, 0.4496041666666667, 0.8054218750000001, 0.8261249999999999], "label": "a white suitcase"}, {"bbox": [0.706140625, 0.4295, 0.856109375, 0.8094374999999999], "label": "a white suitcase"}, {"bbox": [0.410625, 0.5268541666666666, 0.6187343750000001, 0.8075416666666667], "label": "a brown suitcase"}], "image_id": "283984"}, "772": {"caption": "a photo of a brown motorcycle and a red motorcycle and a white motorcycle and a green motorcycle and a black motorcycle ", "segment": [{"bbox": [0.039734375, 0.36028125, 0.32439062500000004, 0.97259375], "label": "a brown motorcycle"}, {"bbox": [0.22196875, 0.37129687499999997, 0.59640625, 0.889234375], "label": "a red motorcycle"}, {"bbox": [0.5443125, 0.40629687499999995, 0.7399687500000001, 0.7295], "label": "a white motorcycle"}, {"bbox": [0.701875, 0.390359375, 0.855671875, 0.6714218750000001], "label": "a green motorcycle"}, {"bbox": [0.705359375, 0.39678125, 0.965671875, 0.6372656250000001], "label": "a black motorcycle"}], "image_id": "360673"}, "773": {"caption": "a photo of a brown bottle and a blue sandwich and a green sandwich and a green keyboard and a red laptop ", "segment": [{"bbox": [0.42592, 0.0010133333333333333, 0.5894400000000001, 0.41218666666666665], "label": "a brown bottle"}, {"bbox": [0.12584, 0.39170666666666665, 0.52516, 0.8771733333333334], "label": "a blue sandwich"}, {"bbox": [0.4163, 0.28314666666666666, 0.95056, 0.8921333333333333], "label": "a green sandwich"}, {"bbox": [0.75072, 0.4024533333333333, 1.0, 0.6122399999999999], "label": "a green keyboard"}, {"bbox": [0.7153400000000001, 0.0, 1.0, 0.6420266666666666], "label": "a red laptop"}], "image_id": "216677"}, "774": {"caption": "a photo of a red sandwich and a green wine glass and a red wine glass and a yellow bowl and a green fork ", "segment": [{"bbox": [0.17203125, 0.29283372365339577, 0.6597031250000001, 0.8174941451990633], "label": "a red sandwich"}, {"bbox": [0.519703125, 0.0, 0.68415625, 0.36803278688524593], "label": "a green wine glass"}, {"bbox": [0.45353125, 0.0003044496487119438, 0.584359375, 0.2728337236533958], "label": "a red wine glass"}, {"bbox": [0.6224062499999999, 0.35145199063231847, 0.897046875, 0.6825526932084309], "label": "a yellow bowl"}, {"bbox": [0.015828125000000002, 0.5666276346604215, 0.40203125, 0.7655971896955502], "label": "a green fork"}], "image_id": "533206"}, "775": {"caption": "a photo of a red cup and a brown fork and a white bowl and a green bowl and a red cake ", "segment": [{"bbox": [0.648671875, 0.3064912280701754, 0.9852343749999999, 0.8255263157894737], "label": "a red cup"}, {"bbox": [0.0, 0.6609356725146198, 0.49906249999999996, 0.9654385964912281], "label": "a brown fork"}, {"bbox": [0.24471875, 0.6919590643274854, 0.554890625, 0.8540643274853802], "label": "a white bowl"}, {"bbox": [0.26778124999999997, 0.5887719298245614, 0.53678125, 0.7707894736842106], "label": "a green bowl"}, {"bbox": [0.26778124999999997, 0.5468421052631579, 0.5375, 0.7796198830409357], "label": "a red cake"}], "image_id": "257941"}, "776": {"caption": "a photo of a white cup and a blue fork and a blue knife and a black pizza and a white dining table ", "segment": [{"bbox": [0.70956, 0.4496, 0.93034, 0.8383466666666667], "label": "a white cup"}, {"bbox": [0.62564, 0.7496266666666667, 0.80422, 1.0], "label": "a blue fork"}, {"bbox": [0.6788, 0.7999466666666667, 0.8382, 1.0], "label": "a blue knife"}, {"bbox": [0.09776, 0.6314666666666667, 0.59662, 0.9123466666666666], "label": "a black pizza"}, {"bbox": [0.0, 0.50512, 1.0, 1.0], "label": "a white dining table"}], "image_id": "282143"}, "777": {"caption": "a photo of a white banana and a black banana and a black banana and a green banana and a black sandwich ", "segment": [{"bbox": [0.26008333333333333, 0.388109375, 0.9387083333333334, 0.69978125], "label": "a white banana"}, {"bbox": [0.12883333333333333, 0.10785937500000001, 0.38052083333333336, 0.382015625], "label": "a black banana"}, {"bbox": [0.3895208333333333, 0.033703125, 0.6531874999999999, 0.337078125], "label": "a black banana"}, {"bbox": [0.3785, 0.3245, 0.6173541666666668, 0.50790625], "label": "a green banana"}, {"bbox": [0.07964583333333333, 0.036359375, 1.0, 0.859734375], "label": "a black sandwich"}], "image_id": "291528"}, "778": {"caption": "a photo of a green elephant and a yellow elephant and a red elephant and a black elephant and a green elephant ", "segment": [{"bbox": [0.363234375, 0.019672131147540985, 0.935609375, 0.9515690866510539], "label": "a green elephant"}, {"bbox": [0.323078125, 0.40428571428571425, 0.7874062500000001, 0.9898594847775175], "label": "a yellow elephant"}, {"bbox": [0.061843749999999996, 0.2797423887587822, 0.48060937499999995, 0.9612412177985948], "label": "a red elephant"}, {"bbox": [0.284234375, 0.0007494145199063232, 1.0, 0.8953629976580796], "label": "a black elephant"}, {"bbox": [0.0, 0.0, 0.255859375, 0.4887353629976581], "label": "a green elephant"}], "image_id": "529549"}, "779": {"caption": "a photo of a black bowl and a green banana and a brown cake and a green sandwich and a white bowl ", "segment": [{"bbox": [0.24879687499999997, 0.006052104208416834, 0.7393906250000001, 0.5678557114228456], "label": "a black bowl"}, {"bbox": [0.02278125, 0.5455110220440882, 0.49409374999999994, 0.8646092184368737], "label": "a green banana"}, {"bbox": [0.520375, 0.45168336673346693, 0.96540625, 0.9078557114228456], "label": "a brown cake"}, {"bbox": [0.5221250000000001, 0.46517034068136276, 0.9706718750000001, 0.9078557114228456], "label": "a green sandwich"}, {"bbox": [0.00203125, 0.3844088176352705, 0.516421875, 0.9870140280561122], "label": "a white bowl"}], "image_id": "29994"}, "780": {"caption": "a photo of a brown chair and a white dining table and a blue book and a brown chair and a brown chair ", "segment": [{"bbox": [0.5608125, 0.45158333333333334, 0.7736562499999999, 0.8479791666666666], "label": "a brown chair"}, {"bbox": [0.7701718750000001, 0.4528125, 1.0, 0.9034791666666666], "label": "a white dining table"}, {"bbox": [0.55575, 0.8096875, 0.760140625, 0.9876041666666666], "label": "a blue book"}, {"bbox": [0.169109375, 0.5950833333333333, 0.60128125, 0.9981666666666666], "label": "a brown chair"}, {"bbox": [0.285734375, 0.46602083333333333, 0.5751250000000001, 0.6954583333333333], "label": "a brown chair"}], "image_id": "277984"}, "781": {"caption": "a photo of a red fork and a brown carrot and a white carrot and a green cake and a white dining table ", "segment": [{"bbox": [0.7522065727699531, 0.6700625, 0.9222769953051643, 1.0], "label": "a red fork"}, {"bbox": [0.3736854460093897, 0.194671875, 0.9590610328638498, 0.44926562499999995], "label": "a brown carrot"}, {"bbox": [0.588075117370892, 0.056874999999999995, 0.7677464788732394, 0.21634375], "label": "a white carrot"}, {"bbox": [0.0768075117370892, 0.517390625, 0.7130281690140845, 0.9084218749999999], "label": "a green cake"}, {"bbox": [0.003896713615023474, 0.3350625, 1.0, 0.9870156250000001], "label": "a white dining table"}], "image_id": "485972"}, "782": {"caption": "a photo of a brown elephant and a red elephant and a white elephant and a black elephant and a brown elephant ", "segment": [{"bbox": [0.34890625000000003, 0.5999765807962529, 0.554875, 0.8981030444964871], "label": "a brown elephant"}, {"bbox": [0.07196875, 0.5415690866510539, 0.373328125, 0.8898829039812647], "label": "a red elephant"}, {"bbox": [0.7925625000000001, 0.49754098360655735, 0.9412499999999999, 0.8081498829039813], "label": "a white elephant"}, {"bbox": [0.7287656250000001, 0.5527634660421545, 0.866609375, 0.845175644028103], "label": "a black elephant"}, {"bbox": [0.569359375, 0.5126932084309134, 0.728859375, 0.9011709601873535], "label": "a brown elephant"}], "image_id": "469343"}, "783": {"caption": "a photo of a green stop sign and a yellow car and a yellow car and a green car and a black car ", "segment": [{"bbox": [0.046340000000000006, 0.0478134110787172, 0.35048, 0.35606413994169095], "label": "a green stop sign"}, {"bbox": [0.00924, 0.7813411078717201, 0.84324, 0.9678425655976677], "label": "a yellow car"}, {"bbox": [0.69064, 0.6610495626822158, 0.8806799999999999, 0.8727405247813411], "label": "a yellow car"}, {"bbox": [0.29396, 0.6247230320699708, 0.47848, 0.7928571428571428], "label": "a green car"}, {"bbox": [0.65, 0.577259475218659, 0.954, 0.8309037900874635], "label": "a black car"}], "image_id": "16931"}, "784": {"caption": "a photo of a yellow bus and a red bicycle and a yellow bicycle and a blue bicycle and a black bicycle ", "segment": [{"bbox": [0.187359375, 0.004489795918367347, 0.9987499999999999, 0.9348299319727891], "label": "a yellow bus"}, {"bbox": [0.529578125, 0.6000000000000001, 0.7169375, 0.9011337868480727], "label": "a red bicycle"}, {"bbox": [0.105390625, 0.6110884353741497, 0.256140625, 0.7950113378684808], "label": "a yellow bicycle"}, {"bbox": [0.359234375, 0.6089795918367347, 0.503890625, 0.8524036281179138], "label": "a blue bicycle"}, {"bbox": [0.47028125000000004, 0.636485260770975, 0.60709375, 0.8736054421768708], "label": "a black bicycle"}], "image_id": "397514"}, "785": {"caption": "a photo of a blue dining table and a green knife and a green carrot and a black carrot and a white book ", "segment": [{"bbox": [0.0, 0.0, 1.0, 1.0], "label": "a blue dining table"}, {"bbox": [0.368078125, 0.05522916666666667, 0.498171875, 0.21683333333333332], "label": "a green knife"}, {"bbox": [0.659953125, 0.39960416666666665, 0.9592031249999999, 0.5528333333333334], "label": "a green carrot"}, {"bbox": [0.459203125, 0.39389583333333333, 0.743109375, 0.6823958333333332], "label": "a black carrot"}, {"bbox": [0.0, 0.6535624999999999, 0.12640625, 0.9906458333333333], "label": "a white book"}], "image_id": "287667"}, "786": {"caption": "a photo of a white dining table and a red bench and a red bench and a brown umbrella and a brown dining table ", "segment": [{"bbox": [0.34640624999999997, 0.7442916666666667, 0.6390156250000001, 0.9729791666666666], "label": "a white dining table"}, {"bbox": [0.649859375, 0.6811666666666666, 0.894546875, 0.8731249999999999], "label": "a red bench"}, {"bbox": [0.8432031249999999, 0.6436041666666666, 0.9917187499999999, 0.7793541666666667], "label": "a red bench"}, {"bbox": [0.31703125, 0.2903541666666667, 0.79309375, 0.5442708333333334], "label": "a brown umbrella"}, {"bbox": [0.672703125, 0.6740833333333334, 0.8768437499999999, 0.8112916666666667], "label": "a brown dining table"}], "image_id": "234938"}, "787": {"caption": "a photo of a white chair and a blue umbrella and a red umbrella and a black chair and a brown umbrella ", "segment": [{"bbox": [0.0, 0.7026875, 0.27266666666666667, 0.983578125], "label": "a white chair"}, {"bbox": [0.1831875, 0.23535937499999998, 1.0, 0.9786093749999999], "label": "a blue umbrella"}, {"bbox": [0.044083333333333335, 0.0, 1.0, 0.24987499999999999], "label": "a red umbrella"}, {"bbox": [0.2601875, 0.78571875, 0.40641666666666665, 0.9967500000000001], "label": "a black chair"}, {"bbox": [0.35141666666666665, 0.5862499999999999, 1.0, 0.93240625], "label": "a brown umbrella"}], "image_id": "359546"}, "788": {"caption": "a photo of a brown potted plant and a brown tv and a yellow couch and a brown couch and a brown chair ", "segment": [{"bbox": [0.80978125, 0.3204791666666667, 1.0, 0.5239583333333333], "label": "a brown potted plant"}, {"bbox": [0.008421874999999999, 0.042854166666666665, 0.21742187499999996, 0.32599999999999996], "label": "a brown tv"}, {"bbox": [0.51934375, 0.46341666666666664, 0.9995937500000001, 0.8166875], "label": "a yellow couch"}, {"bbox": [0.5181875, 0.7324583333333333, 1.0, 1.0], "label": "a brown couch"}, {"bbox": [0.5351874999999999, 0.7502083333333334, 1.0, 0.9897083333333333], "label": "a brown chair"}], "image_id": "184830"}, "789": {"caption": "a photo of a blue cat and a yellow chair and a black microwave and a brown handbag and a brown dining table ", "segment": [{"bbox": [0.22540624999999997, 0.45156908665105383, 0.7333125, 0.9470725995316158], "label": "a blue cat"}, {"bbox": [0.7680625, 0.327751756440281, 0.9280156250000001, 0.7445901639344262], "label": "a yellow chair"}, {"bbox": [0.04109375, 0.17046838407494147, 0.43378125, 0.5642857142857143], "label": "a black microwave"}, {"bbox": [0.82346875, 0.4696018735362998, 0.9992812499999999, 0.9853629976580797], "label": "a brown handbag"}, {"bbox": [0.0015, 0.39550351288056207, 0.86659375, 0.9865105386416863], "label": "a brown dining table"}], "image_id": "506151"}, "790": {"caption": "a photo of a blue zebra and a green zebra and a yellow zebra and a blue zebra and a red zebra ", "segment": [{"bbox": [0.674953125, 0.2319375, 0.9985156250000001, 0.7641875], "label": "a blue zebra"}, {"bbox": [0.27184375, 0.25070833333333337, 0.602046875, 0.6809166666666667], "label": "a green zebra"}, {"bbox": [0.13146875, 0.34920833333333334, 0.296203125, 0.7857708333333334], "label": "a yellow zebra"}, {"bbox": [0.037078125, 0.27570833333333333, 0.32190624999999995, 0.5543750000000001], "label": "a blue zebra"}, {"bbox": [0.043921875, 0.24662499999999998, 0.44595312500000006, 0.7961666666666666], "label": "a red zebra"}], "image_id": "400836"}, "791": {"caption": "a photo of a black elephant and a white elephant and a black elephant and a yellow elephant and a brown elephant ", "segment": [{"bbox": [0.51646875, 0.15885245901639344, 0.744984375, 0.6840281030444965], "label": "a black elephant"}, {"bbox": [0.3019375, 0.21693208430913347, 0.54928125, 0.416463700234192], "label": "a white elephant"}, {"bbox": [0.186703125, 0.3572833723653396, 0.38590625, 0.6979859484777516], "label": "a black elephant"}, {"bbox": [0.37307812500000004, 0.293864168618267, 0.5270625, 0.6966276346604215], "label": "a yellow elephant"}, {"bbox": [0.126140625, 0.352903981264637, 0.30700000000000005, 0.6828571428571428], "label": "a brown elephant"}], "image_id": "70685"}, "792": {"caption": "a photo of a white sheep and a white sheep and a blue sheep and a black sheep and a red sheep ", "segment": [{"bbox": [0.3189375, 0.47894613583138174, 0.478296875, 0.7067915690866511], "label": "a white sheep"}, {"bbox": [0.49679687499999997, 0.4532552693208431, 0.6494843749999999, 0.709695550351288], "label": "a white sheep"}, {"bbox": [0.19789062500000001, 0.5168852459016393, 0.397796875, 0.7515456674473069], "label": "a blue sheep"}, {"bbox": [0.070109375, 0.500327868852459, 0.21115625, 0.7287587822014052], "label": "a black sheep"}, {"bbox": [0.0203125, 0.4309133489461358, 0.7203125, 0.7283372365339579], "label": "a red sheep"}], "image_id": "389566"}, "793": {"caption": "a photo of a red suitcase and a black backpack and a black suitcase and a blue backpack and a brown bench ", "segment": [{"bbox": [0.5284, 0.49886227544910183, 1.0, 0.9887724550898204], "label": "a red suitcase"}, {"bbox": [0.0, 0.6224850299401198, 0.2627, 0.9887724550898204], "label": "a black backpack"}, {"bbox": [0.43782, 0.04167664670658683, 0.7808399999999999, 0.31643712574850297], "label": "a black suitcase"}, {"bbox": [0.2389, 0.5326347305389222, 0.5363, 0.9385329341317367], "label": "a blue backpack"}, {"bbox": [0.5181, 0.0, 0.96994, 0.5283233532934132], "label": "a brown bench"}], "image_id": "251044"}, "794": {"caption": "a photo of a yellow sheep and a white sheep and a yellow sheep and a red sheep and a blue sheep ", "segment": [{"bbox": [0.093671875, 0.02828125, 0.9069687500000001, 0.90416015625], "label": "a yellow sheep"}, {"bbox": [0.287796875, 0.5441015625, 0.692078125, 0.94453125], "label": "a white sheep"}, {"bbox": [0.38, 0.0001953125, 0.55790625, 0.13228515624999998], "label": "a yellow sheep"}, {"bbox": [0.865375, 0.0, 1.0, 0.273125], "label": "a red sheep"}, {"bbox": [0.627421875, 0.62884765625, 0.7658437499999999, 0.79513671875], "label": "a blue sheep"}], "image_id": "178435"}, "795": {"caption": "a photo of a red bed and a red chair and a green chair and a blue dining table and a red chair ", "segment": [{"bbox": [0.606734375, 0.08089583333333333, 0.9977499999999999, 1.0], "label": "a red bed"}, {"bbox": [0.1291875, 0.6556875000000001, 0.305375, 0.928625], "label": "a red chair"}, {"bbox": [0.31109375, 0.44618749999999996, 0.494390625, 0.8318333333333333], "label": "a green chair"}, {"bbox": [0.137859375, 0.5543333333333333, 0.34840625000000003, 0.7734375], "label": "a blue dining table"}, {"bbox": [0.658, 0.4801458333333333, 0.9072968750000001, 0.7311458333333333], "label": "a red chair"}], "image_id": "11987"}, "796": {"caption": "a photo of a brown spoon and a yellow cake and a black cake and a brown cake and a yellow dining table ", "segment": [{"bbox": [0.0, 0.47464052287581704, 0.331484375, 0.6777342047930284], "label": "a brown spoon"}, {"bbox": [0.68915625, 0.541677559912854, 0.821703125, 0.7484531590413943], "label": "a yellow cake"}, {"bbox": [0.53965625, 0.49459694989106756, 0.672765625, 0.6959477124183007], "label": "a black cake"}, {"bbox": [0.511, 0.3189542483660131, 0.966015625, 0.6843355119825708], "label": "a brown cake"}, {"bbox": [0.0032187500000000003, 0.0044880174291938996, 1.0, 0.9865141612200435], "label": "a yellow dining table"}], "image_id": "242060"}, "797": {"caption": "a photo of a green donut and a white donut and a white donut and a red donut and a brown dining table ", "segment": [{"bbox": [0.049203125, 0.3820222634508349, 0.49584375, 0.9640445269016698], "label": "a green donut"}, {"bbox": [0.0874375, 0.02025974025974026, 0.5299531249999999, 0.5058627087198516], "label": "a white donut"}, {"bbox": [0.485828125, 0.04087198515769944, 0.9030625000000001, 0.4955102040816327], "label": "a white donut"}, {"bbox": [0.48496875, 0.407847866419295, 0.902203125, 0.9440445269016698], "label": "a red donut"}, {"bbox": [0.00378125, 0.004489795918367347, 0.9992656249999999, 0.9887569573283858], "label": "a brown dining table"}], "image_id": "162827"}, "798": {"caption": "a photo of a yellow laptop and a green keyboard and a white book and a yellow chair and a white tv ", "segment": [{"bbox": [0.63852, 0.30405333333333334, 0.88514, 0.6148533333333334], "label": "a yellow laptop"}, {"bbox": [0.17696, 0.54832, 0.55786, 0.7595466666666666], "label": "a green keyboard"}, {"bbox": [0.0, 0.2811466666666667, 0.13448, 0.4095466666666667], "label": "a white book"}, {"bbox": [0.79274, 0.16352, 1.0, 0.5780266666666667], "label": "a yellow chair"}, {"bbox": [0.16992, 0.3041066666666667, 0.41816, 0.5791999999999999], "label": "a white tv"}], "image_id": "253263"}, "799": {"caption": "a photo of a brown dining table and a yellow cup and a green orange and a black wine glass and a green cup ", "segment": [{"bbox": [0.02678, 0.7820241691842901, 0.9982, 0.9865256797583082], "label": "a brown dining table"}, {"bbox": [0.37495999999999996, 0.6005740181268882, 0.57902, 0.8688821752265862], "label": "a yellow cup"}, {"bbox": [0.30360000000000004, 0.05513595166163142, 0.5931600000000001, 0.30634441087613296], "label": "a green orange"}, {"bbox": [0.30524, 0.2971299093655589, 0.6058600000000001, 0.6141389728096677], "label": "a black wine glass"}, {"bbox": [0.1373, 0.5548036253776435, 0.322, 0.8362839879154078], "label": "a green cup"}], "image_id": "484080"}}