{
  "image_path": "./ref_datasets/hico_det/images/train/train_00028524.jpg",
  "image_id": "train_00028524",
  "width": 427,
  "height": 640,
  "split": "train",
  "source": "zhimeng/hico_det",
  "dataset_index": 28524,
  "annotations": {
    "objects": "[{'id': 559, 'bbox_human': [46, 424, 53, 635], 'bbox_object': [212, 267, 245, 271], 'connection': 1, 'invis': 0}, {'id': 560, 'bbox_human': [38, 423, 52, 640], 'bbox_object': [210, 274, 244, 274], 'connection': 1, 'invis': 0}]",
    "positive_captions": "[('toothbrush', 'brush_with'), ('toothbrush', 'hold')]",
    "negative_captions": "[('toothbrush', 'wash'), ('toothbrush', 'no_interaction')]",
    "ambiguous_captions": "[]",
    "positive_objects": "[558, 559]",
    "negative_objects": "[560, 561]",
    "ambiguous_objects": "[]",
    "size": "[427, 640, 3]"
  },
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "teenager",
        "gender": "male",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a casual outfit, consisting of a dark zip-up hoodie over a lighter-colored shirt.",
        "clothing": {
          "vague": false,
          "clothing": [
            {
              "possible_names": [
                "jacket",
                "hoodie",
                "sweatshirt"
              ],
              "name": "hoodie",
              "type": "top",
              "color": [
                "gray"
              ],
              "belonging_confident": true,
              "existence_confident": true
            }
          ]
        },
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "toothbrush"
            ],
            "name": "toothbrush",
            "position": "hand"
          }
        ],
        "description": "The person is in the foreground and appears to be an adult. The gender is unknown, and their emotion is neutral. They are wearing a dark zip-up hoodie over a lighter-colored shirt. In their hand, they are holding a toothbrush, which they are using. The setting appears to be a bathroom.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to be engaged in a routine activity, such as brushing teeth, without displaying strong emotions.",
        "meaningful": true,
        "story": "A teenager is captured in a candid moment while brushing their teeth, possibly in a bathroom setting. The casual attire suggests a relaxed environment at home.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is brushing their teeth, holding the toothbrush with their right hand while standing in front of a mirror in what appears to be a bathroom setting. Their posture suggests a casual and routine activity, possibly part of their daily hygiene regimen. The individual's expression seems focused on the task at hand, indicating an intent to clean their teeth effectively. The surrounding environment includes typical bathroom items like a toothpaste tube and flowers, which contribute to a sense of normalcy and personal care. The person's attire, consisting of a hoodie and pajama pants, implies they might be in a relaxed state, perhaps preparing for bed or starting their day.",
        "intention": "The individual is maintaining personal hygiene as part of a routine to ensure oral cleanliness and prepare for the day or bedtime",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.3340166123984609,
            0.2149805523455143
          ],
          [
            0.3338540252453908,
            0.25382510796189306
          ],
          [
            0.33440119085921294,
            0.29553492963314054
          ],
          [
            0.34460563773732394,
            0.3395844608545303
          ],
          [
            0.36312697930015336,
            0.37374688535928724
          ],
          [
            0.390347029940266,
            0.4050342909991741
          ],
          [
            0.42625087701026,
            0.4321026675403118
          ],
          [
            0.4631545041946712,
            0.4515724316239357
          ],
          [
            0.5052439362438836,
            0.4591039218008518
          ],
          [
            0.5348904524490801,
            0.4458115980029106
          ],
          [
            0.5568629429467189,
            0.4242249526083469
          ],
          [
            0.5739655582431807,
            0.40007065832614896
          ],
          [
            0.5854259044599995,
            0.37247847244143484
          ],
          [
            0.5943987757994523,
            0.3409175187349319
          ],
          [
            0.5998729096084344,
            0.3112039532512426
          ],
          [
            0.6077411660545046,
            0.2799220889806747
          ],
          [
            0.6166867830155884,
            0.24978640154004098
          ],
          [
            0.4353000632733076,
            0.24561179466545582
          ],
          [
            0.4589298357729052,
            0.24037342742085457
          ],
          [
            0.4802754888888704,
            0.24212585613131524
          ],
          [
            0.5022630985064744,
            0.2422762554138899
          ],
          [
            0.5258147977354855,
            0.2422769855707884
          ],
          [
            0.5737413423601382,
            0.24016859233379365
          ],
          [
            0.584929064868405,
            0.2387857533991337
          ],
          [
            0.6024998000889328,
            0.23603776879608632
          ],
          [
            0.6127536272117229,
            0.2314507406204939
          ],
          [
            0.6229982363336181,
            0.23648023083806038
          ],
          [
            0.5461120897409867,
            0.2753768231719732
          ],
          [
            0.5491710007489825,
            0.2972154378890991
          ],
          [
            0.5541214668539385,
            0.31984216570854185
          ],
          [
            0.554138757266022,
            0.3440684586763382
          ],
          [
            0.5066210283169024,
            0.35132272392511366
          ],
          [
            0.5234212345724403,
            0.35340135022997854
          ],
          [
            0.537248715464189,
            0.3575932592153549
          ],
          [
            0.5514395614259017,
            0.3539020292460918
          ],
          [
            0.5634834657109434,
            0.3500648200511932
          ],
          [
            0.45329939557302357,
            0.27080454155802725
          ],
          [
            0.4676968872686739,
            0.2722831483930349
          ],
          [
            0.48982098191109097,
            0.2705542281270027
          ],
          [
            0.5000166503750548,
            0.2717956382781267
          ],
          [
            0.48843892117574006,
            0.2767947096377611
          ],
          [
            0.46498132015239757,
            0.2767754778265953
          ],
          [
            0.5698581662374262,
            0.26988663002848623
          ],
          [
            0.5816576869322648,
            0.26866708546876905
          ],
          [
            0.5982895980674154,
            0.2669254656881094
          ],
          [
            0.6033333631294074,
            0.268957844376564
          ],
          [
            0.596652870076123,
            0.2748003643006086
          ],
          [
            0.5801855508760291,
            0.27568912170827387
          ],
          [
            0.47210049413845023,
            0.3964649349451065
          ],
          [
            0.49486197624449024,
            0.3869041822850704
          ],
          [
            0.5279659754299089,
            0.38205995634198187
          ],
          [
            0.5362884715154602,
            0.3840687483549118
          ],
          [
            0.5443348005568555,
            0.38099384903907774
          ],
          [
            0.5573599157464189,
            0.3874120324850082
          ],
          [
            0.5608634221270635,
            0.39673165082931516
          ],
          [
            0.554500523838721,
            0.40646537244319914
          ],
          [
            0.5399556373744235,
            0.415272681415081
          ],
          [
            0.5269372625149944,
            0.41855611875653265
          ],
          [
            0.5050209591962215,
            0.41723242253065107
          ],
          [
            0.4853080777908177,
            0.41116700917482374
          ],
          [
            0.4771476560071305,
            0.39829705506563184
          ],
          [
            0.5066776817241374,
            0.3936273105442524
          ],
          [
            0.5323011532959311,
            0.3954866290092468
          ],
          [
            0.5446185604630206,
            0.3936260066926479
          ],
          [
            0.5586350370147388,
            0.3968247979879379
          ],
          [
            0.5444726443043438,
            0.39744882136583326
          ],
          [
            0.5304682364069765,
            0.40094069242477415
          ],
          [
            0.5051834464432126,
            0.39942353069782255
          ]
        ],
        "visibility": [
          0.9999760389328003,
          0.9999996423721313,
          1.0,
          0.009456666186451912,
          0.9970757961273193,
          1.0,
          2.851795215974562e-06,
          0.006404109299182892,
          0.012287307530641556,
          5.49584274267545e-06,
          1.2714843067307413e-11,
          3.277986934335786e-06,
          0.7973676919937134,
          3.019398695913028e-13,
          0.23191089928150177,
          3.866997799989273e-14,
          1.2953841332929983e-09,
          0.00041712188976816833,
          9.067998088529983e-12,
          0.9951978325843811,
          8.263539282488422e-18,
          4.530911112965441e-08,
          0.00018945420742966235,
          0.9998388290405273,
          0.001402613241225481,
          0.989535927772522,
          0.3940315246582031,
          0.9422513246536255,
          0.9963601231575012
        ],
        "headpose": {
          "pitch": -21.360007902698563,
          "yaw": -30.722313830122413,
          "roll": 8.774125040821849
        },
        "attributes": {
          "5 oClock Shadow": 0.021003922447562218,
          "Arched Eyebrows": 0.0005858754739165306,
          "Attractive": 0.0648844838142395,
          "Bags Under Eyes": 0.03484981507062912,
          "Bald": 5.8219988829932845e-09,
          "Bangs": 0.9765679240226746,
          "Big Lips": 0.05739232897758484,
          "Big Nose": 0.08972272276878357,
          "Black Hair": 8.390005677938461e-05,
          "Blond Hair": 0.3611803948879242,
          "Blurry": 0.07540389150381088,
          "Brown Hair": 0.04024065285921097,
          "Bushy Eyebrows": 0.001370067591778934,
          "Chubby": 0.0008079935214482248,
          "Double Chin": 5.5953390983631834e-05,
          "Eyeglasses": 0.0024074085522443056,
          "Goatee": 0.015830401331186295,
          "Gray Hair": 0.003865343751385808,
          "Heavy Makeup": 0.0020784942898899317,
          "High Cheekbones": 0.0010458874749019742,
          "Male": 0.983616054058075,
          "Mouth Slightly Open": 0.009786874987185001,
          "Mustache": 0.007762922905385494,
          "Narrow Eyes": 0.2242375910282135,
          "No Beard": 0.7652646899223328,
          "Oval Face": 0.014374935999512672,
          "Pale Skin": 0.034130532294511795,
          "Pointy Nose": 0.1020946130156517,
          "Receding Hairline": 4.917366368317744e-06,
          "Rosy Cheeks": 3.449867290328257e-05,
          "Sideburns": 0.00455661304295063,
          "Smiling": 0.0004824915376957506,
          "Straight Hair": 0.046155139803886414,
          "Wavy Hair": 0.19695116579532623,
          "Wearing Earrings": 0.003557224990800023,
          "Wearing Hat": 0.0006849901401437819,
          "Wearing Lipstick": 0.00456995191052556,
          "Wearing Necklace": 0.013827734626829624,
          "Wearing Necktie": 0.0013017978053539991,
          "Young": 0.8123060464859009
        },
        "age": [
          0.09797703474760056,
          0.960176408290863,
          0.9665083289146423,
          0.022539867088198662,
          0.024405548349022865,
          0.0009861858561635017,
          6.610104173887521e-05,
          1.3101806871418376e-05
        ],
        "race": [
          0.9990671277046204,
          0.004855486564338207,
          0.4041805863380432,
          0.017898567020893097,
          0.032515283674001694
        ],
        "gender": [
          0.9398343563079834,
          0.07786577939987183
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 1.0534351797052094e-07,
          "disgust": 4.037323773703987e-21,
          "fear": 3.441428902695506e-07,
          "happy": 99.99980330466052,
          "sad": 2.0650746233784042e-09,
          "surprise": 0.00011666232480418523,
          "neutral": 7.99389672364488e-05
        },
        "dominant_emotion": "happy",
        "region": {
          "x": 0,
          "y": 0,
          "w": 166,
          "h": 244,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 32,
        "gender": {
          "Woman": 73.32738041877747,
          "Man": 26.672622561454773
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 6.230959668755531,
          "indian": 2.973330207169056,
          "black": 1.732029765844345,
          "white": 68.60936880111694,
          "middle eastern": 8.159297704696655,
          "latino hispanic": 12.295018136501312
        },
        "dominant_race": "white"
      },
      "hoi": [
        {
          "relationship": {
            "action": [
              [
                "mouth",
                "brush with"
              ],
              [
                "mouth",
                "hold"
              ]
            ],
            "negative_action": [
              "wash",
              "no interaction"
            ],
            "position": "mouth"
          },
          "object": 0
        }
      ]
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.10950600355863571,
        0.08668670803308487,
        0.9862539172172546,
        0.9986920356750488
      ]
    ],
    "face_boxes": [
      [
        0.35492828488349915,
        0.17999067902565002,
        0.6154617667198181,
        0.4352945387363434
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.4721351521355765,
            0.4730598908849061
          ],
          [
            0.21579078461023907,
            0.5150801330804825
          ],
          [
            0.3594320250339195,
            0.823228575848043
          ],
          [
            0.7262696544236266,
            0.7804711364209652
          ],
          [
            0.728479519660914,
            0.43103964868932965
          ],
          [
            0.8367629162879962,
            0.7716247696429491
          ],
          [
            0.7660472286947997,
            0.5371960500255227
          ],
          [
            0.38816027311865564,
            0.9603472609072924
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.7196400587117644,
            0.9500264996662736
          ],
          [
            1.1792920280675419,
            1.1033635238185524
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.4787647478474387,
            0.2894977802410722
          ],
          [
            0.5870481444745209,
            0.28507459685206415
          ],
          [
            0.33070377694918346,
            0.2953953580930829
          ],
          [
            0.6246158535084065,
            0.28507459685206415
          ]
        ],
        "dw_hand_1": [
          [
            0.7306893848982013,
            0.5283496832475066
          ],
          [
            0.6975414063388905,
            0.4929642161354423
          ],
          [
            0.6577638320677174,
            0.4575787490233779
          ],
          [
            0.6312454492202687,
            0.433988437615335
          ],
          [
            0.6069369316101074,
            0.4177700985223055
          ],
          [
            0.7152203282371896,
            0.40597494281828406
          ],
          [
            0.6621835625422923,
            0.401551759429276
          ],
          [
            0.6334553144575561,
            0.42366767637431624
          ],
          [
            0.6246158535084065,
            0.4443091988563538
          ],
          [
            0.728479519660914,
            0.41482130959630015
          ],
          [
            0.6621835625422923,
            0.41629570405930283
          ],
          [
            0.6511342363558552,
            0.44725798778235915
          ],
          [
            0.6621835625422923,
            0.4649507213383913
          ],
          [
            0.7395288458473509,
            0.42956525422632696
          ],
          [
            0.677652619203304,
            0.433988437615335
          ],
          [
            0.6754427539660166,
            0.46347632687538864
          ],
          [
            0.6909118106270283,
            0.47822027150541546
          ],
          [
            0.7505781720337878,
            0.44725798778235915
          ],
          [
            0.6997512715761779,
            0.4531555656343699
          ],
          [
            0.6975414063388905,
            0.47084829919040205
          ],
          [
            0.7152203282371896,
            0.4826434548944235
          ]
        ],
        "dw_hand_2": [
          [
            0.7483683067965005,
            0.7760479530319572
          ],
          [
            0.7682570939320871,
            0.7421368803828955
          ],
          [
            0.7815162853558114,
            0.7038026243448258
          ],
          [
            0.8014050724913979,
            0.6905330741778016
          ],
          [
            0.819083994389697,
            0.6949562575668097
          ],
          [
            0.8168741291524096,
            0.7067514132708311
          ],
          [
            0.8279234553388466,
            0.7067514132708311
          ],
          [
            0.8367629162879962,
            0.6964306520298124
          ],
          [
            0.8610714338981574,
            0.6875842852517963
          ],
          [
            0.8212938596269844,
            0.7332905136048794
          ],
          [
            0.8411826467625709,
            0.7318161191418767
          ],
          [
            0.85886156866087,
            0.7273929357528687
          ],
          [
            0.8654911643727322,
            0.725918541289866
          ],
          [
            0.830133320576134,
            0.7554064305499196
          ],
          [
            0.8566517034235827,
            0.7598296139389277
          ],
          [
            0.8610714338981574,
            0.7554064305499196
          ],
          [
            0.8632812991354448,
            0.7480344582349062
          ],
          [
            0.8389727815252835,
            0.7760479530319572
          ],
          [
            0.8566517034235827,
            0.7716247696429491
          ],
          [
            0.8433925119998583,
            0.7672015862539411
          ],
          [
            0.8279234553388466,
            0.7657271917909384
          ]
        ],
        "dw_face": [
          [
            0.3483826988474826,
            0.2806514134630561
          ],
          [
            0.35280242932205735,
            0.304241724871099
          ],
          [
            0.35722215979663213,
            0.3278320362791419
          ],
          [
            0.3638517555084943,
            0.35142234768718483
          ],
          [
            0.3771109469322187,
            0.3720638701692224
          ],
          [
            0.3969997340678052,
            0.39123099818825724
          ],
          [
            0.42351811691525393,
            0.4089237317442894
          ],
          [
            0.4544562302372774,
            0.42219328191131356
          ],
          [
            0.48981407403387567,
            0.43103964868932965
          ],
          [
            0.5273817830677613,
            0.42956525422632696
          ],
          [
            0.55390016591521,
            0.41482130959630015
          ],
          [
            0.5715790878135092,
            0.3927053926512599
          ],
          [
            0.5848382792372335,
            0.37353826463222506
          ],
          [
            0.5980974706609579,
            0.35142234768718483
          ],
          [
            0.6091467968473948,
            0.3278320362791419
          ],
          [
            0.6113566620846822,
            0.304241724871099
          ],
          [
            0.6135665273219696,
            0.27917701900005343
          ],
          [
            0.4301477126271161,
            0.2732794411480427
          ],
          [
            0.45224636499999,
            0.267381863296032
          ],
          [
            0.4743450173728639,
            0.2659074688330293
          ],
          [
            0.49644366974573784,
            0.267381863296032
          ],
          [
            0.5185423221186117,
            0.26885625775903466
          ],
          [
            0.5671593573389344,
            0.26885625775903466
          ],
          [
            0.5804185487626587,
            0.2659074688330293
          ],
          [
            0.5914678749490957,
            0.26295867990702393
          ],
          [
            0.60472706637282,
            0.26148428544402125
          ],
          [
            0.615776392559257,
            0.2644330743700266
          ],
          [
            0.5450607049660604,
            0.2880233857780695
          ],
          [
            0.5516903006779226,
            0.3057161193341017
          ],
          [
            0.5561100311524975,
            0.3219344584271312
          ],
          [
            0.5627396268643596,
            0.3381527975201607
          ],
          [
            0.5163324568813243,
            0.3528967421501875
          ],
          [
            0.5340113787796235,
            0.3543711366131902
          ],
          [
            0.5494804354406352,
            0.3543711366131902
          ],
          [
            0.5627396268643596,
            0.3543711366131902
          ],
          [
            0.5737889530507966,
            0.34994795322418215
          ],
          [
            0.4478266345254152,
            0.2909721747040749
          ],
          [
            0.4677154216610017,
            0.28507459685206415
          ],
          [
            0.4876042087965883,
            0.28507459685206415
          ],
          [
            0.5052831306948874,
            0.29244656916707756
          ],
          [
            0.4876042087965883,
            0.2953953580930829
          ],
          [
            0.4677154216610017,
            0.2953953580930829
          ],
          [
            0.564949492101647,
            0.2894977802410722
          ],
          [
            0.575998818288084,
            0.2821258079260588
          ],
          [
            0.5914678749490957,
            0.2806514134630561
          ],
          [
            0.60472706637282,
            0.28507459685206415
          ],
          [
            0.5936777401863831,
            0.2909721747040749
          ],
          [
            0.5782086835253714,
            0.29244656916707756
          ],
          [
            0.4853943435593009,
            0.3868078147992492
          ],
          [
            0.5119127264067496,
            0.38091023694723847
          ],
          [
            0.5384311092541982,
            0.3764870535582304
          ],
          [
            0.5494804354406352,
            0.3764870535582304
          ],
          [
            0.5583198963897849,
            0.37501265909522774
          ],
          [
            0.564949492101647,
            0.3779614480212331
          ],
          [
            0.5693692225762218,
            0.38238463141024115
          ],
          [
            0.5627396268643596,
            0.39123099818825724
          ],
          [
            0.55390016591521,
            0.39712857604026797
          ],
          [
            0.5406409744914856,
            0.401551759429276
          ],
          [
            0.5207521873558991,
            0.401551759429276
          ],
          [
            0.5008634002203126,
            0.3941797871142626
          ],
          [
            0.49202393927116306,
            0.3868078147992492
          ],
          [
            0.5185423221186117,
            0.3853334203362465
          ],
          [
            0.5450607049660604,
            0.38385902587324383
          ],
          [
            0.5561100311524975,
            0.38385902587324383
          ],
          [
            0.564949492101647,
            0.38385902587324383
          ],
          [
            0.55390016591521,
            0.3868078147992492
          ],
          [
            0.5406409744914856,
            0.38975660372525456
          ],
          [
            0.5163324568813243,
            0.38975660372525456
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "objects": [
    {
      "name": "toothbrush",
      "possible_names": [
        "toothbrush"
      ],
      "box": [
        0.4964871194379391,
        0.3828125,
        0.6252927400468384,
        0.4234375
      ]
    },
    {
      "name": "toothbrush",
      "possible_names": [
        "toothbrush"
      ],
      "box": [
        0.4918032786885246,
        0.38125,
        0.6416861826697893,
        0.428125
      ]
    }
  ],
  "scene": "A sepia-toned photograph captures a moment in a bathroom with tiled walls a mirror and various toiletries visible on the counter creating an intimate everyday setting",
  "overall_past": "Before the current scene, the individual likely entered the bathroom after completing a nighttime routine or waking up, possibly having just finished a meal or snack that prompted the need to brush their teeth. They may have removed their outer clothing, changed into their pajamas, and settled into a relaxed state, perhaps reading or watching something before bed—or preparing for the day ahead. The presence of flowers on the counter suggests a deliberate effort to create a calming, personal atmosphere, indicating that the individual took a moment to care for their environment as part of their self-care ritual. The toothpaste tube’s position and the open cap imply recent use, meaning they had just applied toothpaste and were in the middle of brushing, likely after a brief pause or transition from another activity.",
  "overall_past_clean": "The individual completed a quiet, intentional sequence of actions, transitioning from a moment of stillness into a deliberate act of personal care, having paused to cultivate a serene space before moving into the next phase of their routine.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to rinse their mouth, spit into the sink, and then set down the toothbrush, possibly turning off the faucet with a slight flick of the wrist. They may glance briefly at their reflection in the mirror, adjusting their hoodie or brushing a stray hair from their face, before reaching for the toothpaste tube to squeeze out a fresh amount for the next brush. The presence of flowers on the counter suggests a touch of care in the space, hinting that this routine might be part of a calming evening ritual, possibly leading to the person stepping away from the sink to head to bed, closing the bathroom door behind them with a soft click.",
  "overall_future_clean": "The individual turns off the faucet with a practiced flick, glances at their reflection, adjusts their posture slightly, then applies a fresh bead of toothpaste, before stepping back from the sink and moving toward the bedroom, the bathroom door closing behind them with a quiet, deliberate click.",
  "future_scene_ok": false
}