{
  "image_path": "./ref_datasets/hico_det/images/train/train_00026364.jpg",
  "image_id": "train_00026364",
  "width": 480,
  "height": 640,
  "split": "train",
  "source": "zhimeng/hico_det",
  "dataset_index": 26364,
  "annotations": {
    "objects": "[{'id': 559, 'bbox_human': [7, 472, 3, 638], 'bbox_object': [141, 267, 191, 486], 'connection': 1, 'invis': 0}, {'id': 560, 'bbox_human': [1, 466, 2, 638], 'bbox_object': [148, 263, 208, 474], 'connection': 1, 'invis': 0}]",
    "positive_captions": "[('toothbrush', 'brush_with'), ('toothbrush', 'hold')]",
    "negative_captions": "[('toothbrush', 'wash'), ('toothbrush', 'no_interaction')]",
    "ambiguous_captions": "[]",
    "positive_objects": "[558, 559]",
    "negative_objects": "[560, 561]",
    "ambiguous_objects": "[]",
    "size": "[480, 640, 3]"
  },
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "baby",
        "gender": "unknown",
        "emotion": "neutral",
        "clothing_description": "The child is wearing blue denim overalls and an orange and white patterned shirt with short sleeves.",
        "clothing": {
          "vague": false,
          "clothing": [
            {
              "possible_names": [
                "shirt",
                "t-shirt",
                "tee"
              ],
              "name": "shirt",
              "type": "top",
              "color": [
                "white",
                "orange"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "overalls",
                "jumpsuit",
                "dungarees"
              ],
              "name": "overalls",
              "type": "whole body",
              "color": [
                "blue"
              ],
              "belonging_confident": true,
              "existence_confident": true
            }
          ]
        },
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "toothbrush"
            ],
            "name": "toothbrush",
            "position": "hand"
          }
        ],
        "description": "The child, who appears to be in the foreground, is exhibiting an expression of surprise. The child is wearing blue denim overalls and an orange and white patterned short-sleeved shirt. The child is holding a toothbrush in their hand and seems to be interacting with it. The overall mood seems curious or surprised.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The baby appears to be engaged in an activity (brushing teeth) without showing strong emotions, suggesting a neutral state.",
        "meaningful": true,
        "story": "A baby is learning to brush their teeth, possibly as part of a daily routine. The child seems curious and focused on the task, indicating a moment of early childhood development and care.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The baby is holding a toothbrush in its mouth while sitting on a green couch. The child appears to be exploring the toothbrush, possibly out of curiosity or as part of learning about oral hygiene. Its wide-eyed expression suggests surprise or fascination with the object, indicating a playful and inquisitive nature. The baby's grip on the toothbrush shows an attempt to control it, which could be a sign of developing motor skills. The overall scene conveys a moment of innocent exploration and learning.",
        "intention": "The individual is exploring the toothbrush with curiosity to understand its properties and function while developing fine motor control",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.3703228377870151,
            0.21187122432248934
          ],
          [
            0.36896926632949284,
            0.24772698618471622
          ],
          [
            0.3657991535606839,
            0.28955381203974995
          ],
          [
            0.36477203887133375,
            0.3284569223012243
          ],
          [
            0.3675405422846476,
            0.36315651716930525
          ],
          [
            0.3882416430683363,
            0.3956890994949
          ],
          [
            0.4167118914070584,
            0.41778139770030975
          ],
          [
            0.44775621209825794,
            0.43783534158553394
          ],
          [
            0.4873347783372516,
            0.4576246387192181
          ],
          [
            0.532981973744574,
            0.46027847432664465
          ],
          [
            0.5835401427178155,
            0.45220134513718746
          ],
          [
            0.6407591428075518,
            0.4465761280485562
          ],
          [
            0.6876864288534438,
            0.4371940530836582
          ],
          [
            0.7255514545100077,
            0.4031517298093864
          ],
          [
            0.7577743938991001,
            0.36934034898877144
          ],
          [
            0.7854739240237644,
            0.33221612285290447
          ],
          [
            0.813781185944875,
            0.28682261146605015
          ],
          [
            0.39098469600791025,
            0.18092444432633265
          ],
          [
            0.41169416663192565,
            0.14463122561573982
          ],
          [
            0.4452694566476913,
            0.14125020655670337
          ],
          [
            0.48661981139864247,
            0.14110380823590926
          ],
          [
            0.5221286995070321,
            0.1552528403699398
          ],
          [
            0.6081731217248099,
            0.16443404981068202
          ],
          [
            0.6559365119252886,
            0.1652840253497873
          ],
          [
            0.7016334644385746,
            0.17662671181772435
          ],
          [
            0.7405293112709408,
            0.20152066089212894
          ],
          [
            0.7649934856664568,
            0.23546634880559786
          ],
          [
            0.5443157494068146,
            0.20370620701994216
          ],
          [
            0.5366768238090334,
            0.2114666405000857
          ],
          [
            0.5315987393969581,
            0.22010795772075653
          ],
          [
            0.5266728079035168,
            0.22447202195014274
          ],
          [
            0.495906858642896,
            0.2710548189601728
          ],
          [
            0.5099903413227626,
            0.2758964678006513
          ],
          [
            0.5201753481512978,
            0.27485817138637814
          ],
          [
            0.5392264685460498,
            0.278502278562103
          ],
          [
            0.5562678593964805,
            0.2858912279563291
          ],
          [
            0.42402895759968534,
            0.20494540674345835
          ],
          [
            0.44308062791824343,
            0.18886190094053745
          ],
          [
            0.4831178526083628,
            0.19296137509601458
          ],
          [
            0.4997423792169208,
            0.21555532701313496
          ],
          [
            0.4715200475284032,
            0.21670244447886944
          ],
          [
            0.4416716351395562,
            0.21293959766626358
          ],
          [
            0.6150753253982181,
            0.2337049591754164
          ],
          [
            0.6400856841178169,
            0.2168290623064552
          ],
          [
            0.6722919938110169,
            0.22216635702976156
          ],
          [
            0.6958414029507409,
            0.24335938904966628
          ],
          [
            0.6719485333987644,
            0.24776225856372286
          ],
          [
            0.6375320139385406,
            0.24158641829022337
          ],
          [
            0.45416047076384225,
            0.3537077893103872
          ],
          [
            0.4693507740894953,
            0.3201078916234629
          ],
          [
            0.5003374627658299,
            0.3031606942947422
          ],
          [
            0.5155060990935281,
            0.30720439766134533
          ],
          [
            0.53170164113953,
            0.30920498578676153
          ],
          [
            0.5636583514156795,
            0.33186997366803034
          ],
          [
            0.5824611042227065,
            0.37239602899977137
          ],
          [
            0.5447146421387081,
            0.39281074489865986
          ],
          [
            0.5145661473274231,
            0.4009961283632687
          ],
          [
            0.4962701383091154,
            0.40294066231165615
          ],
          [
            0.4737600631657101,
            0.3977069742977619
          ],
          [
            0.46351744631926217,
            0.3817024960049561
          ],
          [
            0.464958488657361,
            0.3515812823815005
          ],
          [
            0.48978336907568426,
            0.3147611506283283
          ],
          [
            0.5119705509571802,
            0.3112890411700521
          ],
          [
            0.5322406764541353,
            0.3170475640467235
          ],
          [
            0.5725606059744244,
            0.3639020925121648
          ],
          [
            0.5160351917857215,
            0.3891019496534552
          ],
          [
            0.5008747383242562,
            0.3891191796532699
          ],
          [
            0.48280501195362635,
            0.3801343393112932
          ]
        ],
        "visibility": [
          0.0001532451278762892,
          2.140660500430827e-18,
          1.6076714928203728e-06,
          1.5202720166369418e-20,
          0.07917775958776474,
          0.0005143998423591256,
          1.118857334382332e-16,
          1.1946599617649717e-20,
          7.597158173666685e-07,
          1.7295544873368614e-21,
          3.3029883082097422e-12,
          2.767950189257011e-14,
          3.107839940258428e-12,
          2.1301536889950512e-07,
          1.8302090699868658e-17,
          3.990727887037693e-12,
          3.314318519187509e-06,
          4.063609726490114e-10,
          4.812753856026249e-16,
          7.488454230042407e-07,
          3.212325137730896e-17,
          7.429696557281892e-16,
          0.9382212162017822,
          2.6279460143996403e-05,
          2.2413045641656026e-08,
          4.984732182578e-09,
          0.9073261618614197,
          0.9821605682373047,
          1.6490467942276155e-06
        ],
        "headpose": {
          "pitch": 12.860877376918829,
          "yaw": 9.539642397713124,
          "roll": 11.63916570894688
        },
        "attributes": {
          "5 oClock Shadow": 0.004178232047706842,
          "Arched Eyebrows": 0.11770672351121902,
          "Attractive": 0.026836752891540527,
          "Bags Under Eyes": 0.05052010342478752,
          "Bald": 0.0011753012659028172,
          "Bangs": 3.878033749060705e-05,
          "Big Lips": 0.15414810180664062,
          "Big Nose": 0.06591968983411789,
          "Black Hair": 0.012293089181184769,
          "Blond Hair": 0.01921129785478115,
          "Blurry": 0.0011324703227728605,
          "Brown Hair": 0.08253581076860428,
          "Bushy Eyebrows": 0.005582510959357023,
          "Chubby": 0.10909607261419296,
          "Double Chin": 0.00856748316437006,
          "Eyeglasses": 0.00035301531897857785,
          "Goatee": 0.0007112652529031038,
          "Gray Hair": 0.011541856452822685,
          "Heavy Makeup": 0.03363063558936119,
          "High Cheekbones": 0.01652618497610092,
          "Male": 0.4310484528541565,
          "Mouth Slightly Open": 0.9955881834030151,
          "Mustache": 0.00018268125131726265,
          "Narrow Eyes": 0.012459506280720234,
          "No Beard": 0.9884844422340393,
          "Oval Face": 0.20184405148029327,
          "Pale Skin": 0.08349525183439255,
          "Pointy Nose": 0.09150231629610062,
          "Receding Hairline": 0.506007969379425,
          "Rosy Cheeks": 0.002092107431963086,
          "Sideburns": 0.0014595106476917863,
          "Smiling": 0.0012954712146893144,
          "Straight Hair": 0.37326592206954956,
          "Wavy Hair": 0.007286555133759975,
          "Wearing Earrings": 0.03420911356806755,
          "Wearing Hat": 0.0002153907116735354,
          "Wearing Lipstick": 0.04457549750804901,
          "Wearing Necklace": 0.0036157676950097084,
          "Wearing Necktie": 0.0191009771078825,
          "Young": 0.9603406190872192
        },
        "age": [
          0.9999262094497681,
          0.22145165503025055,
          0.1967998743057251,
          7.41790936444886e-05,
          5.6038676120806485e-05,
          9.822250831348356e-06,
          5.046686783316545e-05,
          0.0008702479535713792
        ],
        "race": [
          0.993465006351471,
          0.006454930640757084,
          0.5732904076576233,
          0.03056877851486206,
          0.46221861243247986
        ],
        "gender": [
          0.9823262095451355,
          0.025517884641885757
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 0.11740227928385139,
          "disgust": 7.080561204020341e-05,
          "fear": 99.53010082244873,
          "happy": 0.023384232190437615,
          "sad": 0.3106917953118682,
          "surprise": 0.003576661038096063,
          "neutral": 0.014775335148442537
        },
        "dominant_emotion": "fear",
        "region": {
          "x": 0,
          "y": 0,
          "w": 309,
          "h": 354,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 13,
        "gender": {
          "Woman": 98.75778555870056,
          "Man": 1.2422087602317333
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 0.41251080110669136,
          "indian": 0.06492043612524867,
          "black": 0.005794932076241821,
          "white": 91.83560013771057,
          "middle eastern": 4.244169965386391,
          "latino hispanic": 3.437003493309021
        },
        "dominant_race": "white"
      },
      "hoi": [
        {
          "relationship": {
            "action": [
              [
                "mouth",
                "brush with"
              ],
              [
                "mouth",
                "hold"
              ]
            ],
            "negative_action": [
              "wash",
              "no interaction"
            ],
            "position": "mouth"
          },
          "object": 0
        }
      ]
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.00943145714700222,
        0.002501869108527899,
        0.9734769463539124,
        0.9979759454727173
      ]
    ],
    "face_boxes": [
      [
        0.3619351089000702,
        0.05303001403808594,
        0.7929916977882385,
        0.45459604263305664
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.5865402890576256,
            0.4555323398051163
          ],
          [
            0.3391873317460219,
            0.4385940394674739
          ],
          [
            0.12624869892994564,
            0.5708740992471576
          ],
          [
            0.15851212814450263,
            0.5079604122787714
          ],
          [
            0.8338932463692292,
            0.47247064014275875
          ],
          [
            0.8532513038979634,
            0.7563888172308605
          ],
          [
            0.5499750692811278,
            0.6418536435191828
          ],
          [
            0.3047730072504945,
            0.945129878136019
          ],
          [
            0.0810798980295658,
            0.933837677910924
          ],
          [
            0.2682077874739965,
            0.9435167066752911
          ],
          [
            0.6553689380486806,
            0.9677142785862088
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.45963746748036793,
            0.20791052058339118
          ],
          [
            0.65321804276771,
            0.22888174957285318
          ],
          [
            0.37145076096057894,
            0.2579188358659545
          ],
          [
            0.79087534074982,
            0.32083252283434066
          ]
        ],
        "dw_hand_1": [
          [
            0.556427755124039,
            0.6434668149799109
          ],
          [
            0.5349188023143346,
            0.5950716711580754
          ],
          [
            0.5155607447856004,
            0.5418370129540563
          ],
          [
            0.4510338863564861,
            0.52409212688605
          ],
          [
            0.3563944939937857,
            0.5224789554253221
          ],
          [
            0.46178836276133856,
            0.5144130981216829
          ],
          [
            0.40801598073707684,
            0.5031208978965879
          ],
          [
            0.3671489703986379,
            0.5176394410431385
          ],
          [
            0.3477909128699037,
            0.5353843271111447
          ],
          [
            0.42952493354678156,
            0.5369974985718727
          ],
          [
            0.3606962845557266,
            0.5386106700326007
          ],
          [
            0.3434891223079629,
            0.5595818990220625
          ],
          [
            0.35209270343184473,
            0.5708740992471576
          ],
          [
            0.40801598073707684,
            0.5708740992471576
          ],
          [
            0.3413382270269924,
            0.5773267850900691
          ],
          [
            0.33488554118408087,
            0.5934584996973473
          ],
          [
            0.3499418081508742,
            0.6015243570009868
          ],
          [
            0.40156329489416553,
            0.6160429001475375
          ],
          [
            0.3434891223079629,
            0.6176560716082651
          ],
          [
            0.33058375062214,
            0.6289482718333602
          ],
          [
            0.33058375062214,
            0.6337877862155438
          ]
        ],
        "dw_hand_2": [
          [
            0.15851212814450263,
            0.5176394410431385
          ],
          [
            0.21013361488779386,
            0.4966682120536765
          ],
          [
            0.2639059969120556,
            0.469244297221303
          ],
          [
            0.29616942612661246,
            0.46117843991766366
          ],
          [
            0.31552748365534666,
            0.46117843991766366
          ],
          [
            0.23594435825943946,
            0.4208491533994675
          ],
          [
            0.2639059969120556,
            0.4079437817136446
          ],
          [
            0.302622111969524,
            0.41600963901728394
          ],
          [
            0.3284328553411695,
            0.42568866778165104
          ],
          [
            0.21013361488779386,
            0.43375452508529033
          ],
          [
            0.23594435825943946,
            0.42246232486019525
          ],
          [
            0.27681136859787825,
            0.43375452508529033
          ],
          [
            0.302622111969524,
            0.446659896771113
          ],
          [
            0.19077555735905966,
            0.45472575407475235
          ],
          [
            0.21873719601167566,
            0.45149941115329656
          ],
          [
            0.25745331106914404,
            0.46279161137839164
          ],
          [
            0.2854149497217603,
            0.4756969830642143
          ],
          [
            0.17356839511129582,
            0.48376284036785366
          ],
          [
            0.20368092904488247,
            0.4869891832893094
          ],
          [
            0.23809525354040986,
            0.4950550405929485
          ],
          [
            0.2660568921930261,
            0.5047340693573158
          ]
        ],
        "dw_face": [
          [
            0.3736016562415493,
            0.2175895493477583
          ],
          [
            0.3628471798366971,
            0.2546924929444989
          ],
          [
            0.3563944939937857,
            0.29179543654123935
          ],
          [
            0.3563944939937857,
            0.32889838013798
          ],
          [
            0.36929986567960843,
            0.3643881522739926
          ],
          [
            0.3929597137702835,
            0.3950384100278219
          ],
          [
            0.42952493354678156,
            0.4208491533994675
          ],
          [
            0.4703919438852203,
            0.4402072109282017
          ],
          [
            0.5177116400665706,
            0.45149941115329656
          ],
          [
            0.5671822315288914,
            0.4498862396925688
          ],
          [
            0.6166528229912122,
            0.44343355384965744
          ],
          [
            0.6661234144535331,
            0.4305281821638346
          ],
          [
            0.7069904247919718,
            0.4095569531743726
          ],
          [
            0.7371029587255582,
            0.38051986688127126
          ],
          [
            0.7586119115352631,
            0.3466432662059864
          ],
          [
            0.7779699690639973,
            0.31115349406997356
          ],
          [
            0.7930262360307907,
            0.27566372193396094
          ],
          [
            0.38865792320834264,
            0.18371294867247343
          ],
          [
            0.4166195618609587,
            0.1675812340651949
          ],
          [
            0.44888299107551577,
            0.16112854822228356
          ],
          [
            0.4832973155710434,
            0.16112854822228356
          ],
          [
            0.5134098495046298,
            0.16435489114373922
          ],
          [
            0.6058983465863598,
            0.17242074844737845
          ],
          [
            0.6446144616438282,
            0.17564709136883422
          ],
          [
            0.6833305767012966,
            0.1853261201332014
          ],
          [
            0.7198957964777947,
            0.20145783474047985
          ],
          [
            0.750008330411381,
            0.22404223519066963
          ],
          [
            0.5456732787191868,
            0.21275003496557474
          ],
          [
            0.5370696975953048,
            0.2256554066513976
          ],
          [
            0.5306170117523936,
            0.23856077833722028
          ],
          [
            0.5220134306285118,
            0.2514661500230432
          ],
          [
            0.48544821085201356,
            0.2837295792376002
          ],
          [
            0.5026553730997776,
            0.2837295792376002
          ],
          [
            0.5220134306285118,
            0.28534275069832804
          ],
          [
            0.5435223834382161,
            0.2885690936197838
          ],
          [
            0.5671822315288914,
            0.29179543654123935
          ],
          [
            0.42092135242289963,
            0.21275003496557474
          ],
          [
            0.44673209579454526,
            0.19984466327975187
          ],
          [
            0.47899552500910214,
            0.20145783474047985
          ],
          [
            0.5005044778188069,
            0.21920272080848607
          ],
          [
            0.47254283916619094,
            0.2256554066513976
          ],
          [
            0.44458120051357486,
            0.22404223519066963
          ],
          [
            0.6058983465863598,
            0.23049492103358116
          ],
          [
            0.6360108805199464,
            0.2175895493477583
          ],
          [
            0.6725761002964442,
            0.22242906372994184
          ],
          [
            0.6983868436680898,
            0.24178712125867605
          ],
          [
            0.6661234144535331,
            0.2466266356408596
          ],
          [
            0.6338599852389758,
            0.24178712125867605
          ],
          [
            0.45318478163745674,
            0.3547091235096255
          ],
          [
            0.4703919438852203,
            0.32405886575579645
          ],
          [
            0.5005044778188069,
            0.31115349406997356
          ],
          [
            0.5155607447856004,
            0.31276666553070154
          ],
          [
            0.5306170117523936,
            0.31437983699142935
          ],
          [
            0.5671822315288914,
            0.3369642374416193
          ],
          [
            0.5886911843385962,
            0.37084083811690416
          ],
          [
            0.5671822315288914,
            0.39019889564563837
          ],
          [
            0.5370696975953048,
            0.40310426733146104
          ],
          [
            0.5026553730997776,
            0.404717438792189
          ],
          [
            0.47684462972813196,
            0.3950384100278219
          ],
          [
            0.45963746748036793,
            0.3772935239598155
          ],
          [
            0.46178836276133856,
            0.3547091235096255
          ],
          [
            0.4832973155710434,
            0.33051155159870776
          ],
          [
            0.5134098495046298,
            0.32405886575579645
          ],
          [
            0.5521259645620982,
            0.34019058036307487
          ],
          [
            0.5800876032147144,
            0.3692276666561762
          ],
          [
            0.5478241740001571,
            0.3853593812634548
          ],
          [
            0.5069571636617184,
            0.38697255272418263
          ],
          [
            0.47684462972813196,
            0.3756803524990877
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "objects": [
    {
      "name": "toothbrush",
      "possible_names": [
        "toothbrush"
      ],
      "box": [
        0.29375,
        0.2984375,
        0.55625,
        0.759375
      ]
    }
  ],
  "scene": "A baby is holding a toothbrush while sitting on a green couch wearing denim overalls and a patterned shirt with cars on it",
  "overall_past": "Before the current scene, the baby likely was introduced to the toothbrush by a caregiver during a routine oral hygiene activity. The caregiver probably demonstrated brushing motions or allowed the baby to hold the toothbrush, sparking the child’s curiosity. This interaction may have occurred after a meal or during a morning or evening hygiene ritual, setting the stage for the baby to independently explore the toothbrush while seated on the couch, showing early signs of imitating adult behaviors and developing fine motor control.",
  "overall_past_clean": "A caregiver guided the individual through a familiar oral care routine, demonstrating the motions and allowing hands-on interaction, which sparked interest and initiated a sequence of exploratory actions driven by observation and emerging motor skills.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the baby is likely to spit out the toothbrush, possibly with a surprised or giggly reaction, as the unfamiliar texture or taste may be overwhelming. This could be followed by the baby reaching for the toothbrush again, showing continued curiosity, or turning to look at an adult nearby for attention or guidance, indicating the beginning of a shared learning moment around brushing teeth.",
  "overall_future_clean": "The infant pauses mid-motion, eyes widening slightly as a soft gurgle escapes, then erupts into a burst of laughter, hands flailing toward the object before quickly snatching it back with renewed fascination, gaze darting to the nearby figure with a hopeful tilt of the head.",
  "future_scene_ok": true
}