{
  "image_path": "./ref_datasets/hico_det/images/train/train_00016066.jpg",
  "image_id": "train_00016066",
  "width": 640,
  "height": 466,
  "split": "train",
  "source": "zhimeng/hico_det",
  "dataset_index": 16066,
  "annotations": {
    "objects": "[{'id': 245, 'bbox_human': [226, 528, 101, 400], 'bbox_object': [36, 589, 106, 439], 'connection': 1, 'invis': 0}]",
    "positive_captions": "[('bench', 'lie_on')]",
    "negative_captions": "[('bench', 'sit_on'), ('bench', 'no_interaction')]",
    "ambiguous_captions": "[('bench', 'inspect')]",
    "positive_objects": "[244]",
    "negative_objects": "[245, 246]",
    "ambiguous_objects": "[243]",
    "size": "[640, 466, 3]"
  },
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "child",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The child is wearing a plaid sleeveless top with pink and white colors and pink pants with a pattern. She also has on gray sandals and white socks.",
        "clothing": {
          "vague": false,
          "clothing": [
            {
              "possible_names": [
                "shirt",
                "blouse",
                "t-shirt"
              ],
              "name": "shirt",
              "type": "top",
              "color": [
                "pink",
                "white"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "pants",
                "trousers",
                "leggings"
              ],
              "name": "pants",
              "type": "bottom",
              "color": [
                "pink"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "sneakers",
                "shoes"
              ],
              "name": "sneakers",
              "type": "footwear",
              "color": [
                "purple",
                "white"
              ],
              "belonging_confident": true,
              "existence_confident": true
            }
          ]
        },
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "bench"
            ],
            "name": "bench",
            "position": "body"
          }
        ],
        "description": "A young child appears to be sleeping on a wooden bench in a grassy field. She is dressed in a pink and white plaid sleeveless top and patterned pink leggings, complemented by gray sandals and white socks. The bench is the main object she is in contact with, supporting her as she rests.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The child appears to be resting or sleeping peacefully, showing no strong emotions.",
        "meaningful": true,
        "story": "A young girl is taking a nap on a wooden bench in a grassy field. She seems comfortable and at ease, suggesting she might have been playing outside and needed a moment to rest.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "A child is lying on a wooden bench outdoors, seemingly asleep or resting with one arm stretched out along the backrest and the other resting by their side. The child's relaxed posture suggests they might be taking a nap or simply enjoying a moment of rest in a peaceful environment. Wearing pink checkered clothing and sneakers, the child appears comfortable and at ease, possibly indicating a sense of security and contentment in this natural setting surrounded by grass and trees. The overall scene conveys a tranquil atmosphere where the child has found a quiet spot to relax amidst nature.",
        "intention": "The individual is seeking comfort and tranquility by resting in a natural setting to recharge and connect with the peaceful environment",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.7232642371739659,
            0.5289537648640111
          ],
          [
            0.7251248194703034,
            0.532162869437058
          ],
          [
            0.723906817819391,
            0.5369486520803465
          ],
          [
            0.7247304210705416,
            0.5430976382652577
          ],
          [
            0.7262238150196416,
            0.5446833089258977
          ],
          [
            0.727572001516819,
            0.5536721045074837
          ],
          [
            0.7338076406291554,
            0.5545309873390315
          ],
          [
            0.7379589606608663,
            0.5602082022123729
          ],
          [
            0.7526983410120011,
            0.557018063683805
          ],
          [
            0.7603973869766507,
            0.5580204179285494
          ],
          [
            0.76739367885249,
            0.5486018673764059
          ],
          [
            0.7656136474439076,
            0.5428211070656558
          ],
          [
            0.7648948537451881,
            0.5353744141095113
          ],
          [
            0.7650544860533306,
            0.5278702964086901
          ],
          [
            0.7669096014329365,
            0.526686028130284
          ],
          [
            0.7624557371650423,
            0.5242264199885468
          ],
          [
            0.7653990553958075,
            0.5158829764308263
          ],
          [
            0.7292588462787015,
            0.5424974944093051
          ],
          [
            0.7320464839892729,
            0.5434309550401698
          ],
          [
            0.7224784706320081,
            0.5430821936821952
          ],
          [
            0.7275225543550083,
            0.5442731149499216
          ],
          [
            0.7295528186219079,
            0.5449406891640968
          ],
          [
            0.7419284486344881,
            0.5461126363474778
          ],
          [
            0.7373645901679993,
            0.5438982240266408
          ],
          [
            0.7455868370831013,
            0.5426211877515315
          ],
          [
            0.7462761086012636,
            0.5399345619264809
          ],
          [
            0.7528238766959736,
            0.5360871160929368
          ],
          [
            0.7362114858414446,
            0.5525204660262453
          ],
          [
            0.73412642372506,
            0.5588124814317096
          ],
          [
            0.736690366161721,
            0.5623678952035255
          ],
          [
            0.7355844466813972,
            0.5660191522208845
          ],
          [
            0.7367759605603559,
            0.5546420822108472
          ],
          [
            0.739599263987371,
            0.5591873401955254
          ],
          [
            0.7431712361318724,
            0.5607686854081239
          ],
          [
            0.7388224636869771,
            0.5562571868218212
          ],
          [
            0.7402871449078832,
            0.5553135959594838
          ],
          [
            0.7295557617076806,
            0.5423382005393322
          ],
          [
            0.727405980761562,
            0.5445438735255576
          ],
          [
            0.7327824463801724,
            0.5443935601861838
          ],
          [
            0.7297822049685887,
            0.5491091748967922
          ],
          [
            0.728052455080407,
            0.547251210046063
          ],
          [
            0.7285321905144623,
            0.5447913245289403
          ],
          [
            0.7430773936212063,
            0.5466585834650523
          ],
          [
            0.7367681234010628,
            0.5465198394932095
          ],
          [
            0.7425301083496638,
            0.5438100508134983
          ],
          [
            0.7479181304574013,
            0.5444584419068056
          ],
          [
            0.7443433480603354,
            0.5481382082898802
          ],
          [
            0.7416811381067548,
            0.5448959392685601
          ],
          [
            0.743488180318049,
            0.5490572856000272
          ],
          [
            0.7395093151501246,
            0.554890996469887
          ],
          [
            0.7393875112490995,
            0.5580646693523789
          ],
          [
            0.7427832178771496,
            0.5563874808942372
          ],
          [
            0.7411215823675905,
            0.55350623402692
          ],
          [
            0.7452231439096587,
            0.55056844278028
          ],
          [
            0.7446722513863019,
            0.5497231232030928
          ],
          [
            0.745619999723775,
            0.5542946715504022
          ],
          [
            0.7426840163767338,
            0.5559667707732088
          ],
          [
            0.7393492428319794,
            0.5616400461120886
          ],
          [
            0.7402375524597509,
            0.5578355974832391
          ],
          [
            0.7387015688632216,
            0.5548035950839044
          ],
          [
            0.7468367353081703,
            0.5547360521675545
          ],
          [
            0.7369708849915436,
            0.556208561710753
          ],
          [
            0.7422487178019115,
            0.5595588141756508
          ],
          [
            0.7444943711161613,
            0.5553695534285704
          ],
          [
            0.7467262471360819,
            0.5490604291877302
          ],
          [
            0.7445031547120639,
            0.553831607413979
          ],
          [
            0.7415451584117754,
            0.555826338429454
          ],
          [
            0.7396138465830259,
            0.5538795330566837
          ]
        ],
        "visibility": [
          0.9818913340568542,
          1.0,
          0.023066537454724312,
          0.0015859281411394477,
          0.9410471320152283,
          0.8390467166900635,
          0.0003748788731172681,
          0.9544299840927124,
          1.4054961638976238e-07,
          0.9999977350234985,
          0.00022433271806221455,
          1.4535768059431575e-05,
          3.231148366467096e-05,
          1.2913539571002275e-08,
          0.9995960593223572,
          0.337028443813324,
          1.9591352611314505e-06,
          0.6041746139526367,
          1.5481526133953594e-05,
          0.00037927425000816584,
          7.043552963104105e-10,
          0.06404244899749756,
          0.9964210987091064,
          0.5171685814857483,
          0.9999874830245972,
          1.0,
          0.999866247177124,
          0.9999971389770508,
          0.9999982118606567
        ],
        "headpose": {
          "pitch": -44.63921699990067,
          "yaw": 5.9536411117473955,
          "roll": 19.67470995141669
        },
        "attributes": {
          "5 oClock Shadow": 0.0007420724723488092,
          "Arched Eyebrows": 0.02992662414908409,
          "Attractive": 0.20306281745433807,
          "Bags Under Eyes": 0.0016930518904700875,
          "Bald": 1.3779996152152307e-05,
          "Bangs": 0.005688851699233055,
          "Big Lips": 0.1217970922589302,
          "Big Nose": 0.010813469998538494,
          "Black Hair": 0.004525971133261919,
          "Blond Hair": 0.09956707060337067,
          "Blurry": 0.18996350467205048,
          "Brown Hair": 0.08814164251089096,
          "Bushy Eyebrows": 0.0009963427437469363,
          "Chubby": 0.0022637187503278255,
          "Double Chin": 4.0745486330706626e-05,
          "Eyeglasses": 0.1423313468694687,
          "Goatee": 0.00037191814044490457,
          "Gray Hair": 0.0007128294091671705,
          "Heavy Makeup": 0.01147279143333435,
          "High Cheekbones": 0.013238049112260342,
          "Male": 0.02635198086500168,
          "Mouth Slightly Open": 0.005924707744270563,
          "Mustache": 0.00026660875300876796,
          "Narrow Eyes": 0.015875453129410744,
          "No Beard": 0.9773944616317749,
          "Oval Face": 0.03431662172079086,
          "Pale Skin": 0.06174330785870552,
          "Pointy Nose": 0.10659673810005188,
          "Receding Hairline": 0.022472023963928223,
          "Rosy Cheeks": 0.0003325998259242624,
          "Sideburns": 0.004778735805302858,
          "Smiling": 0.0023289655800908804,
          "Straight Hair": 0.6753700375556946,
          "Wavy Hair": 0.04395872354507446,
          "Wearing Earrings": 0.007411719299852848,
          "Wearing Hat": 0.003281062701717019,
          "Wearing Lipstick": 0.033097390085458755,
          "Wearing Necklace": 0.09359530359506607,
          "Wearing Necktie": 0.00016279661213047802,
          "Young": 0.9952580332756042
        },
        "age": [
          0.8788846731185913,
          0.8242617845535278,
          0.9987819790840149,
          0.004720277152955532,
          1.4197238670021761e-05,
          8.349339708502157e-08,
          4.0952980384645343e-07,
          2.785871267008133e-08
        ],
        "race": [
          0.8840683698654175,
          0.0008018699591048062,
          0.9999641180038452,
          0.0021428975742310286,
          0.04770290106534958
        ],
        "gender": [
          0.018904367461800575,
          0.9845274686813354
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 0.001594747655847855,
          "disgust": 1.1895023547016739e-07,
          "fear": 0.0008193212057539594,
          "happy": 98.6561717204843,
          "sad": 0.00021164996474782658,
          "surprise": 0.044036869647242766,
          "neutral": 1.2971583138813598
        },
        "dominant_emotion": "happy",
        "region": {
          "x": 0,
          "y": 0,
          "w": 77,
          "h": 54,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 33,
        "gender": {
          "Woman": 8.423179388046265,
          "Man": 91.57682061195374
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 29.07002817749641,
          "indian": 1.8575599065351598,
          "black": 0.14493348444673604,
          "white": 39.46695453322476,
          "middle eastern": 20.88664223114941,
          "latino hispanic": 8.573875299230183
        },
        "dominant_race": "white"
      },
      "hoi": [
        {
          "relationship": {
            "action": [
              [
                "head",
                "lie on"
              ]
            ],
            "negative_action": [
              "sit on",
              "no interaction"
            ],
            "position": "head"
          },
          "object": 0
        }
      ]
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.3575146496295929,
        0.2215011715888977,
        0.8131550550460815,
        0.8654903173446655
      ]
    ],
    "face_boxes": [
      [
        0.7082785367965698,
        0.49457308650016785,
        0.7901396751403809,
        0.5743704438209534
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.689754451914794,
            0.496814311630793
          ],
          [
            0.6932629593958458,
            0.42866623253838243
          ],
          [
            0.6471511467877361,
            0.34468577143460377
          ],
          [
            0.6020417648884985,
            0.2689656835541478
          ],
          [
            0.6862459444337421,
            0.5649623907232034
          ],
          [
            0.6621876074208153,
            0.5966271547459397
          ],
          [
            0.6281049633191692,
            0.6214082744159072
          ],
          [
            0.5619445365336206,
            0.4796052007488712
          ],
          [
            0.5619445365336206,
            0.5773529505581873
          ],
          [
            0.45869417351981,
            0.6847378024613797
          ],
          [
            0.5829955814199316,
            0.556702017499881
          ],
          [
            0.4807476491149929,
            0.6971283622963634
          ],
          [
            0.402558053822981,
            0.7962528409762332
          ],
          [
            0.7564160940547785,
            0.5415579999237898
          ],
          [
            0.7544112326370346,
            0.5649623907232034
          ],
          [
            0.745389356257187,
            0.48098192961942476
          ],
          [
            0.7413796334216991,
            0.5388045421826823
          ]
        ],
        "dw_hand_1": [
          [
            0.6261001019014252,
            0.622785003286461
          ],
          [
            0.6160757948127058,
            0.6269151898981221
          ],
          [
            0.6050490570151144,
            0.628291918768676
          ],
          [
            0.5980320420530107,
            0.6351755631214447
          ],
          [
            0.5900125963820351,
            0.6420592074742133
          ],
          [
            0.6050490570151144,
            0.6489428518269821
          ],
          [
            0.5990344727618826,
            0.6613334116619658
          ],
          [
            0.5970296113441387,
            0.6627101405325194
          ],
          [
            0.5970296113441387,
            0.6613334116619658
          ],
          [
            0.611063641268346,
            0.6558264961797509
          ],
          [
            0.6060514877239862,
            0.6695937848852882
          ],
          [
            0.6040466263062424,
            0.6682170560147346
          ],
          [
            0.6060514877239862,
            0.6640868694030733
          ],
          [
            0.6170782255215777,
            0.6613334116619658
          ],
          [
            0.6130685026860899,
            0.670970513755842
          ],
          [
            0.611063641268346,
            0.6695937848852882
          ],
          [
            0.6130685026860899,
            0.6654635982736271
          ],
          [
            0.6230928097748094,
            0.6640868694030733
          ],
          [
            0.6200855176481935,
            0.6723472426263959
          ],
          [
            0.6190830869393217,
            0.6723472426263959
          ],
          [
            0.6200855176481935,
            0.6695937848852882
          ]
        ],
        "dw_hand_2": [
          [
            0.5980320420530107,
            0.26758895468359395
          ],
          [
            0.5860028735465473,
            0.26758895468359395
          ],
          [
            0.5759785664578277,
            0.2703424124247014
          ],
          [
            0.5689615514957242,
            0.2689656835541478
          ],
          [
            0.5619445365336206,
            0.26758895468359395
          ],
          [
            0.5779834278755718,
            0.2496914793663953
          ],
          [
            0.5729712743312121,
            0.24143110614307275
          ],
          [
            0.5699639822045963,
            0.23730091953141155
          ],
          [
            0.5659542593691084,
            0.23179400404919662
          ],
          [
            0.5829955814199316,
            0.2428078350136265
          ],
          [
            0.5789858585844438,
            0.23592419066085782
          ],
          [
            0.5759785664578277,
            0.23041727517864277
          ],
          [
            0.5709664129134682,
            0.22628708856698157
          ],
          [
            0.5890101656731632,
            0.24005437727251902
          ],
          [
            0.5860028735465473,
            0.23317073291975024
          ],
          [
            0.5829955814199316,
            0.2276638174375353
          ],
          [
            0.5789858585844438,
            0.2235336308258741
          ],
          [
            0.5960271806352668,
            0.2386776484019653
          ],
          [
            0.5950247499263949,
            0.23454746179030408
          ],
          [
            0.5920174577997791,
            0.23041727517864277
          ],
          [
            0.5890101656731632,
            0.22628708856698157
          ]
        ],
        "dw_face": [
          [
            0.7544112326370346,
            0.49337248945440854
          ],
          [
            0.7463917869660589,
            0.4947492183249624
          ],
          [
            0.7393747720039553,
            0.4961259471955161
          ],
          [
            0.7313553263329797,
            0.4988794049366236
          ],
          [
            0.725340742079748,
            0.5030095915482847
          ],
          [
            0.7203285885353884,
            0.5112699647716072
          ],
          [
            0.7163188656999004,
            0.5195303379949299
          ],
          [
            0.7123091428644127,
            0.5305441689593597
          ],
          [
            0.709301850737797,
            0.540181271053236
          ],
          [
            0.7072969893200529,
            0.5498183731471122
          ],
          [
            0.7103042814466688,
            0.5594554752409885
          ],
          [
            0.7163188656999004,
            0.562208932982096
          ],
          [
            0.723335880662004,
            0.566339119593757
          ],
          [
            0.7303528956241078,
            0.5677158484643109
          ],
          [
            0.7383723412950834,
            0.5690925773348648
          ],
          [
            0.745389356257187,
            0.566339119593757
          ],
          [
            0.7524063712192905,
            0.566339119593757
          ],
          [
            0.765437970434626,
            0.5305441689593597
          ],
          [
            0.7664404011434979,
            0.5360510844415748
          ],
          [
            0.7664404011434979,
            0.5415579999237898
          ],
          [
            0.765437970434626,
            0.5484416442765586
          ],
          [
            0.7634331090168821,
            0.5539485597587733
          ],
          [
            0.7604258168902662,
            0.5608322041115424
          ],
          [
            0.7604258168902662,
            0.562208932982096
          ],
          [
            0.7594233861813942,
            0.5635856618526496
          ],
          [
            0.7584209554725223,
            0.5635856618526496
          ],
          [
            0.7574185247636503,
            0.5649623907232034
          ],
          [
            0.7544112326370346,
            0.5594554752409885
          ],
          [
            0.7514039405104187,
            0.562208932982096
          ],
          [
            0.7483966483838028,
            0.5649623907232034
          ],
          [
            0.745389356257187,
            0.5677158484643109
          ],
          [
            0.7403772027128273,
            0.5525718308882197
          ],
          [
            0.7393747720039553,
            0.556702017499881
          ],
          [
            0.7383723412950834,
            0.5608322041115424
          ],
          [
            0.7383723412950834,
            0.5649623907232034
          ],
          [
            0.7393747720039553,
            0.566339119593757
          ],
          [
            0.7564160940547785,
            0.534674355571021
          ],
          [
            0.7564160940547785,
            0.5388045421826823
          ],
          [
            0.7574185247636503,
            0.5443114576648973
          ],
          [
            0.7544112326370346,
            0.5470649154060048
          ],
          [
            0.7544112326370346,
            0.5429347287943435
          ],
          [
            0.7544112326370346,
            0.5388045421826823
          ],
          [
            0.7534088019281626,
            0.5608322041115424
          ],
          [
            0.7534088019281626,
            0.5635856618526496
          ],
          [
            0.7524063712192905,
            0.5649623907232034
          ],
          [
            0.7504015098015466,
            0.566339119593757
          ],
          [
            0.7514039405104187,
            0.5635856618526496
          ],
          [
            0.7514039405104187,
            0.562208932982096
          ],
          [
            0.7283480342063638,
            0.5456881865354509
          ],
          [
            0.7313553263329797,
            0.5525718308882197
          ],
          [
            0.7333601877507236,
            0.5608322041115424
          ],
          [
            0.7323577570418516,
            0.562208932982096
          ],
          [
            0.7323577570418516,
            0.5649623907232034
          ],
          [
            0.7293504649152359,
            0.566339119593757
          ],
          [
            0.725340742079748,
            0.5635856618526496
          ],
          [
            0.7243383113708761,
            0.5635856618526496
          ],
          [
            0.723335880662004,
            0.562208932982096
          ],
          [
            0.7223334499531322,
            0.5608322041115424
          ],
          [
            0.7243383113708761,
            0.5539485597587733
          ],
          [
            0.72634317278862,
            0.5498183731471122
          ],
          [
            0.7283480342063638,
            0.5470649154060048
          ],
          [
            0.7293504649152359,
            0.5539485597587733
          ],
          [
            0.7293504649152359,
            0.562208932982096
          ],
          [
            0.727345603497492,
            0.5635856618526496
          ],
          [
            0.72634317278862,
            0.5635856618526496
          ],
          [
            0.725340742079748,
            0.562208932982096
          ],
          [
            0.72634317278862,
            0.5608322041115424
          ],
          [
            0.727345603497492,
            0.5525718308882197
          ]
        ],
        "dw_foot_1": [
          [
            0.36847540972133475,
            0.8306710627400766
          ],
          [
            0.3885240238987738,
            0.8389314359633994
          ],
          [
            0.3885240238987738,
            0.7962528409762332
          ]
        ],
        "dw_foot_2": [
          [
            0.4757354955706331,
            0.7700949924357119
          ],
          [
            0.45869417351981,
            0.7577044326007282
          ],
          [
            0.44265528217785893,
            0.6916214468141482
          ]
        ]
      }
    ]
  },
  "objects": [
    {
      "name": "bench",
      "possible_names": [
        "bench"
      ],
      "box": [
        0.05625,
        0.22746781115879827,
        0.9203125,
        0.9420600858369099
      ]
    }
  ],
  "scene": "A wooden bench sits amidst a grassy field with trees in the background and a child resting on it wearing pink clothing and sneakers.",
  "overall_past": "Before the current scene, the child likely wandered through the grassy field, perhaps playing or exploring near the trees, drawn by the quiet and inviting presence of the wooden bench. They may have climbed onto it to get a better view of the surroundings or simply to sit and rest after some activity. The pink checkered clothing and sneakers suggest they were dressed for a casual outing, possibly with family or friends, and the relaxed posture indicates they felt safe and comfortable enough to let go and rest, perhaps after a period of play or a short walk. The peaceful setting likely encouraged this moment of stillness, making the bench a natural spot to pause and enjoy the calm of nature.",
  "overall_past_clean": "The figure moved through the open space with purpose, pausing only to step over a low root, then slowed as the quiet of the area drew them in, eventually settling onto the surface with a soft exhale, having been guided by the stillness of the surroundings.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the child is likely to wake up slowly, stretching their arms and legs as they take in the peaceful surroundings. They may sit up, glance around with curiosity, and then hop off the bench to explore the grassy field—perhaps chasing a butterfly, picking a wildflower, or running toward the trees, drawn by the rustling leaves and the soft sunlight filtering through the branches.",
  "overall_future_clean": "The figure rises with deliberate ease, limbs unfolding like dawn breaking over the horizon, then moves with quiet purpose toward the edge of the clearing, feet sinking slightly into the soft earth as the wind lifts the hair at the nape of the neck and the first true step is taken into the dappled light beyond.",
  "future_scene_ok": true
}