{
  "image_path": "./ref_datasets/hico_det/images/train/train_00016503.jpg",
  "image_id": "train_00016503",
  "width": 640,
  "height": 480,
  "split": "train",
  "source": "zhimeng/hico_det",
  "dataset_index": 16503,
  "annotations": {
    "objects": "[{'id': 202, 'bbox_human': [186, 637, 6, 477], 'bbox_object': [214, 263, 341, 395], 'connection': 1, 'invis': 0}, {'id': 203, 'bbox_human': [172, 638, 19, 477], 'bbox_object': [214, 265, 345, 394], 'connection': 1, 'invis': 0}, {'id': 205, 'bbox_human': [156, 633, 17, 474], 'bbox_object': [201, 275, 330, 396], 'connection': 1, 'invis': 0}]",
    "positive_captions": "[('apple', 'hold'), ('apple', 'inspect'), ('apple', 'pick')]",
    "negative_captions": "[('apple', 'buy'), ('apple', 'cut'), ('apple', 'eat'), ('apple', 'peel'), ('apple', 'smell'), ('apple', 'wash'), ('apple', 'no_interaction')]",
    "ambiguous_captions": "[]",
    "positive_objects": "[201, 202, 204]",
    "negative_objects": "[198, 199, 200, 203, 205, 206, 207]",
    "ambiguous_objects": "[]",
    "size": "[640, 480, 3]"
  },
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a sleeveless top.",
        "clothing": [
          {
            "possible_names": [
              "sleeveless",
              "tank top"
            ],
            "name": "tank top",
            "type": "top",
            "color": [
              "black"
            ]
          },
          {
            "possible_names": [
              "bracelet",
              "earring"
            ],
            "name": "earring",
            "type": "accessory",
            "color": [
              "greenish-blue"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "apple"
            ],
            "name": "apple",
            "position": "hand"
          }
        ],
        "description": "The person is an adult female in the foreground, showing a neutral emotion. She is wearing a black tank top and blue-green earrings. She is holding an apple in her hand.",
        "blurry": false,
        "face_seen": false,
        "emotion_description": "The person appears to be focused on picking an apple, showing a neutral expression as their face is not fully visible.",
        "meaningful": true,
        "story": "A woman is engaged in apple picking at an orchard. She seems to be carefully selecting an apple from the tree, suggesting she might be enjoying a leisurely day outdoors or participating in a seasonal activity.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is carefully examining an apple she has just picked from a tree, likely assessing its quality before deciding whether to keep it. Her posture suggests focus and attention to detail as she leans slightly forward, her hand gently cradling the fruit. The surrounding environment indicates she is in an orchard, possibly engaging in apple picking for leisure or work purposes. Her expression, though not fully visible, seems concentrated on the task at hand, indicating a sense of purpose and enjoyment in the activity. The presence of other apples on the tree and around her suggests she may be selecting the best ones for personal use or sale.",
        "intention": "The individual is selecting high quality apples from the tree with deliberate care indicating a clear intention to choose the best fruit for personal use or sale",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.3748554179178817,
            0.25764502116612026
          ],
          [
            0.3751406278461218,
            0.26388611708368576
          ],
          [
            0.3640242441956486,
            0.29915090118135723
          ],
          [
            0.36373788448316713,
            0.3204860031604767
          ],
          [
            0.3606926293777568,
            0.33496861457824706
          ],
          [
            0.36182469108275006,
            0.3623789140156337
          ],
          [
            0.3693443117397172,
            0.3888754044260298
          ],
          [
            0.3746023940188544,
            0.4085352148328508
          ],
          [
            0.38585637116006444,
            0.4193615879331316
          ],
          [
            0.41278582470757624,
            0.4414904866899763
          ],
          [
            0.4302454649337701,
            0.4319423709596907
          ],
          [
            0.4435221900897367,
            0.4224234410694667
          ],
          [
            0.45715434923768045,
            0.41786104610988073
          ],
          [
            0.4722022971936635,
            0.3883383699825832
          ],
          [
            0.4798182935586997,
            0.38226458685738696
          ],
          [
            0.48358662022011617,
            0.37317951066153393
          ],
          [
            0.4979673919933182,
            0.36269786953926086
          ],
          [
            0.37388466697718414,
            0.24614182178463254
          ],
          [
            0.3884514738406454,
            0.2584967119353158
          ],
          [
            0.39885662474802563,
            0.26037235174860274
          ],
          [
            0.4092580884162869,
            0.26664209025246755
          ],
          [
            0.4243606312998704,
            0.2864359438419342
          ],
          [
            0.4397219707923276,
            0.31405600479670936
          ],
          [
            0.4487069875001907,
            0.31936171139989583
          ],
          [
            0.4687536422695432,
            0.3319585485117776
          ],
          [
            0.46920835418360574,
            0.3341334274836949
          ],
          [
            0.47639824843832423,
            0.33932729874338424
          ],
          [
            0.43432164830820896,
            0.3186706457819258
          ],
          [
            0.42283005437680654,
            0.3233630657196045
          ],
          [
            0.41582969214235027,
            0.334805029630661
          ],
          [
            0.4084785109119756,
            0.3373559994356973
          ],
          [
            0.40787763366741797,
            0.34111280526433674
          ],
          [
            0.41304351910948756,
            0.3434123890740531
          ],
          [
            0.4175143877310412,
            0.3479036365236555
          ],
          [
            0.41965087716068544,
            0.35595216580799643
          ],
          [
            0.4187718393547194,
            0.36328528608594624
          ],
          [
            0.387239347504718,
            0.27165213099547797
          ],
          [
            0.3894920127200229,
            0.2815888698611941
          ],
          [
            0.4031953554068293,
            0.2944510536534446
          ],
          [
            0.40916205367871694,
            0.30507119638579233
          ],
          [
            0.3985104048890727,
            0.2981107388223921
          ],
          [
            0.3891668299479144,
            0.28006992765835353
          ],
          [
            0.44500120910150665,
            0.33435976760728015
          ],
          [
            0.43707053661346434,
            0.3368975588253566
          ],
          [
            0.4453641127262797,
            0.3452921220234462
          ],
          [
            0.4615044825843402,
            0.35359741364206587
          ],
          [
            0.44401261668120107,
            0.35912872041974747
          ],
          [
            0.44452201074787545,
            0.3350943497249058
          ],
          [
            0.3790750705770084,
            0.35631305490221293
          ],
          [
            0.390901664059077,
            0.3671460313456399
          ],
          [
            0.4014780059456825,
            0.3611476293631962
          ],
          [
            0.4058707685342856,
            0.3660147053854806
          ],
          [
            0.40775751689715045,
            0.3605900168418884
          ],
          [
            0.4142761353935514,
            0.3733533799648285
          ],
          [
            0.41850294843316077,
            0.38921540634972707
          ],
          [
            0.4096761578960078,
            0.38457749911717004
          ],
          [
            0.40108851455152034,
            0.39344325065612795
          ],
          [
            0.38978469228105883,
            0.3859668987137931
          ],
          [
            0.38725963921419215,
            0.3851048486573356
          ],
          [
            0.37860369868576527,
            0.3626557767391205
          ],
          [
            0.3817784670740366,
            0.36346487828663415
          ],
          [
            0.39571586618466037,
            0.36583700520651685
          ],
          [
            0.4077077589929104,
            0.3768544912338257
          ],
          [
            0.40902497560850215,
            0.3829976984432765
          ],
          [
            0.4207008442708425,
            0.38725697653634206
          ],
          [
            0.40871584223849433,
            0.3838890280042376
          ],
          [
            0.40037977168602606,
            0.38085692269461496
          ],
          [
            0.39065534855638234,
            0.3673557928630284
          ]
        ],
        "visibility": [
          0.9999990463256836,
          0.9999926090240479,
          1.0,
          0.9999998807907104,
          1.0,
          0.9999966621398926,
          0.10470566898584366,
          0.9994943141937256,
          0.009708068333566189,
          0.999936580657959,
          0.9889754056930542,
          0.9900206327438354,
          0.6466607451438904,
          0.00013798606232739985,
          0.9999995231628418,
          0.06325645744800568,
          1.6761533743192558e-06,
          0.07980380952358246,
          0.0002607971546240151,
          3.0591641007049475e-06,
          0.00029462744714692235,
          0.00017724146891850978,
          0.9633390307426453,
          0.008087228052318096,
          0.04489626735448837,
          0.9515324234962463,
          0.04379381984472275,
          0.04446913301944733,
          0.5790863633155823
        ],
        "headpose": {
          "pitch": 15.262889275924941,
          "yaw": 1.7701634786061027,
          "roll": 48.10560630557384
        },
        "attributes": {
          "5 oClock Shadow": 0.0009491483797319233,
          "Arched Eyebrows": 0.001951960613951087,
          "Attractive": 0.08672714978456497,
          "Bags Under Eyes": 0.0014284108765423298,
          "Bald": 7.864542084234927e-08,
          "Bangs": 0.13248972594738007,
          "Big Lips": 0.039410870522260666,
          "Big Nose": 0.0036256383173167706,
          "Black Hair": 0.010295061394572258,
          "Blond Hair": 0.01119781844317913,
          "Blurry": 0.014091662131249905,
          "Brown Hair": 0.36795270442962646,
          "Bushy Eyebrows": 0.0002740491181612015,
          "Chubby": 0.0013758536661043763,
          "Double Chin": 5.725586015614681e-05,
          "Eyeglasses": 0.03623563051223755,
          "Goatee": 0.006641794927418232,
          "Gray Hair": 0.00012090600648662075,
          "Heavy Makeup": 0.010906103067100048,
          "High Cheekbones": 0.006039278581738472,
          "Male": 0.1517757773399353,
          "Mouth Slightly Open": 0.19650770723819733,
          "Mustache": 0.0014134818920865655,
          "Narrow Eyes": 0.035510264337062836,
          "No Beard": 0.8949264883995056,
          "Oval Face": 0.035688575357198715,
          "Pale Skin": 0.0013878338504582644,
          "Pointy Nose": 0.13903871178627014,
          "Receding Hairline": 0.00024117187422234565,
          "Rosy Cheeks": 0.0007118860958144069,
          "Sideburns": 0.010125759989023209,
          "Smiling": 0.0013809667434543371,
          "Straight Hair": 0.0960402861237526,
          "Wavy Hair": 0.17041674256324768,
          "Wearing Earrings": 0.011679758317768574,
          "Wearing Hat": 0.033490151166915894,
          "Wearing Lipstick": 0.019763244315981865,
          "Wearing Necklace": 0.020223043859004974,
          "Wearing Necktie": 0.00039344653487205505,
          "Young": 0.9814999103546143
        },
        "age": [
          0.13243120908737183,
          0.8555749654769897,
          0.9911494255065918,
          0.5327640771865845,
          0.05674509331583977,
          7.529579306719825e-05,
          1.6937043255893514e-05,
          1.3709477286738547e-07
        ],
        "race": [
          0.9944899082183838,
          0.00023536168737336993,
          0.9938604831695557,
          0.056602802127599716,
          0.046489376574754715
        ],
        "gender": [
          0.033235225826501846,
          0.9731821417808533
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 1.2222040444612503,
          "disgust": 0.1635405351407826,
          "fear": 42.35734045505524,
          "happy": 1.977972686290741,
          "sad": 53.91305685043335,
          "surprise": 0.01328065263805911,
          "neutral": 0.35260652657598257
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 148,
          "h": 131,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 32,
        "gender": {
          "Woman": 38.70163857936859,
          "Man": 61.29835844039917
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 23.483803868293762,
          "indian": 6.749801337718964,
          "black": 3.9634548127651215,
          "white": 33.47845375537872,
          "middle eastern": 13.357555866241455,
          "latino hispanic": 18.966929614543915
        },
        "dominant_race": "white"
      },
      "hoi": [
        {
          "relationship": {
            "action": [
              [
                "hand",
                "hold"
              ],
              [
                "hand",
                "inspect"
              ],
              [
                "hand",
                "pick"
              ]
            ],
            "negative_action": [
              "buy",
              "cut",
              "eat",
              "peel",
              "smell",
              "wash",
              "no interaction"
            ],
            "position": "hand"
          },
          "object": 0
        }
      ]
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.29130619764328003,
        0.02365620993077755,
        0.9984514117240906,
        0.9976072907447815
      ]
    ],
    "face_boxes": [
      [
        0.3202468454837799,
        0.26602017879486084,
        0.47600722312927246,
        0.4492090046405792
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.5901940378877851,
            0.17543722082067414
          ],
          [
            0.6024477726883358,
            0.6308676975744743
          ],
          [
            0.4554029550817278,
            0.7677010695139568
          ],
          [
            0.5580279840363396,
            0.25508649702425346
          ],
          [
            0.8628396372000375,
            0.6574174563090007
          ],
          [
            0.9547426482041678,
            1.0148180546583954
          ],
          [
            1.0864702973100875,
            0.5798104692388465
          ],
          [
            -1.0,
            -1.0
          ],
          [
            1.0864702973100875,
            0.82896974351671
          ],
          [
            1.016011322206921,
            0.5471338431040447
          ],
          [
            -1.0,
            -1.0
          ],
          [
            1.0864702973100875,
            0.9576339589224921
          ],
          [
            0.3634999440775978,
            0.36128553196235924
          ],
          [
            0.35890479352739124,
            0.35515866456208406
          ],
          [
            0.433958919180764,
            0.24079047309027773
          ],
          [
            0.39719771477911203,
            0.28163625575878004
          ]
        ],
        "dw_hand_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_hand_2": [
          [
            0.4477443708313835,
            0.7677010695139568
          ],
          [
            0.42323690123028224,
            0.7493204673131308
          ],
          [
            0.4017928653293186,
            0.7248129977120293
          ],
          [
            0.38034882942835485,
            0.718686130311754
          ],
          [
            0.3604365103774601,
            0.7248129977120293
          ],
          [
            0.369626811477873,
            0.7697433586473817
          ],
          [
            0.3543096429771847,
            0.7881239608482077
          ],
          [
            0.35890479352739124,
            0.7840393825813574
          ],
          [
            0.36196822722752897,
            0.7799548043145074
          ],
          [
            0.3711585283279419,
            0.8024199847821835
          ],
          [
            0.35277792612711584,
            0.8146737195827343
          ],
          [
            0.3604365103774601,
            0.7962931173819083
          ],
          [
            0.3711585283279419,
            0.7779125151810823
          ],
          [
            0.3772853957282173,
            0.8208005869830095
          ],
          [
            0.3558413598272535,
            0.82488516524986
          ],
          [
            0.3634999440775978,
            0.8024199847821835
          ],
          [
            0.3711585283279419,
            0.7819970934479326
          ],
          [
            0.3880074136786991,
            0.8330543217835603
          ],
          [
            0.369626811477873,
            0.8330543217835603
          ],
          [
            0.369626811477873,
            0.8146737195827343
          ],
          [
            0.3711585283279419,
            0.7962931173819083
          ]
        ],
        "dw_face": [
          [
            0.3711585283279419,
            0.3735392667629101
          ],
          [
            0.38034882942835485,
            0.3878352906968858
          ],
          [
            0.3926025642289055,
            0.3980467363640113
          ],
          [
            0.4048562990294563,
            0.4123427602979872
          ],
          [
            0.42170518438021337,
            0.4245964950985378
          ],
          [
            0.43855406973097055,
            0.43072336249881327
          ],
          [
            0.4538712382316589,
            0.4388925190325136
          ],
          [
            0.4691884067323473,
            0.4388925190325136
          ],
          [
            0.4799104246828291,
            0.4245964950985378
          ],
          [
            0.4799104246828291,
            0.40213131463086155
          ],
          [
            0.4691884067323473,
            0.38375071243003556
          ],
          [
            0.4584663887818653,
            0.3633278210957846
          ],
          [
            0.4446809371312458,
            0.3449472188949586
          ],
          [
            0.433958919180764,
            0.32860890582755753
          ],
          [
            0.417110033830007,
            0.3163551710270069
          ],
          [
            0.4033245821793875,
            0.30001685795960603
          ],
          [
            0.389539130528768,
            0.2918477014259055
          ],
          [
            0.3604365103774601,
            0.3653701102292095
          ],
          [
            0.3604365103774601,
            0.3674123993626349
          ],
          [
            0.35890479352739124,
            0.3674123993626349
          ],
          [
            0.35890479352739124,
            0.3674123993626349
          ],
          [
            0.35890479352739124,
            0.3653701102292095
          ],
          [
            0.3543096429771847,
            0.3653701102292095
          ],
          [
            0.3543096429771847,
            0.36128553196235924
          ],
          [
            0.3543096429771847,
            0.3572009536955092
          ],
          [
            0.3558413598272535,
            0.3531163754286589
          ],
          [
            0.3558413598272535,
            0.3490317971618089
          ],
          [
            0.369626811477873,
            0.3714969776294849
          ],
          [
            0.3757536788781485,
            0.38375071243003556
          ],
          [
            0.38034882942835485,
            0.39600444723058636
          ],
          [
            0.3880074136786991,
            0.40825818203113695
          ],
          [
            0.39413428107897436,
            0.4103004711645621
          ],
          [
            0.3987294316291809,
            0.4103004711645621
          ],
          [
            0.4048562990294563,
            0.40825818203113695
          ],
          [
            0.4048562990294563,
            0.4041736037642869
          ],
          [
            0.4017928653293186,
            0.40213131463086155
          ],
          [
            0.37269024517801075,
            0.3714969776294849
          ],
          [
            0.37269024517801075,
            0.3735392667629101
          ],
          [
            0.3711585283279419,
            0.3735392667629101
          ],
          [
            0.369626811477873,
            0.3714969776294849
          ],
          [
            0.369626811477873,
            0.3714969776294849
          ],
          [
            0.3711585283279419,
            0.3714969776294849
          ],
          [
            0.3711585283279419,
            0.3694546884960598
          ],
          [
            0.36656337777773534,
            0.3694546884960598
          ],
          [
            0.36656337777773534,
            0.3653701102292095
          ],
          [
            0.36656337777773534,
            0.3633278210957846
          ],
          [
            0.3680950946278042,
            0.3653701102292095
          ],
          [
            0.3711585283279419,
            0.3674123993626349
          ],
          [
            0.42936376863055764,
            0.4245964950985378
          ],
          [
            0.42476861808035105,
            0.42663878423196294
          ],
          [
            0.4186417506800758,
            0.42051191683168754
          ],
          [
            0.4186417506800758,
            0.42051191683168754
          ],
          [
            0.417110033830007,
            0.4184696276982626
          ],
          [
            0.42170518438021337,
            0.41642733856483727
          ],
          [
            0.4308954854806263,
            0.4123427602979872
          ],
          [
            0.43549063603083304,
            0.4184696276982626
          ],
          [
            0.4400857865810394,
            0.4245964950985378
          ],
          [
            0.4400857865810394,
            0.4327656516322384
          ],
          [
            0.43702235288090174,
            0.4327656516322384
          ],
          [
            0.433958919180764,
            0.42868107336538813
          ],
          [
            0.4308954854806263,
            0.4245964950985378
          ],
          [
            0.4263003349304199,
            0.4245964950985378
          ],
          [
            0.42323690123028224,
            0.42051191683168754
          ],
          [
            0.42476861808035105,
            0.41642733856483727
          ],
          [
            0.4308954854806263,
            0.41438504943141236
          ],
          [
            0.43549063603083304,
            0.4184696276982626
          ],
          [
            0.43702235288090174,
            0.4245964950985378
          ],
          [
            0.433958919180764,
            0.42663878423196294
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "objects": [
    {
      "name": "apple",
      "possible_names": [
        "apple"
      ],
      "box": [
        0.334375,
        0.7104166666666667,
        0.4109375,
        0.8229166666666666
      ]
    },
    {
      "name": "apple",
      "possible_names": [
        "apple"
      ],
      "box": [
        0.3140625,
        0.6875,
        0.4296875,
        0.825
      ]
    }
  ],
  "scene": "An apple orchard scene with ripe red apples hanging from branches amidst green foliage and grass under natural daylight conditions showcasing a serene agricultural setting",
  "overall_past": "Before the current scene, the individual likely walked through the orchard, inspecting the trees and identifying the ripest apples based on their color, size, and position on the branches. She may have gathered a small basket or container earlier, possibly placing a few apples inside as she moved from tree to tree. The careful way she is now holding the apple suggests she has already made several selections, refining her choices to ensure only the highest quality fruit is kept. This indicates a deliberate and thoughtful process, possibly driven by a desire to harvest the best apples for eating, preserving, or selling.",
  "overall_past_clean": "The individual moved deliberately through the rows of trees, pausing at each to assess the fruit, selecting only those with the deepest hue and most promising form, carefully transferring them into a container with practiced precision.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to place the inspected apple into a nearby basket or container, then continue selecting and evaluating other apples from the tree, moving methodically through the branches to gather only the ripest and most perfect fruit. This suggests a deliberate and mindful process, possibly for personal consumption, gift-giving, or preparing for sale, reflecting a harmonious connection with the natural environment and the seasonal harvest.",
  "overall_future_clean": "The hand reaches forward, plucks another fruit with precision, inspects it briefly, then deposits it into the waiting container before moving steadily to the next branch, each motion deliberate and purposeful, as the gathering continues with quiet focus and intention.",
  "future_scene_ok": true
}