{
  "image_path": "./ref_datasets/hico_det/images/train/train_00012102.jpg",
  "image_id": "train_00012102",
  "width": 640,
  "height": 463,
  "split": "train",
  "source": "zhimeng/hico_det",
  "dataset_index": 12102,
  "annotations": {
    "objects": "[{'id': 378, 'bbox_human': [1, 638, 3, 447], 'bbox_object': [146, 375, 143, 399], 'connection': 1, 'invis': 0}, {'id': 381, 'bbox_human': [2, 638, 19, 445], 'bbox_object': [141, 375, 77, 400], 'connection': 1, 'invis': 0}]",
    "positive_captions": "[('knife', 'hold'), ('knife', 'wield')]",
    "negative_captions": "[('knife', 'cut_with'), ('knife', 'stick'), ('knife', 'wash'), ('knife', 'no_interaction')]",
    "ambiguous_captions": "[('knife', 'lick')]",
    "positive_objects": "[377, 380]",
    "negative_objects": "[376, 378, 379, 382]",
    "ambiguous_objects": "[381]",
    "size": "[640, 463, 3]"
  },
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a dark top.",
        "clothing": {
          "vague": false,
          "clothing": [
            {
              "possible_names": [
                "hair",
                "long hair"
              ],
              "name": "hair",
              "type": "accessory",
              "color": [
                "black"
              ],
              "belonging_confident": true,
              "existence_confident": true
            }
          ]
        },
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "knife"
            ],
            "name": "knife",
            "position": "hand"
          }
        ],
        "description": "The person is in the foreground, an adult female, showing a neutral emotion. She has long hair and is wearing a dark top, holding a knife in her hand.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a neutral expression, neither displaying strong emotions nor engaging directly with the camera.",
        "meaningful": true,
        "story": "The individual is holding a knife close to their face, suggesting a moment of contemplation or tension. The setting seems to be indoors, possibly a kitchen or similar environment, adding an element of intrigue or suspense to the scene.",
        "race": "asian",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is holding a large knife close to their face with a firm grip, suggesting a deliberate and possibly intense action. Their expression appears serious and focused, indicating they might be deeply engaged in a task or experiencing strong emotions that necessitate such an action. The setting seems to be indoors, possibly a kitchen given the presence of the knife, which could imply preparation for cooking or another domestic activity, although the intensity of their demeanor suggests there may be more complex motivations at play. The black and white tone of the image adds a dramatic effect, enhancing the gravity of the scene and the person's actions.",
        "intention": "The individual is performing a precise and deliberate act with the knife likely driven by a need for control or expression of intense focus in a high-stakes moment",
        "intention_ok": false
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.47546656004020144,
            0.41054114100742545
          ],
          [
            0.4808570411588464,
            0.45768624064143293
          ],
          [
            0.4869841890143497,
            0.5083023931685144
          ],
          [
            0.4909679142492158,
            0.5501677481637476
          ],
          [
            0.5059971965849399,
            0.5998854763674831
          ],
          [
            0.5305470579436846,
            0.6510451588134859
          ],
          [
            0.5540944813617639,
            0.6838568062445368
          ],
          [
            0.5734833459768977,
            0.7082006948224484
          ],
          [
            0.596474621870688,
            0.7194942854245994
          ],
          [
            0.6370319414883852,
            0.690268762536124
          ],
          [
            0.6763327663498265,
            0.6285864866210222
          ],
          [
            0.729012451853071,
            0.5777745243944676
          ],
          [
            0.7703747639698642,
            0.5297985288766532
          ],
          [
            0.8026781452553614,
            0.459722371132276
          ],
          [
            0.8037735140749387,
            0.37500279084358346
          ],
          [
            0.798919150020395,
            0.2958644417765993
          ],
          [
            0.7838652952441147,
            0.215286643738292
          ],
          [
            0.44366319687770944,
            0.3318855975079558
          ],
          [
            0.4431337620796902,
            0.2976831261370882
          ],
          [
            0.4520447926329715,
            0.2871638350705974
          ],
          [
            0.4689232001347201,
            0.27008620017621665
          ],
          [
            0.48216857883547026,
            0.27539145302824014
          ],
          [
            0.5127631788807256,
            0.22847780626668346
          ],
          [
            0.5370992240629026,
            0.17101639945063463
          ],
          [
            0.568873235902616,
            0.14667881675356517
          ],
          [
            0.6109787336417607,
            0.1378741558964184
          ],
          [
            0.6505930205008813,
            0.14487550564659704
          ],
          [
            0.5092126899531909,
            0.31387668507807565
          ],
          [
            0.5035225198205028,
            0.33799774688690104
          ],
          [
            0.491167875751853,
            0.36679575098256056
          ],
          [
            0.4863305849688394,
            0.39553627619144544
          ],
          [
            0.514714686492724,
            0.4862866984293513
          ],
          [
            0.5188136358878441,
            0.47342395414654326
          ],
          [
            0.5269233908504247,
            0.47512269866058243
          ],
          [
            0.5397412025502749,
            0.45629350927942
          ],
          [
            0.5550717913678713,
            0.4348145403710459
          ],
          [
            0.47616298613803726,
            0.39024511548848256
          ],
          [
            0.47635719664394854,
            0.3649110470388966
          ],
          [
            0.490719469556851,
            0.3534500872562859
          ],
          [
            0.5053622179265533,
            0.35532494093010136
          ],
          [
            0.49672643465123006,
            0.36921846186147356
          ],
          [
            0.4850600721580641,
            0.3886212159438988
          ],
          [
            0.5684327618352004,
            0.2957541813860702
          ],
          [
            0.5804864588592734,
            0.2564478467843004
          ],
          [
            0.5938874902469771,
            0.22989046592029735
          ],
          [
            0.6233104880899191,
            0.23925024357448205
          ],
          [
            0.6074559213859694,
            0.25307728941887114
          ],
          [
            0.5865903413189308,
            0.27183863720162643
          ],
          [
            0.5295216160161155,
            0.580119059432329
          ],
          [
            0.5239241807056325,
            0.5423914440911848
          ],
          [
            0.5256506233875241,
            0.5059517088292448
          ],
          [
            0.5308988163513797,
            0.49431626261917394
          ],
          [
            0.5396688086113759,
            0.47664499238698943
          ],
          [
            0.5685111355036497,
            0.48130872506339106
          ],
          [
            0.6085721865828548,
            0.5000512833140655
          ],
          [
            0.578933885799987,
            0.5255179318407736
          ],
          [
            0.5618095905120883,
            0.5515806640382536
          ],
          [
            0.5483143702149391,
            0.5652696352908362
          ],
          [
            0.5438458784350327,
            0.5766862119211528
          ],
          [
            0.5362989859389408,
            0.5774499779312524
          ],
          [
            0.5380970219948462,
            0.5724387527873067
          ],
          [
            0.5379462053733213,
            0.5428479158447982
          ],
          [
            0.5444510237979038,
            0.5316980936320539
          ],
          [
            0.5525183814976897,
            0.5080503287487507
          ],
          [
            0.5938677865479673,
            0.5056271054280536
          ],
          [
            0.547562116969909,
            0.5070898420315618
          ],
          [
            0.5380993256611484,
            0.5308876954196081
          ],
          [
            0.5345543753355742,
            0.5378614017824375
          ]
        ],
        "visibility": [
          1.0,
          1.0,
          0.999987006187439,
          0.985645592212677,
          1.0,
          1.0,
          0.0010127100395038724,
          0.06665471941232681,
          0.9924248456954956,
          0.0017774589359760284,
          1.9294654762802566e-09,
          1.9757524505337187e-09,
          6.695163028780371e-05,
          2.3326417704083724e-06,
          4.2170282199549547e-07,
          5.470576436295005e-09,
          0.00011820143845397979,
          1.662459254703208e-07,
          2.3573078067329334e-07,
          2.5940697411853432e-15,
          9.964456507215646e-19,
          2.898004983231152e-14,
          0.9999256134033203,
          1.109766833984338e-09,
          2.9757302850118295e-13,
          7.986535044413046e-11,
          3.0966611497262875e-09,
          5.928213475669963e-10,
          4.000399300707613e-08
        ],
        "headpose": {
          "pitch": -0.4995226299368562,
          "yaw": 40.14708012995874,
          "roll": -19.624146060991087
        },
        "attributes": {
          "5 oClock Shadow": 0.0010267768520861864,
          "Arched Eyebrows": 0.008938946761190891,
          "Attractive": 0.48302409052848816,
          "Bags Under Eyes": 0.049361713230609894,
          "Bald": 1.3158664158297029e-09,
          "Bangs": 0.4007333815097809,
          "Big Lips": 0.2248767763376236,
          "Big Nose": 0.01019138190895319,
          "Black Hair": 0.09520364552736282,
          "Blond Hair": 0.000680711935274303,
          "Blurry": 0.0002777212648652494,
          "Brown Hair": 0.4924611449241638,
          "Bushy Eyebrows": 0.02306632697582245,
          "Chubby": 0.0006533714476972818,
          "Double Chin": 5.975979729555547e-05,
          "Eyeglasses": 0.0026228860951960087,
          "Goatee": 3.0101775337243453e-05,
          "Gray Hair": 4.661937055061571e-05,
          "Heavy Makeup": 0.05110789090394974,
          "High Cheekbones": 0.04379379004240036,
          "Male": 0.07481422275304794,
          "Mouth Slightly Open": 0.10917548090219498,
          "Mustache": 5.4354991334548686e-06,
          "Narrow Eyes": 0.17602014541625977,
          "No Beard": 0.999057948589325,
          "Oval Face": 0.07520737498998642,
          "Pale Skin": 0.12955591082572937,
          "Pointy Nose": 0.1079537644982338,
          "Receding Hairline": 3.362041388754733e-05,
          "Rosy Cheeks": 0.000622806022875011,
          "Sideburns": 5.308105028234422e-05,
          "Smiling": 0.0029639529529958963,
          "Straight Hair": 0.13781702518463135,
          "Wavy Hair": 0.49332407116889954,
          "Wearing Earrings": 0.008387700654566288,
          "Wearing Hat": 0.00015604618238285184,
          "Wearing Lipstick": 0.17695488035678864,
          "Wearing Necklace": 0.006946702022105455,
          "Wearing Necktie": 0.002587714698165655,
          "Young": 0.9957923889160156
        },
        "age": [
          0.005668569356203079,
          0.9489902853965759,
          0.9974276423454285,
          0.868604302406311,
          0.039206087589263916,
          8.491980406688526e-05,
          2.8249212391529e-06,
          4.168674738735945e-09
        ],
        "race": [
          0.9262934327125549,
          0.0049372706562280655,
          0.9948937892913818,
          0.02109234780073166,
          0.27477842569351196
        ],
        "gender": [
          0.010280312038958073,
          0.9922477006912231
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 0.02135597896995023,
          "disgust": 2.4203047899185037e-08,
          "fear": 39.23337161540985,
          "happy": 55.122363567352295,
          "sad": 0.006337009835988283,
          "surprise": 3.4065697342157364,
          "neutral": 2.2100016474723816
        },
        "dominant_emotion": "happy",
        "region": {
          "x": 0,
          "y": 0,
          "w": 306,
          "h": 386,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 25,
        "gender": {
          "Woman": 99.99901056289673,
          "Man": 0.000987254134088289
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 99.99571442578521,
          "indian": 1.7888454451474673e-06,
          "black": 2.1876992633576118e-07,
          "white": 0.0036568517677146133,
          "middle eastern": 2.5331537489821712e-06,
          "latino hispanic": 0.0006277603380484848
        },
        "dominant_race": "asian"
      },
      "hoi": [
        {
          "relationship": {
            "action": [
              [
                "hand",
                "hold"
              ],
              [
                "hand",
                "wield"
              ]
            ],
            "negative_action": [
              "cut with",
              "stick",
              "wash",
              "no interaction"
            ],
            "position": "hand"
          },
          "object": 0
        }
      ]
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.002357959747314453,
        0.0376087948679924,
        0.9984334111213684,
        0.9640827775001526
      ]
    ],
    "face_boxes": [
      [
        0.4598854184150696,
        0.04509436711668968,
        0.7796708941459656,
        0.6787288784980774
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.6971336327907112,
            0.8317095466389027
          ],
          [
            0.4124780777427885,
            0.7850019210300946
          ],
          [
            0.04385937336418362,
            0.9520170671464386
          ],
          [
            0.1585407480597496,
            0.4594639243626439
          ],
          [
            0.9817891878386338,
            0.8784171722477109
          ],
          [
            1.1149014977531302,
            0.9265401804507252
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.4882497003095018,
            0.33774102126090183
          ],
          [
            0.6029310750050678,
            0.2556488307969358
          ],
          [
            0.47391452847255594,
            0.4198332117248674
          ],
          [
            0.8036234807223082,
            0.2726334219274115
          ]
        ],
        "dw_hand_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_hand_2": [
          [
            0.16263651144173413,
            0.44247933323216837
          ],
          [
            0.15649286636875734,
            0.3490640820145521
          ],
          [
            0.14010981284081936,
            0.25281806560852327
          ],
          [
            0.18311532835165661,
            0.19054123146344576
          ],
          [
            0.22407296217150155,
            0.15091051882566922
          ],
          [
            0.13601404945883483,
            0.17355664033297025
          ],
          [
            0.20359414526157912,
            0.1254336321299557
          ],
          [
            0.2261208438624937,
            0.14807975363725673
          ],
          [
            0.23226448893547058,
            0.17921817070979523
          ],
          [
            0.1585407480597496,
            0.196202761840271
          ],
          [
            0.2404560156994396,
            0.16789510995614498
          ],
          [
            0.2506954241544008,
            0.2075258225939215
          ],
          [
            0.24864754246340864,
            0.23017194410122227
          ],
          [
            0.18516321004264888,
            0.22734117891280978
          ],
          [
            0.26298271430035436,
            0.2075258225939215
          ],
          [
            0.26912635937333107,
            0.24149500485487277
          ],
          [
            0.26503059599134654,
            0.26980265673899906
          ],
          [
            0.2097377903345558,
            0.26697189155058626
          ],
          [
            0.26912635937333107,
            0.24715653523169803
          ],
          [
            0.28550941290126913,
            0.27546418711582427
          ],
          [
            0.27936576782829226,
            0.3009410738115378
          ]
        ],
        "dw_face": [
          [
            0.4636751200175947,
            0.3575563775797898
          ],
          [
            0.47186664678156376,
            0.4198332117248674
          ],
          [
            0.48210605523652494,
            0.4764485154931196
          ],
          [
            0.49848910876446306,
            0.5302330540729594
          ],
          [
            0.5210158073653778,
            0.5811868274643864
          ],
          [
            0.5496861510392692,
            0.6293098356674007
          ],
          [
            0.5783564947131608,
            0.6689405483051772
          ],
          [
            0.6172662468420134,
            0.67177131349359
          ],
          [
            0.6582238806618586,
            0.6434636616094638
          ],
          [
            0.6909899877177343,
            0.6066637141600999
          ],
          [
            0.719660331391626,
            0.5670330015223232
          ],
          [
            0.7462827933745251,
            0.5160792281308961
          ],
          [
            0.7626658469024632,
            0.45663315917423136
          ],
          [
            0.76880949197544,
            0.4000178554059791
          ],
          [
            0.7667616102844477,
            0.33774102126090183
          ],
          [
            0.7606179652114708,
            0.2782949523042368
          ],
          [
            0.7524264384475019,
            0.2216796485359845
          ],
          [
            0.4595793566356102,
            0.3066026041883628
          ],
          [
            0.46572300170858705,
            0.2867872478694748
          ],
          [
            0.47186664678156376,
            0.27546418711582427
          ],
          [
            0.48210605523652494,
            0.26980265673899906
          ],
          [
            0.49439334538247853,
            0.2641411263621738
          ],
          [
            0.5394467425843079,
            0.21318735297074676
          ],
          [
            0.564021322876215,
            0.1933719966518585
          ],
          [
            0.588595903168122,
            0.17355664033297025
          ],
          [
            0.6193141285330057,
            0.16789510995614498
          ],
          [
            0.6479844722068971,
            0.17355664033297025
          ],
          [
            0.52306368905637,
            0.3037718389999503
          ],
          [
            0.5189679256743854,
            0.3349102560724891
          ],
          [
            0.514872162292401,
            0.36321790795661535
          ],
          [
            0.5107763989104164,
            0.38869479465232887
          ],
          [
            0.5128242806014087,
            0.44814086360899363
          ],
          [
            0.5251115707473624,
            0.44814086360899363
          ],
          [
            0.5394467425843079,
            0.4368178028553431
          ],
          [
            0.5599255594942305,
            0.4283255072901054
          ],
          [
            0.5783564947131608,
            0.41700244653645485
          ],
          [
            0.47391452847255594,
            0.36321790795661535
          ],
          [
            0.47801029185454047,
            0.3405717864493143
          ],
          [
            0.49439334538247853,
            0.3292487256956638
          ],
          [
            0.5107763989104164,
            0.3349102560724891
          ],
          [
            0.5005369904554552,
            0.3518948472029648
          ],
          [
            0.4882497003095018,
            0.36321790795661535
          ],
          [
            0.5742607313311762,
            0.2811257174926493
          ],
          [
            0.5865480214771297,
            0.24998730042011078
          ],
          [
            0.6111226017690367,
            0.23583347447804776
          ],
          [
            0.6356971820609436,
            0.23866423966646028
          ],
          [
            0.6213620102239981,
            0.2613103611737613
          ],
          [
            0.5988353116230831,
            0.27546418711582427
          ],
          [
            0.5373988608933157,
            0.5500484103918474
          ],
          [
            0.5292073341293468,
            0.5189099933193089
          ],
          [
            0.5353509792023236,
            0.49060234143518267
          ],
          [
            0.5435425059662924,
            0.4821100458699449
          ],
          [
            0.5537819144212538,
            0.47361775030470715
          ],
          [
            0.5865480214771297,
            0.4764485154931196
          ],
          [
            0.6172662468420134,
            0.4934331066235954
          ],
          [
            0.6029310750050678,
            0.5189099933193089
          ],
          [
            0.5865480214771297,
            0.5415561148266097
          ],
          [
            0.5660692045672073,
            0.5613714711454979
          ],
          [
            0.5558297961122459,
            0.5642022363339106
          ],
          [
            0.5455903876572847,
            0.5613714711454979
          ],
          [
            0.5414946242753003,
            0.5472176452034352
          ],
          [
            0.5435425059662924,
            0.5245715236961339
          ],
          [
            0.5537819144212538,
            0.5104176977540709
          ],
          [
            0.5824522580951452,
            0.49626387181200793
          ],
          [
            0.6111226017690367,
            0.49626387181200793
          ],
          [
            0.5845001397861376,
            0.5104176977540709
          ],
          [
            0.5578776778032382,
            0.5274022888845467
          ],
          [
            0.5496861510392692,
            0.5358945844497844
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "objects": [
    {
      "name": "knife",
      "possible_names": [
        "knife"
      ],
      "box": [
        0.228125,
        0.30885529157667385,
        0.5859375,
        0.8617710583153347
      ]
    },
    {
      "name": "knife",
      "possible_names": [
        "knife"
      ],
      "box": [
        0.2203125,
        0.16630669546436286,
        0.5859375,
        0.8639308855291576
      ]
    }
  ],
  "scene": "A black and white photograph captures a hand holding a large knife with a dark handle against an indistinct background suggesting a somber and intense atmosphere",
  "overall_past": "Before this moment, the individual likely experienced a buildup of emotional tension—perhaps a personal crisis, a decision of great consequence, or a moment of internal conflict—leading them to confront a deeply significant act. The firm grip on the knife, held close to the face in a focused, almost ritualistic manner, suggests not a moment of spontaneous violence, but one of deliberate contemplation. The kitchen setting, while mundane, becomes charged with symbolic weight: the knife, a tool of creation and destruction, represents both the potential for care and the threat of harm. It is plausible that the person had been preparing food as a way to ground themselves, but the act of cooking was interrupted by a sudden emotional surge—perhaps a memory, a realization, or a decision to end something—causing them to pause, the knife now held not for cutting, but as a physical manifestation of their inner struggle. The black and white imagery underscores the moral and emotional gravity of the moment, suggesting that this is not just a physical act, but a pivotal psychological turning point.",
  "overall_past_clean": "A storm of unresolved emotions erupted from within, triggered by a long-suppressed truth that finally demanded acknowledgment, shattering the fragile calm of denial and forcing a confrontation with a choice that could no longer be avoided.",
  "past_scene_ok": true,
  "overall_future": "The knife is held close to the face with deliberate intent, suggesting a moment of decision or confrontation—possibly internal. Given the somber tone and the intensity of the grip, the next moment may involve a sudden, decisive action: the blade moving forward, perhaps slicing through something symbolic—a veil, a piece of fabric, or even air as if breaking a long-held silence or restraint. This could represent a turning point—either a release of suppressed emotion, a commitment to a difficult choice, or the beginning of a transformative act, blurring the line between preparation and rupture.",
  "overall_future_clean": "The blade cuts through the stillness with a sharp, unyielding motion, severing the tension in a single, decisive arc as if tearing open a long-closed wound, and the air itself seems to recoil in the wake of that irreversible act.",
  "future_scene_ok": true
}