{
  "image_path": "./ref_datasets/hico_det/images/train/train_00025813.jpg",
  "image_id": "train_00025813",
  "width": 640,
  "height": 430,
  "split": "train",
  "source": "zhimeng/hico_det",
  "dataset_index": 25813,
  "annotations": {
    "objects": "[{'id': 539, 'bbox_human': [80, 571, 1, 427], 'bbox_object': [253, 320, 213, 426], 'connection': 1, 'invis': 0}, {'id': 541, 'bbox_human': [85, 569, 3, 427], 'bbox_object': [255, 318, 219, 427], 'connection': 1, 'invis': 0}, {'id': 543, 'bbox_human': [82, 566, 2, 428], 'bbox_object': [258, 314, 215, 430], 'connection': 1, 'invis': 0}, {'id': 545, 'bbox_human': [53, 569, 2, 426], 'bbox_object': [258, 327, 219, 426], 'connection': 1, 'invis': 0}]",
    "positive_captions": "[('tie', 'adjust'), ('tie', 'hold'), ('tie', 'pull'), ('tie', 'wear')]",
    "negative_captions": "[('tie', 'cut'), ('tie', 'inspect'), ('tie', 'no_interaction')]",
    "ambiguous_captions": "[('tie', 'tie')]",
    "positive_objects": "[538, 540, 542, 544]",
    "negative_objects": "[539, 541, 545]",
    "ambiguous_objects": "[543]",
    "size": "[640, 430, 3]"
  },
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "male",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a white dress shirt and a black tie.",
        "clothing": [
          {
            "possible_names": [
              "shirt",
              "dress shirt",
              "button-up shirt"
            ],
            "name": "dress shirt",
            "type": "top",
            "color": [
              "white"
            ]
          },
          {
            "possible_names": [
              "tie",
              "necktie"
            ],
            "name": "tie",
            "type": "accessory",
            "color": [
              "black"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "tie",
              "necktie"
            ],
            "name": "tie",
            "position": "hand"
          }
        ],
        "description": "The person is an adult male in the foreground, with a neutral expression. He is wearing a white dress shirt and a black tie, holding the tie with his hand. The background appears to be blurred foliage, suggesting an outdoor setting.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a calm and composed expression, neither displaying strong emotions nor appearing particularly engaged.",
        "meaningful": true,
        "story": "The individual seems to be preparing for an important event, possibly a formal gathering or a professional meeting, as indicated by the act of adjusting their tie. The setting suggests an outdoor environment, perhaps before heading into the event.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is adjusting their tie with one hand, suggesting they are preparing for an event or ensuring their appearance is neat and presentable. Their gaze is directed slightly off-camera, indicating they might be focused on something or someone not visible in the frame, possibly reflecting a moment of contemplation or readiness. The formal attire and the act of fixing the tie imply a sense of importance or formality to the occasion, while their calm demeanor suggests confidence or a composed state of mind as they engage in this preparatory action.",
        "intention": "The individual is meticulously preparing to make a strong impression at a significant event by ensuring their appearance is flawless and composed",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.33654044922441245,
            0.1326481730438942
          ],
          [
            0.3395181743428111,
            0.18444686949847147
          ],
          [
            0.342037786450237,
            0.23279709277358956
          ],
          [
            0.3497355105355382,
            0.28260800434505423
          ],
          [
            0.36529047004878523,
            0.32627449194062197
          ],
          [
            0.38687225747853515,
            0.3604842938458009
          ],
          [
            0.41466889418661596,
            0.3905844203657486
          ],
          [
            0.4434758648276329,
            0.409798760588383
          ],
          [
            0.47168800346553325,
            0.4127943097554964
          ],
          [
            0.4991257801651955,
            0.40945540741828595
          ],
          [
            0.5209521174430847,
            0.3867699311025119
          ],
          [
            0.5389076389372349,
            0.35395934684728075
          ],
          [
            0.5511667311191559,
            0.3176421279527024
          ],
          [
            0.5569185815751553,
            0.2765817417258836
          ],
          [
            0.5629384197294712,
            0.23759295639405614
          ],
          [
            0.5672933116555214,
            0.19657276508420013
          ],
          [
            0.5722080327570438,
            0.15445999069467337
          ],
          [
            0.3735901158303022,
            0.11267024639040925
          ],
          [
            0.39207092821598055,
            0.08133397157802139
          ],
          [
            0.4200697548687458,
            0.07115375231270775
          ],
          [
            0.44815317168831825,
            0.07696698187197562
          ],
          [
            0.47302568405866624,
            0.09274501602515034
          ],
          [
            0.49732698053121566,
            0.09352849935772412
          ],
          [
            0.5202378004789352,
            0.08304891570461946
          ],
          [
            0.5432640433311462,
            0.08102436208249722
          ],
          [
            0.5637833490967751,
            0.09249811394270076
          ],
          [
            0.5715661846101284,
            0.12261164433932384
          ],
          [
            0.487639969587326,
            0.12349730298368639
          ],
          [
            0.48853874281048776,
            0.15498259146744234
          ],
          [
            0.4900417037308216,
            0.18538534142250238
          ],
          [
            0.4913663662970066,
            0.21825774729845926
          ],
          [
            0.4611861828714609,
            0.23635301423627278
          ],
          [
            0.47333867847919464,
            0.24225912664419788
          ],
          [
            0.48412328734993937,
            0.250275046009558
          ],
          [
            0.49433145150542257,
            0.24383361418777924
          ],
          [
            0.5033733949065209,
            0.23604529331688867
          ],
          [
            0.4085554774850607,
            0.13099251015241756
          ],
          [
            0.4219869267195463,
            0.11965966612793678
          ],
          [
            0.43770758248865604,
            0.12166998022022438
          ],
          [
            0.45037362575531004,
            0.13483659825055702
          ],
          [
            0.43524440973997114,
            0.1374484990522315
          ],
          [
            0.4209050476551056,
            0.13934103618824603
          ],
          [
            0.5022511653602123,
            0.13754816740454232
          ],
          [
            0.5181064307689667,
            0.12466306421051787
          ],
          [
            0.5317149683833122,
            0.12228287331685672
          ],
          [
            0.5435429207980633,
            0.13830947250226805
          ],
          [
            0.5325638085603714,
            0.14549754370882662
          ],
          [
            0.5187774911522866,
            0.14185458061306977
          ],
          [
            0.4319152843207121,
            0.28453639100160316
          ],
          [
            0.4518181622028351,
            0.2792369795003999
          ],
          [
            0.4691062640398741,
            0.27653267217236893
          ],
          [
            0.48017829582095145,
            0.28173641809989447
          ],
          [
            0.4909726925194263,
            0.2764676249304483
          ],
          [
            0.5025129951536655,
            0.2824088180580012
          ],
          [
            0.5158232092857361,
            0.2886395817183181
          ],
          [
            0.5021209850907326,
            0.2991149286099051
          ],
          [
            0.4902984775602818,
            0.3014366070693514
          ],
          [
            0.47802647538483145,
            0.3027845156153175
          ],
          [
            0.46719257086515426,
            0.30045120486389365
          ],
          [
            0.44986230358481405,
            0.2954890629777877
          ],
          [
            0.4390882711857557,
            0.28690520029923444
          ],
          [
            0.4700831238180399,
            0.2868716404683566
          ],
          [
            0.47955327928066255,
            0.291832378457155
          ],
          [
            0.49179672822356224,
            0.28858222248546306
          ],
          [
            0.5090092822909356,
            0.28805138217254334
          ],
          [
            0.49041109159588814,
            0.28268254460686465
          ],
          [
            0.478604356944561,
            0.2854575147660468
          ],
          [
            0.4687534052878618,
            0.283047825315862
          ]
        ],
        "visibility": [
          5.914234879611513e-09,
          1.1807693226728588e-05,
          1.8396334192853463e-14,
          2.3419384487244344e-11,
          0.46308404207229614,
          0.5483253002166748,
          6.38952315057395e-07,
          3.544358584406382e-09,
          4.227253612043569e-06,
          2.3103009089142645e-11,
          1.4389086710336896e-13,
          1.4134606915292011e-18,
          1.1179451320231237e-07,
          1.1110332624611821e-13,
          2.029874740516746e-10,
          1.7907344560562838e-16,
          1.019300339662535e-13,
          6.478547760107103e-14,
          2.032257695334171e-17,
          4.767006220643931e-14,
          4.407586334431632e-20,
          1.595742044089913e-22,
          3.800040726531506e-09,
          1.87036174040917e-17,
          7.027380066748634e-11,
          1.5522817406465883e-11,
          1.0434739877718258e-10,
          9.68420646002251e-15,
          2.8127031259650437e-10
        ],
        "headpose": {
          "pitch": -3.9647327141219955,
          "yaw": -10.162681154744284,
          "roll": 1.9275901609081996
        },
        "attributes": {
          "5 oClock Shadow": 0.04138828441500664,
          "Arched Eyebrows": 0.0016455920413136482,
          "Attractive": 0.18196657299995422,
          "Bags Under Eyes": 0.26368606090545654,
          "Bald": 5.2805170014380565e-08,
          "Bangs": 0.20661091804504395,
          "Big Lips": 0.021782925352454185,
          "Big Nose": 0.35885098576545715,
          "Black Hair": 0.04216856136918068,
          "Blond Hair": 0.000498150649946183,
          "Blurry": 0.00015681301010772586,
          "Brown Hair": 0.5554062128067017,
          "Bushy Eyebrows": 0.5999408960342407,
          "Chubby": 0.30168241262435913,
          "Double Chin": 0.015491069294512272,
          "Eyeglasses": 0.0010268448386341333,
          "Goatee": 0.6204670667648315,
          "Gray Hair": 0.003434674581512809,
          "Heavy Makeup": 0.00045020869583822787,
          "High Cheekbones": 0.046296775341033936,
          "Male": 0.999976634979248,
          "Mouth Slightly Open": 0.0588119812309742,
          "Mustache": 0.1036885529756546,
          "Narrow Eyes": 0.005555285606533289,
          "No Beard": 0.007818193174898624,
          "Oval Face": 0.5792047381401062,
          "Pale Skin": 0.0014409791911020875,
          "Pointy Nose": 0.025402653962373734,
          "Receding Hairline": 4.296210681786761e-05,
          "Rosy Cheeks": 0.0035106006544083357,
          "Sideburns": 0.9566149115562439,
          "Smiling": 0.01510682888329029,
          "Straight Hair": 0.001629496575333178,
          "Wavy Hair": 0.9493361711502075,
          "Wearing Earrings": 8.522353164153174e-05,
          "Wearing Hat": 0.0004711582441814244,
          "Wearing Lipstick": 8.744144724914804e-05,
          "Wearing Necklace": 5.2567087550414726e-05,
          "Wearing Necktie": 0.5413967967033386,
          "Young": 0.7491831183433533
        },
        "age": [
          0.0006886438932269812,
          0.07650070637464523,
          0.9862316250801086,
          0.8835843205451965,
          0.086316779255867,
          0.0543496310710907,
          2.2642232579528354e-05,
          2.8682393349299673e-06
        ],
        "race": [
          0.990918755531311,
          0.004252421669661999,
          0.17154337465763092,
          0.18144412338733673,
          0.6183633208274841
        ],
        "gender": [
          0.999554455280304,
          0.0010369601659476757
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 0.00916614881134592,
          "disgust": 1.8209610175290436e-05,
          "fear": 0.005893789420952089,
          "happy": 99.51857924461365,
          "sad": 0.00614435484749265,
          "surprise": 0.11883610859513283,
          "neutral": 0.34136720933020115
        },
        "dominant_emotion": "happy",
        "region": {
          "x": 0,
          "y": 0,
          "w": 202,
          "h": 210,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 29,
        "gender": {
          "Woman": 0.01298831048188731,
          "Man": 99.98700618743896
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 0.006893065121170289,
          "indian": 0.009604579672164376,
          "black": 9.05719556937799e-05,
          "white": 93.78960095582013,
          "middle eastern": 4.787943425055946,
          "latino hispanic": 1.40586419960047
        },
        "dominant_race": "white"
      },
      "hoi": [
        {
          "relationship": {
            "action": [
              [
                "hand",
                "adjust"
              ],
              [
                "hand",
                "hold"
              ],
              [
                "hand",
                "pull"
              ],
              [
                "hand",
                "wear"
              ]
            ],
            "negative_action": [
              "cut",
              "inspect",
              "no interaction"
            ],
            "position": "hand"
          },
          "object": 0
        }
      ]
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.13272380828857422,
        0.004148261621594429,
        0.8804942965507507,
        0.98945552110672
      ]
    ],
    "face_boxes": [
      [
        0.352517306804657,
        0.009806149639189243,
        0.5634490251541138,
        0.3951791524887085
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.4712863844612406,
            0.6047050866969796
          ],
          [
            0.23515217608461772,
            0.6310942418199484
          ],
          [
            0.18034969769004316,
            0.9861483289289844
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.7074205928378635,
            0.5783159315740108
          ],
          [
            0.821861062426534,
            0.9837493148268963
          ],
          [
            0.5446249952539801,
            0.880591708437109
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.4285726880654693,
            0.12970029448353967
          ],
          [
            0.5252829440558949,
            0.13449832268771575
          ],
          [
            0.33992162007424565,
            0.17288254832112512
          ],
          [
            0.5671907216517461,
            0.18247860472947744
          ]
        ],
        "dw_hand_1": [
          [
            0.5333421320550972,
            0.8685966379266684
          ],
          [
            0.514000080857012,
            0.7894291725577618
          ],
          [
            0.49788170485860767,
            0.7126607212909434
          ],
          [
            0.4656449528617991,
            0.6790745238617104
          ],
          [
            0.43663187606467135,
            0.6622814251470935
          ],
          [
            0.45275025206307584,
            0.676675509759622
          ],
          [
            0.4140661496669054,
            0.6598824110450054
          ],
          [
            0.41890166246642657,
            0.6838725520658863
          ],
          [
            0.43340820086499043,
            0.7006656507805031
          ],
          [
            0.43018452566530974,
            0.7198577635972074
          ],
          [
            0.3947240984688204,
            0.7126607212909434
          ],
          [
            0.40761879926754363,
            0.7318528341076477
          ],
          [
            0.4237371752659481,
            0.7414488905160002
          ],
          [
            0.4172898248665863,
            0.7654390315368813
          ],
          [
            0.3850530728697777,
            0.7582419892306167
          ],
          [
            0.3979477736685011,
            0.7726360738431454
          ],
          [
            0.4140661496669054,
            0.7846311443535856
          ],
          [
            0.40923063686738426,
            0.8110202994765545
          ],
          [
            0.38182939767009677,
            0.8038232571702902
          ],
          [
            0.3915004232691395,
            0.8158183276807308
          ],
          [
            0.40600696166770334,
            0.825414384089083
          ]
        ],
        "dw_hand_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.43179636326515014,
            0.710261707188855
          ],
          [
            0.4221253376661075,
            0.6982666366784147
          ],
          [
            0.42534901286578836,
            0.7078626930867672
          ],
          [
            0.4285726880654693,
            0.7126607212909434
          ],
          [
            0.438243713664512,
            0.7270548059034717
          ],
          [
            0.4221253376661075,
            0.7174587494951193
          ],
          [
            0.42534901286578836,
            0.7318528341076477
          ],
          [
            0.42534901286578836,
            0.7438479046180886
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.4172898248665863,
            0.7558429751285288
          ],
          [
            0.41890166246642657,
            0.7678380456389691
          ],
          [
            0.4205135000662672,
            0.7702370597410572
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.4043951240678627,
            0.7966262148640259
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_face": [
          [
            0.3495926456732882,
            0.13209930858562766
          ],
          [
            0.3495926456732882,
            0.17288254832112512
          ],
          [
            0.35281632087296905,
            0.21606480215871057
          ],
          [
            0.3576518336724904,
            0.259247055996296
          ],
          [
            0.36571102167169267,
            0.30003029573179324
          ],
          [
            0.38182939767009677,
            0.3336164931610265
          ],
          [
            0.4043951240678627,
            0.36240466238608354
          ],
          [
            0.43018452566530974,
            0.38399578930487627
          ],
          [
            0.457585764862597,
            0.3935918457132287
          ],
          [
            0.4865988416597247,
            0.3911928316111403
          ],
          [
            0.5123882432571716,
            0.37439973289652384
          ],
          [
            0.5317302944552568,
            0.3432125495693787
          ],
          [
            0.5462368328538206,
            0.3072273380380578
          ],
          [
            0.5559078584528632,
            0.2664440983025602
          ],
          [
            0.5607433712523845,
            0.2256608585670629
          ],
          [
            0.5639670464520654,
            0.18247860472947744
          ],
          [
            0.5639670464520654,
            0.13689733678980387
          ],
          [
            0.3850530728697777,
            0.10571015346265897
          ],
          [
            0.4027832864680224,
            0.09371508295221842
          ],
          [
            0.4237371752659481,
            0.09131606885013031
          ],
          [
            0.44307922646403314,
            0.09611409705430653
          ],
          [
            0.46242127766211816,
            0.10091212525848275
          ],
          [
            0.5011053800582885,
            0.10571015346265897
          ],
          [
            0.5172237560566929,
            0.10091212525848275
          ],
          [
            0.5317302944552568,
            0.09851311115639463
          ],
          [
            0.5462368328538206,
            0.10091212525848275
          ],
          [
            0.559131533652544,
            0.11290719576892304
          ],
          [
            0.48176332886020357,
            0.13689733678980387
          ],
          [
            0.4833751664600438,
            0.1632864919127728
          ],
          [
            0.48498700405988426,
            0.19207466113782973
          ],
          [
            0.4865988416597247,
            0.2208628303628868
          ],
          [
            0.457585764862597,
            0.2424539572816795
          ],
          [
            0.46886862806147994,
            0.2448529713837675
          ],
          [
            0.48176332886020357,
            0.2496509995879437
          ],
          [
            0.4930461920590865,
            0.2472519854858556
          ],
          [
            0.502717217658129,
            0.2424539572816795
          ],
          [
            0.4043951240678627,
            0.13449832268771575
          ],
          [
            0.4205135000662672,
            0.12010423807518736
          ],
          [
            0.438243713664512,
            0.12250325217727548
          ],
          [
            0.45275025206307584,
            0.14169536499398008
          ],
          [
            0.43502003846483106,
            0.14649339319815619
          ],
          [
            0.41890166246642657,
            0.1440943790960682
          ],
          [
            0.502717217658129,
            0.1440943790960682
          ],
          [
            0.514000080857012,
            0.12490226627936345
          ],
          [
            0.5301184568554163,
            0.12250325217727548
          ],
          [
            0.5430131576541397,
            0.139296350891892
          ],
          [
            0.5301184568554163,
            0.14889240730024442
          ],
          [
            0.5156119184568524,
            0.14889240730024442
          ],
          [
            0.43179636326515014,
            0.29043423932344103
          ],
          [
            0.4511384144632352,
            0.2808381829150889
          ],
          [
            0.47209230326116086,
            0.2784391688130005
          ],
          [
            0.48015149126036294,
            0.2784391688130005
          ],
          [
            0.4882106792595652,
            0.2784391688130005
          ],
          [
            0.5011053800582885,
            0.2832371970171767
          ],
          [
            0.514000080857012,
            0.29043423932344103
          ],
          [
            0.502717217658129,
            0.30003029573179324
          ],
          [
            0.4914343544592459,
            0.3048283239359694
          ],
          [
            0.47853965366052265,
            0.3072273380380578
          ],
          [
            0.46080944006227786,
            0.3048283239359694
          ],
          [
            0.446302901663714,
            0.30003029573179324
          ],
          [
            0.43663187606467135,
            0.29043423932344103
          ],
          [
            0.457585764862597,
            0.29043423932344103
          ],
          [
            0.48015149126036294,
            0.29043423932344103
          ],
          [
            0.4946580296589268,
            0.29043423932344103
          ],
          [
            0.5091645680574907,
            0.29043423932344103
          ],
          [
            0.4946580296589268,
            0.29043423932344103
          ],
          [
            0.47853965366052265,
            0.29043423932344103
          ],
          [
            0.457585764862597,
            0.29043423932344103
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "objects": [
    {
      "name": "tie",
      "possible_names": [
        "tie"
      ],
      "box": [
        0.3953125,
        0.49534883720930234,
        0.5,
        0.9906976744186047
      ]
    }
  ],
  "scene": "A black and white portrait captures an individual adjusting their tie against a blurred natural backdrop suggesting a formal yet serene setting with no distinct cultural indicators visible",
  "overall_past": "Before the current scene, the individual likely arrived at a quiet, secluded spot within a formal setting—perhaps a garden, a quiet courtyard, or a secluded area near a venue—after a brief moment of transition, such as stepping out from a gathering or entering the space. They may have paused to collect themselves, perhaps after a conversation or a moment of reflection, before the main event began. The act of adjusting the tie suggests they were preparing to enter a significant moment—such as a ceremony, interview, or public appearance—indicating that they had already undergone some form of preparation (like changing into formal attire) and were now taking a final, deliberate moment to ensure their appearance was impeccable, possibly to project confidence or composure in anticipation of a pivotal encounter.",
  "overall_past_clean": "Stepping away from the gathering’s hum, the figure moved with purpose through the hushed space, pausing only to steady breath and mind, having already shed the weight of expectation and now aligning every gesture with intent, as if each motion carved the path to what would follow.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to step forward into the event—perhaps a ceremony, interview, or formal gathering—having completed their final preparations. The slight off-camera focus suggests anticipation, and with the tie now perfectly adjusted, they would likely take a moment to compose themselves before entering the space, possibly exhaling softly or straightening their jacket, then walking purposefully into the light, ready to make a confident entrance.",
  "overall_future_clean": "A decisive stride cuts through the stillness as the figure emerges into the spotlight, shoulders squared and gaze fixed ahead, commanding the room with unwavering presence.",
  "future_scene_ok": true
}