{
  "image_path": "./ref_datasets/hico_det/images/train/train_00030827.jpg",
  "image_id": "train_00030827",
  "width": 640,
  "height": 427,
  "split": "train",
  "source": "zhimeng/hico_det",
  "dataset_index": 30827,
  "annotations": {
    "objects": "[{'id': 460, 'bbox_human': [292, 344, 184, 295], 'bbox_object': [303, 339, 286, 309], 'connection': 1, 'invis': 0}, {'id': 462, 'bbox_human': [293, 343, 183, 299], 'bbox_object': [305, 337, 289, 307], 'connection': 1, 'invis': 0}]",
    "positive_captions": "[('skateboard', 'ride'), ('skateboard', 'stand_on')]",
    "negative_captions": "[('skateboard', 'carry'), ('skateboard', 'flip'), ('skateboard', 'grind'), ('skateboard', 'hold'), ('skateboard', 'jump'), ('skateboard', 'pick_up'), ('skateboard', 'sit_on'), ('skateboard', 'no_interaction')]",
    "ambiguous_captions": "[]",
    "positive_objects": "[459, 461]",
    "negative_objects": "[453, 454, 455, 456, 457, 458, 460, 462]",
    "ambiguous_objects": "[]",
    "size": "[640, 427, 3]"
  },
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "male",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a white t-shirt, dark pants, and dark footwear.",
        "clothing": [
          {
            "possible_names": [
              "t-shirt",
              "shirt"
            ],
            "name": "t shirt",
            "type": "top",
            "color": [
              "white"
            ]
          },
          {
            "possible_names": [
              "pants",
              "jeans"
            ],
            "name": "pants",
            "type": "bottom",
            "color": [
              "dark"
            ]
          },
          {
            "possible_names": [
              "shoe"
            ],
            "name": "shoe",
            "type": "footwear",
            "color": [
              "dark"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "skateboard"
            ],
            "name": "skateboard",
            "position": "foot"
          }
        ],
        "description": "The person is a teenager in the foreground, possibly of unknown gender, riding a skateboard. They are wearing a white t-shirt and dark pants. Emotion is not clearly visible. There is a physical contact with a skateboard under their feet.",
        "blurry": false,
        "face_seen": false,
        "emotion_description": "The person's face is not visible, so their emotional state cannot be determined.",
        "meaningful": true,
        "story": "A young adult male is skateboarding down an empty street during twilight. The setting suggests a peaceful evening activity, possibly for leisure or practice. The urban environment around him includes palm trees and a bridge, indicating a suburban or city outskirts location.",
        "race": "unknown",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is skateboarding down an empty street during what appears to be early evening as the sky shows hues of pink and purple from the setting sun. They seem focused on maintaining balance while moving forward, possibly enjoying the solitude and freedom of the open road. Their casual attire suggests they are dressed for comfort and leisure, indicating this activity might be a form of relaxation or exercise. The surrounding environment, including palm trees and a bridge, adds to the serene atmosphere, potentially enhancing their enjoyment of the moment.",
        "intention": "The individual is seeking freedom and tranquility through skateboarding in a peaceful setting to enjoy the moment and engage in a mindful form of movement",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.4946356190235487,
            0.4615375823342868
          ],
          [
            0.49575320311955046,
            0.4660601124551313
          ],
          [
            0.49663390405476093,
            0.46933767970248824
          ],
          [
            0.4973689331007855,
            0.4728211517436084
          ],
          [
            0.49864048258002314,
            0.476163137633093
          ],
          [
            0.5005651172250509,
            0.478824037339385
          ],
          [
            0.5021296481468848,
            0.48050635839713063
          ],
          [
            0.5042913912662438,
            0.481345886289176
          ],
          [
            0.5069063742245946,
            0.4815634202303078
          ],
          [
            0.5085675061813423,
            0.480459817399465
          ],
          [
            0.5098765998014382,
            0.47732777450347114
          ],
          [
            0.5105736133243356,
            0.47465303264042336
          ],
          [
            0.5108488239347935,
            0.47154016373507673
          ],
          [
            0.5115924855428082,
            0.46803452091976405
          ],
          [
            0.5117070909057345,
            0.46427531767226493
          ],
          [
            0.5118991705988135,
            0.46106806906939113
          ],
          [
            0.5121835677751473,
            0.45659006762640175
          ],
          [
            0.4984958632183926,
            0.457334361534208
          ],
          [
            0.49951739130275585,
            0.4545520832802628
          ],
          [
            0.5006464959255287,
            0.4538800552482388
          ],
          [
            0.5023457902882781,
            0.45371537114434035
          ],
          [
            0.5037531166204384,
            0.45324360690175913
          ],
          [
            0.5068782158195972,
            0.4534109304803955
          ],
          [
            0.5078649637954575,
            0.4539139833128066
          ],
          [
            0.5086726391954082,
            0.45425279138877106
          ],
          [
            0.5097081075821605,
            0.45500863240530115
          ],
          [
            0.5104974689228194,
            0.456391806664695
          ],
          [
            0.5059727882700307,
            0.45899345548546167
          ],
          [
            0.5062772621001516,
            0.46166319095717506
          ],
          [
            0.5070461684039661,
            0.4643010344143175
          ],
          [
            0.5075790722455297,
            0.4663318244459319
          ],
          [
            0.5052655727735588,
            0.4686069906495733
          ],
          [
            0.5061747969261238,
            0.46819246361669625
          ],
          [
            0.5070322959550789,
            0.4679899339334508
          ],
          [
            0.507844307592937,
            0.4678901084971372
          ],
          [
            0.5082876639706748,
            0.4681252787128345
          ],
          [
            0.4995885440813644,
            0.46012495145545673
          ],
          [
            0.5007457200969968,
            0.4592392703847927
          ],
          [
            0.5028033543910299,
            0.4586536148073842
          ],
          [
            0.5033072983579976,
            0.45974369956801747
          ],
          [
            0.5025877439017806,
            0.4603222971099721
          ],
          [
            0.5007352930094514,
            0.46021309892801826
          ],
          [
            0.5073820959244456,
            0.4590095160756473
          ],
          [
            0.507844620517322,
            0.458397562705621
          ],
          [
            0.5097358844109944,
            0.45784028368516283
          ],
          [
            0.5100205593875476,
            0.4587025301797049
          ],
          [
            0.5094982758164406,
            0.45927312997082237
          ],
          [
            0.5078554770776204,
            0.4595569335086244
          ],
          [
            0.5038441951785769,
            0.47332694371754047
          ],
          [
            0.5051222653793437,
            0.47255668356172137
          ],
          [
            0.5063951292208263,
            0.47275676293371516
          ],
          [
            0.5071481226810387,
            0.4721850417217869
          ],
          [
            0.5080234424344131,
            0.47230383910316015
          ],
          [
            0.5089811698666641,
            0.47256492810649753
          ],
          [
            0.509548327752522,
            0.4728438405138707
          ],
          [
            0.5087412702185767,
            0.47339627925429945
          ],
          [
            0.508052188370909,
            0.4743235817159766
          ],
          [
            0.5073325612715313,
            0.47464270526328267
          ],
          [
            0.5060702274952616,
            0.4747669727916341
          ],
          [
            0.5045627789305789,
            0.4745081266299184
          ],
          [
            0.5042759669678551,
            0.47369773398278425
          ],
          [
            0.5055496474461896,
            0.47355567288263145
          ],
          [
            0.5072780741112572,
            0.4731885682543451
          ],
          [
            0.5083145531160491,
            0.47297660480497994
          ],
          [
            0.5096987565713269,
            0.4725883979388965
          ],
          [
            0.5081726530832904,
            0.4737263919119454
          ],
          [
            0.5070936914001193,
            0.47401558016805434
          ],
          [
            0.505521718944822,
            0.4747271955751104
          ]
        ],
        "visibility": [
          0.9999979734420776,
          0.6783889532089233,
          0.9999990463256836,
          0.00022256909869611263,
          0.745877206325531,
          0.9999862909317017,
          0.0013264258159324527,
          1.8953991457237862e-05,
          1.0,
          0.009571931324899197,
          0.09118501096963882,
          0.021856313571333885,
          0.9991497993469238,
          0.9621248841285706,
          0.0002408182481303811,
          3.247366475989111e-05,
          0.6451589465141296,
          0.0005971709033474326,
          1.1329525512193683e-10,
          4.7274701501009986e-05,
          1.294669531087464e-14,
          1.111158907940446e-12,
          0.001613506698049605,
          0.8960001468658447,
          9.092899501926544e-13,
          1.8248803076298392e-12,
          2.8854715949933052e-08,
          0.00011914486822206527,
          0.008060297928750515
        ],
        "headpose": {
          "pitch": 0.496583567520488,
          "yaw": -20.125176295104666,
          "roll": -1.4845074651564214
        },
        "attributes": {
          "5 oClock Shadow": 0.01959948055446148,
          "Arched Eyebrows": 0.0001246383908437565,
          "Attractive": 0.013913639821112156,
          "Bags Under Eyes": 0.0006697378121316433,
          "Bald": 7.405846645269776e-06,
          "Bangs": 0.05155850201845169,
          "Big Lips": 0.020752860233187675,
          "Big Nose": 0.014028218574821949,
          "Black Hair": 0.5047051310539246,
          "Blond Hair": 0.0005839217337779701,
          "Blurry": 0.8600438237190247,
          "Brown Hair": 0.0210147462785244,
          "Bushy Eyebrows": 0.005030167289078236,
          "Chubby": 0.008684959262609482,
          "Double Chin": 0.0006986320368014276,
          "Eyeglasses": 0.0019115791656076908,
          "Goatee": 0.0017296860460191965,
          "Gray Hair": 0.0006527646328322589,
          "Heavy Makeup": 0.002405997132882476,
          "High Cheekbones": 0.029795188456773758,
          "Male": 0.8956924676895142,
          "Mouth Slightly Open": 0.009070307947695255,
          "Mustache": 0.0011070689652115107,
          "Narrow Eyes": 0.08785714954137802,
          "No Beard": 0.8947691321372986,
          "Oval Face": 0.05685852840542793,
          "Pale Skin": 0.00013025198131799698,
          "Pointy Nose": 0.05308851972222328,
          "Receding Hairline": 0.0038685325998812914,
          "Rosy Cheeks": 0.00026485175476409495,
          "Sideburns": 0.0020604676101356745,
          "Smiling": 0.0024759231600910425,
          "Straight Hair": 0.14117279648780823,
          "Wavy Hair": 0.10627318918704987,
          "Wearing Earrings": 0.014110992662608624,
          "Wearing Hat": 0.019216462969779968,
          "Wearing Lipstick": 0.002072502626106143,
          "Wearing Necklace": 0.01882942020893097,
          "Wearing Necktie": 0.0008011967875063419,
          "Young": 0.8916183114051819
        },
        "age": [
          0.002806000644341111,
          0.4617420434951782,
          0.9814468622207642,
          0.5968271493911743,
          0.23692454397678375,
          0.006247612182050943,
          0.0012529840460047126,
          2.1796487999381498e-05
        ],
        "race": [
          0.05761927738785744,
          0.1739690899848938,
          0.9742498397827148,
          0.36790841817855835,
          0.5657394528388977
        ],
        "gender": [
          0.7798805832862854,
          0.26531004905700684
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 5.274041369557381,
          "disgust": 1.585743447662935e-06,
          "fear": 4.600267484784126,
          "happy": 0.029970562900416553,
          "sad": 80.70611357688904,
          "surprise": 0.021755907800979912,
          "neutral": 9.367845952510834
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 14,
          "h": 16,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 25,
        "gender": {
          "Woman": 27.04613506793976,
          "Man": 72.95386791229248
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 17.803435027599335,
          "indian": 21.127623319625854,
          "black": 17.48686134815216,
          "white": 14.111778140068054,
          "middle eastern": 11.64940744638443,
          "latino hispanic": 17.820897698402405
        },
        "dominant_race": "indian"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.4610745310783386,
        0.43851715326309204,
        0.5344659090042114,
        0.6989889144897461
      ]
    ],
    "face_boxes": [
      [
        0.4969392418861389,
        0.45484083890914917,
        0.5121813416481018,
        0.4819694757461548
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.5001305006987726,
            0.48528403061195613
          ],
          [
            0.4838880617326747,
            0.48464895306761424
          ],
          [
            0.4836055845332642,
            0.5252939159054946
          ],
          [
            0.5127007360725353,
            0.5147092901664633
          ],
          [
            0.5163729396648705,
            0.485919108156298
          ],
          [
            0.5177853256619225,
            0.5286809961419847
          ],
          [
            0.5047913744890441,
            0.5591647182703949
          ],
          [
            0.4782385177444667,
            0.5621284134773237
          ],
          [
            0.4728714509556691,
            0.616321697261164
          ],
          [
            0.46948172456274434,
            0.6264829379706341
          ],
          [
            0.4991418305008362,
            0.5617050284477625
          ],
          [
            0.4997067848996569,
            0.6133580020542354
          ],
          [
            0.5014016480961193,
            0.6810996067840358
          ],
          [
            0.5016841252955297,
            0.46347970158955154
          ],
          [
            0.5084635780813793,
            0.46305631655999036
          ],
          [
            0.49462219531026974,
            0.46559662673735785
          ],
          [
            0.5118533044743041,
            0.4660200117669191
          ]
        ],
        "dw_hand_1": [
          [
            0.5036614656914026,
            0.5600114883295173
          ],
          [
            0.5002717392984778,
            0.5629751835364462
          ],
          [
            0.496882012905553,
            0.5659388787433749
          ],
          [
            0.49546962690850094,
            0.5701727290389875
          ],
          [
            0.4934922865126282,
            0.5744065793345999
          ],
          [
            0.49716449010496333,
            0.5705961140685486
          ],
          [
            0.49575210410791143,
            0.576100119452845
          ],
          [
            0.4943397181108594,
            0.5803339697484576
          ],
          [
            0.49292733211380735,
            0.584144435014509
          ],
          [
            0.4997067848996569,
            0.5722896541867938
          ],
          [
            0.4985768761020154,
            0.5777936595710901
          ],
          [
            0.4974469673043738,
            0.5820275098667025
          ],
          [
            0.4965995357061426,
            0.5862613601623151
          ],
          [
            0.5019666024949402,
            0.5731364242459162
          ],
          [
            0.5014016480961193,
            0.5786404296302126
          ],
          [
            0.5005542164978881,
            0.5824508948962638
          ],
          [
            0.4997067848996569,
            0.5862613601623151
          ],
          [
            0.5045088972896338,
            0.5739831943050389
          ],
          [
            0.5039439428908129,
            0.5786404296302126
          ],
          [
            0.5036614656914026,
            0.5816041248371414
          ],
          [
            0.5033789884919921,
            0.5849912050736313
          ]
        ],
        "dw_hand_2": [
          [
            0.5158079852660497,
            0.514285905136902
          ],
          [
            0.5172203712631017,
            0.5117455949595344
          ],
          [
            0.5191977116589744,
            0.509205284782167
          ],
          [
            0.5200451432572056,
            0.5087818997526057
          ],
          [
            0.5231523924507201,
            0.5087818997526057
          ],
          [
            0.5214575292542577,
            0.5079351296934832
          ],
          [
            0.5248472556471825,
            0.5087818997526057
          ],
          [
            0.5265421188436449,
            0.5096286698117283
          ],
          [
            0.5282369820401073,
            0.5104754398708506
          ],
          [
            0.5231523924507201,
            0.509205284782167
          ],
          [
            0.5259771644448241,
            0.5104754398708506
          ],
          [
            0.5279545048406968,
            0.5117455949595344
          ],
          [
            0.5285194592395177,
            0.512592365018657
          ],
          [
            0.5234348696501305,
            0.510898824900412
          ],
          [
            0.5262596416442344,
            0.5117455949595344
          ],
          [
            0.5276720276412864,
            0.512592365018657
          ],
          [
            0.5279545048406968,
            0.5138625201073408
          ],
          [
            0.5234348696501305,
            0.512592365018657
          ],
          [
            0.5254122100460032,
            0.5134391350777795
          ],
          [
            0.5271070732424656,
            0.5138625201073408
          ],
          [
            0.5276720276412864,
            0.5147092901664633
          ]
        ],
        "dw_face": [
          [
            0.4965995357061426,
            0.4639030866191129
          ],
          [
            0.4965995357061426,
            0.46686678182604163
          ],
          [
            0.496882012905553,
            0.4698304770329704
          ],
          [
            0.49716449010496333,
            0.4727941722398992
          ],
          [
            0.4980119217031945,
            0.4753344824172667
          ],
          [
            0.4991418305008362,
            0.4778747925946343
          ],
          [
            0.5005542164978881,
            0.47956833271287924
          ],
          [
            0.5022490796943505,
            0.48083848780156296
          ],
          [
            0.5042264200902233,
            0.48168525786068556
          ],
          [
            0.5059212832866857,
            0.4812618728311242
          ],
          [
            0.5076161464831481,
            0.47956833271287924
          ],
          [
            0.5087460552807898,
            0.4774514075650729
          ],
          [
            0.5093110096796105,
            0.47491109738770537
          ],
          [
            0.5098759640784313,
            0.4719474021807767
          ],
          [
            0.5101584412778417,
            0.46898370697384795
          ],
          [
            0.5104409184772521,
            0.4660200117669191
          ],
          [
            0.5101584412778417,
            0.46305631655999036
          ],
          [
            0.4994243077002466,
            0.46093939141218404
          ],
          [
            0.5005542164978881,
            0.4600926213530616
          ],
          [
            0.5016841252955297,
            0.45966923632350026
          ],
          [
            0.5028140340931714,
            0.45966923632350026
          ],
          [
            0.5039439428908129,
            0.45966923632350026
          ],
          [
            0.5064862376855065,
            0.4600926213530616
          ],
          [
            0.5073336692837377,
            0.45966923632350026
          ],
          [
            0.5081811008819689,
            0.45966923632350026
          ],
          [
            0.5090285324802001,
            0.45966923632350026
          ],
          [
            0.509593486879021,
            0.4605160063826228
          ],
          [
            0.505356328887865,
            0.4626329315304291
          ],
          [
            0.5056388060872753,
            0.4643264716486741
          ],
          [
            0.5056388060872753,
            0.4660200117669191
          ],
          [
            0.5059212832866857,
            0.46771355188516417
          ],
          [
            0.5036614656914026,
            0.4698304770329704
          ],
          [
            0.5045088972896338,
            0.4698304770329704
          ],
          [
            0.505356328887865,
            0.47025386206253167
          ],
          [
            0.5062037604860962,
            0.47025386206253167
          ],
          [
            0.5070511920843274,
            0.4698304770329704
          ],
          [
            0.5005542164978881,
            0.46305631655999036
          ],
          [
            0.5016841252955297,
            0.4626329315304291
          ],
          [
            0.502531556893761,
            0.4626329315304291
          ],
          [
            0.5033789884919921,
            0.4626329315304291
          ],
          [
            0.502531556893761,
            0.46305631655999036
          ],
          [
            0.5016841252955297,
            0.46347970158955154
          ],
          [
            0.5067687148849169,
            0.4626329315304291
          ],
          [
            0.5076161464831481,
            0.4626329315304291
          ],
          [
            0.5084635780813793,
            0.4626329315304291
          ],
          [
            0.5090285324802001,
            0.46305631655999036
          ],
          [
            0.5081811008819689,
            0.46305631655999036
          ],
          [
            0.5076161464831481,
            0.46305631655999036
          ],
          [
            0.5022490796943505,
            0.4744877123581442
          ],
          [
            0.5036614656914026,
            0.47364094229902165
          ],
          [
            0.5050738516884545,
            0.4732175572694604
          ],
          [
            0.5056388060872753,
            0.47364094229902165
          ],
          [
            0.5059212832866857,
            0.4732175572694604
          ],
          [
            0.5067687148849169,
            0.47364094229902165
          ],
          [
            0.5073336692837377,
            0.4744877123581442
          ],
          [
            0.5067687148849169,
            0.4753344824172667
          ],
          [
            0.5062037604860962,
            0.47575786744682796
          ],
          [
            0.505356328887865,
            0.47618125247638915
          ],
          [
            0.5042264200902233,
            0.47575786744682796
          ],
          [
            0.5033789884919921,
            0.4753344824172667
          ],
          [
            0.502531556893761,
            0.4744877123581442
          ],
          [
            0.5042264200902233,
            0.474064327328583
          ],
          [
            0.505356328887865,
            0.474064327328583
          ],
          [
            0.5062037604860962,
            0.474064327328583
          ],
          [
            0.5070511920843274,
            0.4744877123581442
          ],
          [
            0.5062037604860962,
            0.47491109738770537
          ],
          [
            0.505356328887865,
            0.47491109738770537
          ],
          [
            0.5039439428908129,
            0.4744877123581442
          ]
        ],
        "dw_foot_1": [
          [
            0.49377476371203854,
            0.6921076175526285
          ],
          [
            0.5022490796943505,
            0.6938011576708734
          ],
          [
            0.5022490796943505,
            0.6895673073752611
          ]
        ],
        "dw_foot_2": [
          [
            0.47089411055979624,
            0.6387611038279106
          ],
          [
            0.46524456657158836,
            0.6341038685027367
          ],
          [
            0.4697642017621547,
            0.626059552941073
          ]
        ]
      }
    ]
  },
  "objects": [
    {
      "name": "skateboard",
      "possible_names": [
        "skateboard"
      ],
      "box": [
        0.4734375,
        0.6697892271662763,
        0.5296875,
        0.7236533957845434
      ]
    },
    {
      "name": "skateboard",
      "possible_names": [
        "skateboard"
      ],
      "box": [
        0.4765625,
        0.6768149882903981,
        0.5265625,
        0.7189695550351288
      ]
    }
  ],
  "scene": "A serene urban street at dusk with palm trees and an overpass casting shadows on the road while a skateboarder glides along the asphalt under a twilight sky tinged with purple hues and scattered clouds creating a tranquil atmosphere devoid of bustling activity",
  "overall_past": "Before the current scene, the individual likely arrived at the quiet urban street after a day of routine activities, perhaps having left home or a nearby destination with the intention of unwinding. They may have retrieved their skateboard from a bag or storage, adjusted their gear, and taken a moment to observe the peaceful surroundings—perhaps pausing to appreciate the soft light of the setting sun filtering through the palm trees. This brief pause allowed them to mentally prepare for the ride, embracing the calm of the moment before beginning their glide down the empty road, seeking both physical movement and a sense of personal freedom in the tranquil, twilight atmosphere.",
  "overall_past_clean": "The individual stepped off the curb with deliberate calm, having just emerged from a routine day of obligations, their body already shifting into a rhythm of release as they paused to absorb the hush of the street, the fading light painting the air with stillness, before setting motion into the quiet.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the skateboarder is likely to slow down near the base of the overpass, where the long shadows stretch across the road, and pause to rest briefly, perhaps leaning against the cool concrete pillar for a moment. The quiet stillness of the twilight hour may invite a brief moment of reflection—gazing up at the fading sky, feeling the cool evening breeze through the palm fronds—before pushing off again, continuing the journey along the quiet street with a sense of calm purpose, as if the city has momentarily surrendered to the rhythm of the moment.",
  "overall_future_clean": "The skateboarder accelerates smoothly into the gathering dusk, wheels humming against the pavement as the city's pulse slows to match the rhythm of motion, each turn a quiet defiance of stillness, carving a path through the hush with unwavering intent.",
  "future_scene_ok": true
}