{
  "image_path": "./ref_datasets/hico_det/images/train/train_00021754.jpg",
  "image_id": "train_00021754",
  "width": 427,
  "height": 640,
  "split": "train",
  "source": "zhimeng/hico_det",
  "dataset_index": 21754,
  "annotations": {
    "objects": "[{'id': 455, 'bbox_human': [1, 348, 22, 335], 'bbox_object': [21, 247, 351, 425], 'connection': 1, 'invis': 0}, {'id': 460, 'bbox_human': [1, 346, 24, 335], 'bbox_object': [22, 242, 355, 423], 'connection': 1, 'invis': 0}]",
    "positive_captions": "[('skateboard', 'flip'), ('skateboard', 'ride')]",
    "negative_captions": "[('skateboard', 'carry'), ('skateboard', 'grind'), ('skateboard', 'hold'), ('skateboard', 'sit_on'), ('skateboard', 'stand_on'), ('skateboard', 'no_interaction')]",
    "ambiguous_captions": "[('skateboard', 'jump'), ('skateboard', 'pick_up')]",
    "positive_objects": "[454, 459]",
    "negative_objects": "[453, 455, 456, 460, 461, 462]",
    "ambiguous_objects": "[457, 458]",
    "size": "[427, 640, 3]"
  },
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "teenager",
        "gender": "male",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a striped sweater, jeans, and shoes.",
        "clothing": [
          {
            "possible_names": [
              "sweater",
              "shirt"
            ],
            "name": "sweater",
            "type": "top",
            "color": [
              "blue",
              "black",
              "white"
            ]
          },
          {
            "possible_names": [
              "jeans",
              "pants",
              "trousers"
            ],
            "name": "jeans",
            "type": "bottom",
            "color": [
              "blue"
            ]
          },
          {
            "possible_names": [
              "shoes"
            ],
            "name": "shoes",
            "type": "footwear",
            "color": [
              "brown"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "skateboard"
            ],
            "name": "skateboard",
            "position": "body"
          }
        ],
        "description": "The person is a teenager who appears to be male. He is performing a skateboard trick, jumping with the skateboard separated from his feet. He is wearing a blue, black, and white striped sweater, blue jeans, and brown shoes. His emotion is not clearly visible in the image.",
        "blurry": false,
        "face_seen": false,
        "emotion_description": "The person's face is not visible, so their emotional state cannot be determined.",
        "meaningful": true,
        "story": "A teenager is performing a skateboarding trick at an outdoor skate park. He appears to be mid-air, suggesting he is skilled and confident in his abilities.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is performing a skateboard trick, likely an ollie, as they leap into the air with the skateboard beneath them. Their body is angled forward, suggesting focus and control over the movement, while their arms are outstretched for balance. The individual appears to be enjoying the activity, possibly motivated by a passion for skateboarding or the thrill of mastering new tricks. The setting seems to be a casual outdoor environment, perhaps a park or a recreational area, where the person has chosen to practice their skills away from busy streets. The presence of trash bins and a fence indicates this might be a designated space for such activities, providing a safe and appropriate location for practicing skateboarding techniques.",
        "intention": "The individual is motivated by a passion for skateboarding and the desire to master new tricks in a safe and suitable environment",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.3730999096933916,
            0.15314459621108004
          ],
          [
            0.3681396865334229,
            0.15721026201333319
          ],
          [
            0.3598047413128839,
            0.16394584165619952
          ],
          [
            0.36019587780010265,
            0.17310565592987198
          ],
          [
            0.3553810102080533,
            0.18149932138621808
          ],
          [
            0.35416288589625583,
            0.19179765635303087
          ],
          [
            0.3631163251244452,
            0.20257978950228012
          ],
          [
            0.3662581978214349,
            0.20696140495794157
          ],
          [
            0.37784164124964553,
            0.21192546401705062
          ],
          [
            0.394833542743069,
            0.21613060065678188
          ],
          [
            0.41390183475273595,
            0.21306096251521792
          ],
          [
            0.4244761047414331,
            0.20995815758194242
          ],
          [
            0.4318676422415229,
            0.20531052925757
          ],
          [
            0.4384286407644273,
            0.19882185629435947
          ],
          [
            0.44786225373468175,
            0.19550714758890014
          ],
          [
            0.45144647704833085,
            0.19028007750000273
          ],
          [
            0.4595280580594014,
            0.18534732604665416
          ],
          [
            0.39562119030561604,
            0.1603734090658171
          ],
          [
            0.4025193377456844,
            0.15708837133965323
          ],
          [
            0.41082340660363226,
            0.1576937290706805
          ],
          [
            0.41830152139571164,
            0.15934205212231195
          ],
          [
            0.4270794633321038,
            0.1620696000488741
          ],
          [
            0.4364456044028299,
            0.1651942361678396
          ],
          [
            0.44251345216171045,
            0.16835700731192316
          ],
          [
            0.45564527948710704,
            0.17419833344008243
          ],
          [
            0.4548848925246248,
            0.17780926610742295
          ],
          [
            0.45126570327978305,
            0.1821865389389651
          ],
          [
            0.4246563999179854,
            0.175450130126306
          ],
          [
            0.41789566581167076,
            0.181436771314059
          ],
          [
            0.4118098708529582,
            0.18632247314921446
          ],
          [
            0.4066572537107905,
            0.19133524830852236
          ],
          [
            0.40444134884193295,
            0.18991046590464455
          ],
          [
            0.4063256468889346,
            0.19012258137975419
          ],
          [
            0.4065530163741662,
            0.19273615713630404
          ],
          [
            0.40893556218994387,
            0.19330140394823891
          ],
          [
            0.41122394024468295,
            0.1951812390770231
          ],
          [
            0.39949935046515367,
            0.16759191565215587
          ],
          [
            0.4041791905045469,
            0.16908467369420188
          ],
          [
            0.4112988303201419,
            0.17007058236215794
          ],
          [
            0.4129644453266306,
            0.17247250133327077
          ],
          [
            0.4079251779126818,
            0.17109806622777665
          ],
          [
            0.4003731015136147,
            0.167458238825202
          ],
          [
            0.43679005663384557,
            0.1788978859782219
          ],
          [
            0.43386028873039034,
            0.17916402641151633
          ],
          [
            0.4407348798724392,
            0.18177570498415402
          ],
          [
            0.4429667553561872,
            0.18462825263185162
          ],
          [
            0.43621760317616415,
            0.18544380829802581
          ],
          [
            0.434833754421118,
            0.1815784358552524
          ],
          [
            0.3845879266636154,
            0.19157341410006795
          ],
          [
            0.3928283188565593,
            0.19461859783955981
          ],
          [
            0.39953557509329457,
            0.19509806696857726
          ],
          [
            0.4021807386947739,
            0.19611470784459795
          ],
          [
            0.40530021567933333,
            0.1959101105374949
          ],
          [
            0.40859709235887215,
            0.1989607334136963
          ],
          [
            0.4076072492500578,
            0.20010525371347154
          ],
          [
            0.40433559436868294,
            0.20221593731216023
          ],
          [
            0.3952182254172281,
            0.20558150357433727
          ],
          [
            0.38966491191273106,
            0.20584852610315596
          ],
          [
            0.3849926671283067,
            0.20313343607953618
          ],
          [
            0.3828016969024158,
            0.19825202258569855
          ],
          [
            0.3870085636163165,
            0.1953614796910967
          ],
          [
            0.39422908105272714,
            0.19734723142215183
          ],
          [
            0.40123641447065345,
            0.20238239009465492
          ],
          [
            0.4047661788011323,
            0.20149248327527727
          ],
          [
            0.41019955236563205,
            0.19945848499025617
          ],
          [
            0.4019006044420361,
            0.1999369173177651
          ],
          [
            0.39429393983996003,
            0.19977394406284604
          ],
          [
            0.38969640326603633,
            0.1955557795507567
          ]
        ],
        "visibility": [
          0.14425012469291687,
          0.9999806880950928,
          0.9911862015724182,
          0.9999926090240479,
          0.782291054725647,
          0.02616747096180916,
          0.9988595247268677,
          0.9999995231628418,
          0.0005332647124305367,
          0.999792754650116,
          0.21675600111484528,
          0.002374209463596344,
          0.5223268866539001,
          4.696367614087649e-05,
          0.9999991655349731,
          0.9925244450569153,
          4.414337126945611e-06,
          0.19054070115089417,
          0.0005257887532934546,
          0.2958618402481079,
          8.429035369772464e-05,
          1.641108497096866e-06,
          1.5129748476283567e-07,
          4.591347035898252e-08,
          0.0013446625089272857,
          0.0009894977556541562,
          1.7063133554984233e-06,
          3.9125206967582926e-05,
          0.9998476505279541
        ],
        "headpose": {
          "pitch": -33.33155196099942,
          "yaw": 1.8628369793687167,
          "roll": 24.5637866800685
        },
        "attributes": {
          "5 oClock Shadow": 0.018756357952952385,
          "Arched Eyebrows": 0.00014392200682777911,
          "Attractive": 0.024764366447925568,
          "Bags Under Eyes": 0.0062800622545182705,
          "Bald": 4.1139605855278205e-06,
          "Bangs": 0.4928283095359802,
          "Big Lips": 0.06660106033086777,
          "Big Nose": 0.025187989696860313,
          "Black Hair": 0.0010266297031193972,
          "Blond Hair": 0.11766514182090759,
          "Blurry": 0.8709814548492432,
          "Brown Hair": 0.030384227633476257,
          "Bushy Eyebrows": 0.005389474797993898,
          "Chubby": 0.0013617759104818106,
          "Double Chin": 0.0001281069708056748,
          "Eyeglasses": 0.032157305628061295,
          "Goatee": 0.038167934864759445,
          "Gray Hair": 0.0016941167414188385,
          "Heavy Makeup": 0.0026545675937086344,
          "High Cheekbones": 0.008298651315271854,
          "Male": 0.9848653078079224,
          "Mouth Slightly Open": 0.025975966826081276,
          "Mustache": 0.01712943986058235,
          "Narrow Eyes": 0.1437220573425293,
          "No Beard": 0.5962144136428833,
          "Oval Face": 0.03042967990040779,
          "Pale Skin": 0.0006496808491647243,
          "Pointy Nose": 0.07410629093647003,
          "Receding Hairline": 0.0003487028006929904,
          "Rosy Cheeks": 0.0001587487931828946,
          "Sideburns": 0.008221547119319439,
          "Smiling": 0.009552855044603348,
          "Straight Hair": 0.2195560485124588,
          "Wavy Hair": 0.026813674718141556,
          "Wearing Earrings": 0.00031678221421316266,
          "Wearing Hat": 0.01462255883961916,
          "Wearing Lipstick": 0.004883222281932831,
          "Wearing Necklace": 0.03091479279100895,
          "Wearing Necktie": 0.002800880465656519,
          "Young": 0.9531955718994141
        },
        "age": [
          0.0002951450296677649,
          0.6636707186698914,
          0.9993327260017395,
          0.3198714256286621,
          8.492466440657154e-05,
          3.972532431362197e-05,
          8.954790246207267e-06,
          8.810771667810968e-09
        ],
        "race": [
          0.9992623925209045,
          0.008884747512638569,
          0.9962314963340759,
          0.00014224536425899714,
          0.0020965011790394783
        ],
        "gender": [
          0.9992684721946716,
          0.00238935649394989
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 0.0007599578566441778,
          "disgust": 4.269187434124966e-09,
          "fear": 0.001336070454271976,
          "happy": 97.75466322898865,
          "sad": 1.3991895131766796,
          "surprise": 1.014939510213253e-06,
          "neutral": 0.8440486155450344
        },
        "dominant_emotion": "happy",
        "region": {
          "x": 0,
          "y": 0,
          "w": 59,
          "h": 50,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 34,
        "gender": {
          "Woman": 35.854822397232056,
          "Man": 64.14517760276794
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 9.383366071186428,
          "indian": 3.5055456909862572,
          "black": 0.38648680759142684,
          "white": 48.32947244223788,
          "middle eastern": 25.1807734477981,
          "latino hispanic": 13.214356494805603
        },
        "dominant_race": "white"
      },
      "hoi": [
        {
          "relationship": {
            "action": [
              [
                "standalone",
                "flip"
              ],
              [
                "standalone",
                "ride"
              ]
            ],
            "negative_action": [
              "carry",
              "grind",
              "hold",
              "sit on",
              "stand on",
              "no interaction"
            ],
            "position": "standalone"
          },
          "object": 0
        }
      ]
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.001222418388351798,
        0.042879484593868256,
        0.8079395294189453,
        0.5250973105430603
      ]
    ],
    "face_boxes": [
      [
        0.3507278859615326,
        0.15846684575080872,
        0.4440450668334961,
        0.2115035355091095
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.3582613790621523,
            0.1391630885036041
          ],
          [
            0.2669712243184365,
            0.12335052549218135
          ],
          [
            0.0738574354374995,
            0.07766978790362673
          ],
          [
            -0.0016325002159577472,
            0.06244287537410855
          ],
          [
            0.4495515338058681,
            0.15497565151502685
          ],
          [
            0.5636642272355127,
            0.17840167079120875
          ],
          [
            0.6953327196543334,
            0.19479988428453607
          ],
          [
            0.20552592785632023,
            0.28850396138926354
          ],
          [
            0.2845270233076127,
            0.4068053587339818
          ],
          [
            0.18972570876606176,
            0.4372591837930182
          ],
          [
            0.33719442027514096,
            0.2838187575340271
          ],
          [
            0.4811519719863851,
            0.33769860186924544
          ],
          [
            0.6777769206651574,
            0.44897219343110917
          ],
          [
            0.40039529663617496,
            0.18894337946549059
          ],
          [
            0.4319957348166919,
            0.1936285833207269
          ],
          [
            0.3670392785567404,
            0.15497565151502685
          ],
          [
            0.4600850131993736,
            0.17488776789978147
          ]
        ],
        "dw_hand_1": [
          [
            0.7076217789467567,
            0.19948508813977242
          ],
          [
            0.7199108382391799,
            0.20768419488643602
          ],
          [
            0.7339554774305206,
            0.21471200066929058
          ],
          [
            0.7497556965207791,
            0.2229111074159543
          ],
          [
            0.7620447558132027,
            0.22759631127119065
          ],
          [
            0.7620447558132027,
            0.20417029199500875
          ],
          [
            0.7778449749034613,
            0.21236939874167246
          ],
          [
            0.7831117146002138,
            0.2229111074159543
          ],
          [
            0.7848672944991315,
            0.23111021416261793
          ],
          [
            0.7655559156110376,
            0.20182769006739062
          ],
          [
            0.7831117146002138,
            0.21002679681405426
          ],
          [
            0.7883784542969668,
            0.22173980645214514
          ],
          [
            0.7901340341958843,
            0.23345281609023613
          ],
          [
            0.7673114955099554,
            0.20182769006739062
          ],
          [
            0.7831117146002138,
            0.20885549585024518
          ],
          [
            0.7883784542969668,
            0.21939720452452702
          ],
          [
            0.7901340341958843,
            0.2287676122349997
          ],
          [
            0.7655559156110376,
            0.20065638910358147
          ],
          [
            0.7778449749034613,
            0.20651289392262698
          ],
          [
            0.7848672944991315,
            0.21354069970548153
          ],
          [
            0.7866228743980492,
            0.21939720452452702
          ]
        ],
        "dw_hand_2": [
          [
            0.005389819379712715,
            0.0671280792293449
          ],
          [
            0.010656559076465543,
            0.06947068115696312
          ],
          [
            0.014167718874300742,
            0.06947068115696312
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.007145399278630346,
            0.06478547730172676
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_face": [
          [
            0.3723060182534931,
            0.16668866115311784
          ],
          [
            0.3670392785567404,
            0.17020256404454512
          ],
          [
            0.3652836986578227,
            0.17605906886359052
          ],
          [
            0.36177253885998745,
            0.18074427271882695
          ],
          [
            0.36001695896107,
            0.18660077753787235
          ],
          [
            0.36001695896107,
            0.1912859813931088
          ],
          [
            0.36001695896107,
            0.1971424862121542
          ],
          [
            0.36177253885998745,
            0.20417029199500875
          ],
          [
            0.3670392785567404,
            0.20885549585024518
          ],
          [
            0.3740615981524108,
            0.21236939874167246
          ],
          [
            0.38283949764699887,
            0.21236939874167246
          ],
          [
            0.391617397141587,
            0.2111980977778633
          ],
          [
            0.40039529663617496,
            0.20768419488643602
          ],
          [
            0.4091731961307629,
            0.20768419488643602
          ],
          [
            0.4179510956253511,
            0.2053415929588179
          ],
          [
            0.4249734152210214,
            0.20065638910358147
          ],
          [
            0.4319957348166919,
            0.19597118524834514
          ],
          [
            0.3968841368383397,
            0.18191557368263603
          ],
          [
            0.40039529663617496,
            0.18308687464644507
          ],
          [
            0.40741761623184547,
            0.18425817561025423
          ],
          [
            0.41268435592859815,
            0.1877720785016815
          ],
          [
            0.4179510956253511,
            0.19011468042929963
          ],
          [
            0.42672899511993906,
            0.1936285833207269
          ],
          [
            0.4284845750188567,
            0.1936285833207269
          ],
          [
            0.43024015491777434,
            0.1936285833207269
          ],
          [
            0.4319957348166919,
            0.19479988428453607
          ],
          [
            0.435506894614527,
            0.19479988428453607
          ],
          [
            0.4179510956253511,
            0.19479988428453607
          ],
          [
            0.41443993582751587,
            0.19831378717596335
          ],
          [
            0.41268435592859815,
            0.20182769006739062
          ],
          [
            0.4091731961307629,
            0.2053415929588179
          ],
          [
            0.3951285569394221,
            0.20182769006739062
          ],
          [
            0.3968841368383397,
            0.2029989910311997
          ],
          [
            0.39863971673725734,
            0.20417029199500875
          ],
          [
            0.4039064564340101,
            0.2053415929588179
          ],
          [
            0.40741761623184547,
            0.20651289392262698
          ],
          [
            0.3951285569394221,
            0.18660077753787235
          ],
          [
            0.39863971673725734,
            0.1877720785016815
          ],
          [
            0.4039064564340101,
            0.19011468042929963
          ],
          [
            0.40741761623184547,
            0.1912859813931088
          ],
          [
            0.4021508765350926,
            0.1912859813931088
          ],
          [
            0.3968841368383397,
            0.18894337946549059
          ],
          [
            0.42321783532210394,
            0.19479988428453607
          ],
          [
            0.4249734152210214,
            0.19597118524834514
          ],
          [
            0.42672899511993906,
            0.19597118524834514
          ],
          [
            0.4284845750188567,
            0.1971424862121542
          ],
          [
            0.42672899511993906,
            0.1971424862121542
          ],
          [
            0.4249734152210214,
            0.19597118524834514
          ],
          [
            0.38283949764699887,
            0.20065638910358147
          ],
          [
            0.3881062373437516,
            0.2029989910311997
          ],
          [
            0.3933729770405044,
            0.2053415929588179
          ],
          [
            0.3951285569394221,
            0.20651289392262698
          ],
          [
            0.3968841368383397,
            0.20768419488643602
          ],
          [
            0.3951285569394221,
            0.20885549585024518
          ],
          [
            0.3933729770405044,
            0.20885549585024518
          ],
          [
            0.3933729770405044,
            0.20885549585024518
          ],
          [
            0.391617397141587,
            0.20885549585024518
          ],
          [
            0.3898618172426693,
            0.20885549585024518
          ],
          [
            0.38459507754591643,
            0.20651289392262698
          ],
          [
            0.38283949764699887,
            0.20417029199500875
          ],
          [
            0.38283949764699887,
            0.20182769006739062
          ],
          [
            0.38635065744483416,
            0.20417029199500875
          ],
          [
            0.3933729770405044,
            0.20651289392262698
          ],
          [
            0.3933729770405044,
            0.20885549585024518
          ],
          [
            0.3933729770405044,
            0.20885549585024518
          ],
          [
            0.391617397141587,
            0.20768419488643602
          ],
          [
            0.391617397141587,
            0.20651289392262698
          ],
          [
            0.38635065744483416,
            0.20417029199500875
          ]
        ],
        "dw_foot_1": [
          [
            0.7813561347012961,
            0.4606852030692002
          ],
          [
            0.7708226553077907,
            0.4571713001777729
          ],
          [
            0.6865548201597453,
            0.459513902105391
          ]
        ],
        "dw_foot_2": [
          [
            0.2371263660368372,
            0.5075372416215638
          ],
          [
            0.19674802836173227,
            0.5016807368025183
          ],
          [
            0.170414329877968,
            0.42671747511873637
          ]
        ]
      }
    ]
  },
  "objects": [
    {
      "name": "skateboard",
      "possible_names": [
        "skateboard"
      ],
      "box": [
        0.04918032786885246,
        0.5484375,
        0.5784543325526932,
        0.6640625
      ]
    }
  ],
  "scene": "A skateboarder performs an aerial trick over a trash can on a green court surrounded by a chain-link fence and trees with a striped shirt and jeans as the focal point of the action shot",
  "overall_past": "Before the current scene, the individual likely approached the trash can from a short distance, building momentum by rolling steadily across the green court. They may have taken a moment to assess the space, checking the positioning of the trash can and the surrounding area for clearance, then began to crouch slightly in preparation for the jump. With focused intent, they pushed down on the tail of the skateboard to initiate the ollie, launching themselves and the board into the air just as they cleared the obstacle.",
  "overall_past_clean": "The individual accelerated smoothly across the surface, eyes locked on the target, body lowering into a controlled stance as they gauged the space and timing, then drove forcefully into the motion that would lift them and their board into the air.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to land smoothly back on the ground, maintaining balance and control as they roll forward on the skateboard to absorb the impact of the trick. The momentum from the ollie will carry them past the trash can, and they may immediately begin preparing for the next maneuver—perhaps a grind or a flip—using the surrounding environment, such as the edge of the fence or a nearby rail, as part of their routine. The casual, focused demeanor suggests a practiced flow, indicating that this moment is part of a continuous sequence of tricks rather than a one-off attempt.",
  "overall_future_clean": "The body shifts seamlessly into motion, the board slicing through the air with precision as momentum carries forward, the edge of the surface catching beneath the wheels to initiate a controlled grind, the stance adjusting mid-motion to maintain balance and drive into the next trick with fluid, deliberate force.",
  "future_scene_ok": false
}