{
  "image_path": "./ref_datasets/hico_det/images/train/train_00008926.jpg",
  "image_id": "train_00008926",
  "width": 640,
  "height": 494,
  "split": "train",
  "source": "zhimeng/hico_det",
  "dataset_index": 8926,
  "annotations": {
    "objects": "[{'id': 246, 'bbox_human': [264, 586, 50, 455], 'bbox_object': [192, 539, 208, 458], 'connection': 1, 'invis': 0}]",
    "positive_captions": "[('bench', 'sit_on')]",
    "negative_captions": "[('bench', 'inspect'), ('bench', 'lie_on'), ('bench', 'no_interaction')]",
    "ambiguous_captions": "[]",
    "positive_objects": "[245]",
    "negative_objects": "[243, 244, 246]",
    "ambiguous_objects": "[]",
    "size": "[640, 494, 3]"
  },
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "senior",
        "gender": "male",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a teal and gray long-sleeve shirt and dark blue pants. He has a black cap with a logo on it.",
        "clothing": [
          {
            "possible_names": [
              "shirt",
              "sweater",
              "long-sleeve shirt"
            ],
            "name": "long sleeve shirt",
            "type": "top",
            "color": [
              "teal",
              "gray"
            ]
          },
          {
            "possible_names": [
              "pants",
              "jeans"
            ],
            "name": "pants",
            "type": "bottom",
            "color": [
              "dark blue"
            ]
          },
          {
            "possible_names": [
              "cap",
              "hat"
            ],
            "name": "cap",
            "type": "headwear",
            "color": [
              "black"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "cane",
              "walking stick",
              "stick"
            ],
            "name": "cane",
            "position": "body"
          },
          {
            "standalone": false,
            "possible_names": [
              "chair",
              "bench",
              "seat"
            ],
            "name": "chair",
            "position": "body"
          }
        ],
        "description": "The person is a senior male sitting on a chair outdoors. He appears neutral in emotion. He is wearing a teal and gray long-sleeve shirt and dark blue pants, along with a black cap with a logo. The person has a cane leaning against him and is sitting on a chair. There is a bike and a column in the background.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a calm and composed expression, suggesting a neutral emotional state.",
        "meaningful": true,
        "story": "An elderly man sits quietly on a bench in a park, perhaps enjoying a moment of solitude. He holds a cane, indicating he may need assistance walking. The setting suggests a peaceful day out, possibly reflecting on life or simply resting.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The elderly man is seated on a white chair, holding a cane in his right hand, suggesting he may need support for walking. He appears to be resting or waiting, possibly taking a break from a walk given the presence of the bicycle nearby which could belong to him or someone accompanying him. His expression seems contemplative or perhaps slightly concerned, indicating he might be deep in thought or observing something off-camera that has caught his attention. The setting, an outdoor area with trees and a pathway, suggests a peaceful environment where he might enjoy spending time alone or with company, reflecting on memories or simply enjoying the tranquility around him.",
        "intention": "The individual is taking a momentary pause in a serene outdoor setting likely seeking reflection or observing something of interest nearby while preparing to continue their journey",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.6008862616494298,
            0.19067576346609758
          ],
          [
            0.6008270155638457,
            0.21427502419784483
          ],
          [
            0.5982600577175617,
            0.2416129063980782
          ],
          [
            0.5990855885669589,
            0.2700422978111607
          ],
          [
            0.6035439927130938,
            0.2950867544784237
          ],
          [
            0.612967112660408,
            0.3161510648997689
          ],
          [
            0.6266168352216482,
            0.33371965122609004
          ],
          [
            0.6404872085899115,
            0.3476055276538679
          ],
          [
            0.6590203396975994,
            0.35313064366699715
          ],
          [
            0.6700083330273628,
            0.34170228749634285
          ],
          [
            0.6764421366155148,
            0.32565295647995673
          ],
          [
            0.6829227335751057,
            0.3117645086064512
          ],
          [
            0.6883436791598797,
            0.2970238349698333
          ],
          [
            0.6958462089300156,
            0.2800824120942398
          ],
          [
            0.7002999722957611,
            0.2627261785360483
          ],
          [
            0.7024505451321602,
            0.2433479546535353
          ],
          [
            0.7071265742182732,
            0.22577579784007207
          ],
          [
            0.6472111154347658,
            0.2035041589003343
          ],
          [
            0.6563502006232739,
            0.1936692216618341
          ],
          [
            0.6638967968523503,
            0.19598351412939158
          ],
          [
            0.6724471315741539,
            0.19760774263003578
          ],
          [
            0.6800503894686699,
            0.20141278297794976
          ],
          [
            0.69514729231596,
            0.20755295232240006
          ],
          [
            0.6983667254447937,
            0.20669014106395273
          ],
          [
            0.703041659295559,
            0.2083784211502384
          ],
          [
            0.706479312479496,
            0.20965874050310265
          ],
          [
            0.7072625622153282,
            0.21514716129071318
          ],
          [
            0.685839457064867,
            0.23128334809894022
          ],
          [
            0.6864410094916821,
            0.24735828932480292
          ],
          [
            0.6874568514525891,
            0.2639510206848021
          ],
          [
            0.6881371267139912,
            0.27980496526247095
          ],
          [
            0.6650132160633803,
            0.27775875469933636
          ],
          [
            0.6714373245835304,
            0.28135294084124235
          ],
          [
            0.6780914269387722,
            0.2865507535123632
          ],
          [
            0.6845037281513214,
            0.2867782222114594
          ],
          [
            0.6892008014023304,
            0.2842230738898521
          ],
          [
            0.6508417032659054,
            0.22109836412344866
          ],
          [
            0.6563117388635874,
            0.21931273831047027
          ],
          [
            0.6664885930716992,
            0.22174370144060265
          ],
          [
            0.6681112289428711,
            0.22775138051886307
          ],
          [
            0.664326123520732,
            0.23117048248105687
          ],
          [
            0.6547955419868231,
            0.22666391959557167
          ],
          [
            0.6911664359271527,
            0.23253211511774102
          ],
          [
            0.6934274487197399,
            0.22832872220861766
          ],
          [
            0.7003102764487267,
            0.2297520608554485
          ],
          [
            0.7009936586022377,
            0.23464421029032967
          ],
          [
            0.699345787614584,
            0.23921738751986732
          ],
          [
            0.6932108044624329,
            0.23808194654673218
          ],
          [
            0.6472448945045471,
            0.2999172326524248
          ],
          [
            0.6586237974464894,
            0.29807454854370613
          ],
          [
            0.6713912576436997,
            0.29886099394516424
          ],
          [
            0.6751776203513146,
            0.3004595644560903
          ],
          [
            0.6786376923322678,
            0.30154443655902075
          ],
          [
            0.6805436924099922,
            0.3058877821393341
          ],
          [
            0.6804071791470051,
            0.3111110660228652
          ],
          [
            0.6780761830508709,
            0.3114542671543384
          ],
          [
            0.6747381068766117,
            0.31376029798376415
          ],
          [
            0.6704364806413651,
            0.31584344701728356
          ],
          [
            0.6616251446306706,
            0.31178855509893133
          ],
          [
            0.6534301299601794,
            0.30651938480886853
          ],
          [
            0.6488376628607512,
            0.2996449026501613
          ],
          [
            0.6601559143513441,
            0.30077439281139295
          ],
          [
            0.6734253443777561,
            0.3047334810017574
          ],
          [
            0.6762172557413578,
            0.30762124930316137
          ],
          [
            0.6796510867774487,
            0.3101667373286568
          ],
          [
            0.6764004841446877,
            0.3081618957673972
          ],
          [
            0.6721596769988537,
            0.3078529574127815
          ],
          [
            0.6601630445569754,
            0.3036409814348105
          ]
        ],
        "visibility": [
          0.00594007782638073,
          0.9677538275718689,
          0.9999713897705078,
          0.07320341467857361,
          0.952238917350769,
          0.9999998807907104,
          0.00026335680740885437,
          0.2226388305425644,
          0.644701361656189,
          3.549569953520404e-07,
          0.0004739116702694446,
          0.0003386824100743979,
          0.9988493919372559,
          3.5361019001811655e-08,
          0.40696388483047485,
          1.0090010424401719e-11,
          5.031646423958591e-07,
          1.1510984876395014e-07,
          1.2389993742090155e-07,
          0.9985451698303223,
          2.980573080013649e-11,
          7.25789233519471e-16,
          5.682135751500228e-12,
          2.4587628807970496e-11,
          7.017133402120734e-11,
          1.7617324266083756e-11,
          3.572581249930429e-12,
          1.3928251997932795e-13,
          5.076441880191851e-07
        ],
        "headpose": {
          "pitch": -13.917111490547942,
          "yaw": -34.80694453870846,
          "roll": 14.990777954486218
        },
        "attributes": {
          "5 oClock Shadow": 0.03210899606347084,
          "Arched Eyebrows": 0.00012699338549282402,
          "Attractive": 0.008751656860113144,
          "Bags Under Eyes": 0.672919511795044,
          "Bald": 0.0003837008844129741,
          "Bangs": 0.007767960429191589,
          "Big Lips": 0.0379779189825058,
          "Big Nose": 0.6407086849212646,
          "Black Hair": 0.0023914100602269173,
          "Blond Hair": 0.002191617852076888,
          "Blurry": 0.07188477367162704,
          "Brown Hair": 0.0029812862630933523,
          "Bushy Eyebrows": 0.00046116980956867337,
          "Chubby": 0.04279610887169838,
          "Double Chin": 0.021128490567207336,
          "Eyeglasses": 0.0004970357986167073,
          "Goatee": 0.0026190457865595818,
          "Gray Hair": 0.09212915599346161,
          "Heavy Makeup": 4.9869944632519037e-05,
          "High Cheekbones": 0.08494903147220612,
          "Male": 0.999250590801239,
          "Mouth Slightly Open": 0.4319509267807007,
          "Mustache": 0.0039152586832642555,
          "Narrow Eyes": 0.015610354952514172,
          "No Beard": 0.949124813079834,
          "Oval Face": 0.04790937155485153,
          "Pale Skin": 0.013385951519012451,
          "Pointy Nose": 0.021345315501093864,
          "Receding Hairline": 0.0005578979034908116,
          "Rosy Cheeks": 7.428506069118157e-05,
          "Sideburns": 0.0012997437734156847,
          "Smiling": 0.058965053409338,
          "Straight Hair": 0.01276753842830658,
          "Wavy Hair": 0.009818492457270622,
          "Wearing Earrings": 0.00047660720883868635,
          "Wearing Hat": 0.947585940361023,
          "Wearing Lipstick": 0.00013932697765994817,
          "Wearing Necklace": 0.0007548054563812912,
          "Wearing Necktie": 0.035605769604444504,
          "Young": 0.03492071479558945
        },
        "age": [
          0.0005631144740618765,
          0.0014648637734353542,
          0.008015033788979053,
          0.002130163600668311,
          0.07652067393064499,
          0.9069665670394897,
          0.9623351097106934,
          0.9897342920303345
        ],
        "race": [
          0.5267518758773804,
          0.5137530565261841,
          0.936130702495575,
          0.11677158623933792,
          0.10455852001905441
        ],
        "gender": [
          0.9975838661193848,
          0.00431798305362463
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 0.0009857491610110237,
          "disgust": 7.202614490039917e-08,
          "fear": 0.24798504623681583,
          "happy": 0.00016049150237265267,
          "sad": 99.73161218950821,
          "surprise": 2.3197301019401556e-07,
          "neutral": 0.019260287501531095
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 104,
          "h": 125,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 61,
        "gender": {
          "Woman": 7.315360754728317,
          "Man": 92.6846444606781
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 2.27380311950408,
          "indian": 4.428998970508698,
          "black": 0.5582472575310161,
          "white": 56.42295999253273,
          "middle eastern": 21.78386488153161,
          "latino hispanic": 14.53212177370527
        },
        "dominant_race": "white"
      },
      "hoi": [
        {
          "relationship": {
            "action": [
              [
                "body",
                "sit on"
              ]
            ],
            "negative_action": [
              "inspect",
              "lie on",
              "no interaction"
            ],
            "position": "body"
          },
          "object": 0
        }
      ]
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.4127216339111328,
        0.09948693215847015,
        0.8999484777450562,
        0.9308195114135742
      ]
    ],
    "face_boxes": [
      [
        0.5997260212898254,
        0.1790110170841217,
        0.7090304493904114,
        0.34991785883903503
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.5623168307046096,
            0.373950061849576
          ],
          [
            0.5198899962007999,
            0.36570517093385596
          ],
          [
            0.5983796400328478,
            0.6529022044981057
          ],
          [
            0.7065680680175621,
            0.6460314620683391
          ],
          [
            0.6047436652084193,
            0.3821949527652961
          ],
          [
            0.6047436652084193,
            0.6322899772088054
          ],
          [
            0.6927793468038242,
            0.6941266590767061
          ],
          [
            0.5209506670633951,
            0.824670765242274
          ],
          [
            0.8232418629030386,
            0.7133647378800528
          ],
          [
            0.856122659643491,
            0.918112862287102
          ],
          [
            0.582469577093919,
            0.7697048258041403
          ],
          [
            0.8232418629030386,
            0.7106164409081462
          ],
          [
            0.8444552801549434,
            0.9002489319697082
          ],
          [
            0.6577772083381813,
            0.22966447082447464
          ],
          [
            0.6949006885290145,
            0.23516106476828794
          ],
          [
            0.5867122605443,
            0.2324127677963813
          ],
          [
            0.7023253845671814,
            0.24615425265591467
          ]
        ],
        "dw_hand_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_hand_2": [
          [
            0.697022030254205,
            0.6432831650964321
          ],
          [
            0.6938400176664192,
            0.630915828722852
          ],
          [
            0.6949006885290145,
            0.6212967893211788
          ],
          [
            0.6949006885290145,
            0.6254192347790389
          ],
          [
            0.6927793468038242,
            0.6364124226666655
          ],
          [
            0.7182354475061098,
            0.6212967893211788
          ],
          [
            0.7118714223305386,
            0.635038274180712
          ],
          [
            0.7065680680175621,
            0.641909016610479
          ],
          [
            0.7033860554297764,
            0.6460314620683391
          ],
          [
            0.7224781309564907,
            0.6336641256947589
          ],
          [
            0.7161141057809193,
            0.6446573135823856
          ],
          [
            0.7139927640557289,
            0.6529022044981057
          ],
          [
            0.7108107514679431,
            0.6529022044981057
          ],
          [
            0.7245994726816815,
            0.6501539075261992
          ],
          [
            0.7203567892313003,
            0.6570246499559658
          ],
          [
            0.7192961183687052,
            0.6625212438997793
          ],
          [
            0.7161141057809193,
            0.6652695408716858
          ],
          [
            0.723538801819086,
            0.6652695408716858
          ],
          [
            0.7203567892313003,
            0.6693919863295459
          ],
          [
            0.7192961183687052,
            0.6735144317874059
          ],
          [
            0.7161141057809193,
            0.677636877245266
          ]
        ],
        "dw_face": [
          [
            0.5962582983076572,
            0.21454883747898773
          ],
          [
            0.5962582983076572,
            0.23516106476828794
          ],
          [
            0.5962582983076572,
            0.2543991435716348
          ],
          [
            0.5983796400328478,
            0.27501137086093497
          ],
          [
            0.6026223234832286,
            0.2942494496642819
          ],
          [
            0.6100470195213953,
            0.3107392314957221
          ],
          [
            0.6206537281473476,
            0.3244807163552555
          ],
          [
            0.6323211076358953,
            0.3368480527288356
          ],
          [
            0.6450491579870384,
            0.3450929436445557
          ],
          [
            0.6598985500633716,
            0.3492153891024158
          ],
          [
            0.6736872712771099,
            0.3423446466726492
          ],
          [
            0.6821726381778717,
            0.325854864841209
          ],
          [
            0.6885366633534431,
            0.30936508300976884
          ],
          [
            0.6949006885290145,
            0.29150115269237514
          ],
          [
            0.7002040428419909,
            0.27226307388902843
          ],
          [
            0.7023253845671814,
            0.2530249950856815
          ],
          [
            0.7044467262923717,
            0.2324127677963813
          ],
          [
            0.6408064745366573,
            0.21454883747898773
          ],
          [
            0.6492918414374191,
            0.21180054050708105
          ],
          [
            0.6588378792007763,
            0.21317468899303446
          ],
          [
            0.6673232461015385,
            0.21454883747898773
          ],
          [
            0.6747479421397049,
            0.21867128293684776
          ],
          [
            0.6906580050786337,
            0.22279372839470782
          ],
          [
            0.6949006885290145,
            0.22141957990875455
          ],
          [
            0.6991433719793955,
            0.22141957990875455
          ],
          [
            0.7023253845671814,
            0.22141957990875455
          ],
          [
            0.7055073971549671,
            0.2241678768806612
          ],
          [
            0.6832333090404671,
            0.23378691628233467
          ],
          [
            0.6853546507656574,
            0.24890254962782146
          ],
          [
            0.6864153216282528,
            0.26264403448735485
          ],
          [
            0.6874759924908478,
            0.2763855193468885
          ],
          [
            0.6673232461015385,
            0.2818821132907018
          ],
          [
            0.6736872712771099,
            0.28463041026260855
          ],
          [
            0.6800512964526811,
            0.28737870723451514
          ],
          [
            0.6853546507656574,
            0.2887528557204686
          ],
          [
            0.6895973342160383,
            0.28463041026260855
          ],
          [
            0.6461098288496336,
            0.22691617385256785
          ],
          [
            0.6535345248878002,
            0.22279372839470782
          ],
          [
            0.6620198917885622,
            0.2241678768806612
          ],
          [
            0.6673232461015385,
            0.2324127677963813
          ],
          [
            0.6598985500633716,
            0.23378691628233467
          ],
          [
            0.6524738540252051,
            0.2324127677963813
          ],
          [
            0.6864153216282528,
            0.23653521325424132
          ],
          [
            0.6917186759412288,
            0.22966447082447464
          ],
          [
            0.697022030254205,
            0.22966447082447464
          ],
          [
            0.701264713704586,
            0.23653521325424132
          ],
          [
            0.697022030254205,
            0.239283510226148
          ],
          [
            0.6917186759412288,
            0.239283510226148
          ],
          [
            0.6482311705748239,
            0.3011201920940487
          ],
          [
            0.6598985500633716,
            0.29974604360809526
          ],
          [
            0.6726266004145145,
            0.3011201920940487
          ],
          [
            0.6758086130023002,
            0.302494340580002
          ],
          [
            0.6800512964526811,
            0.302494340580002
          ],
          [
            0.6821726381778717,
            0.3052426375519088
          ],
          [
            0.6832333090404671,
            0.3079909345238153
          ],
          [
            0.6800512964526811,
            0.3107392314957221
          ],
          [
            0.6768692838648956,
            0.3134875284676289
          ],
          [
            0.6726266004145145,
            0.31486167695358214
          ],
          [
            0.6641412335137528,
            0.3134875284676289
          ],
          [
            0.6556558666129908,
            0.3079909345238153
          ],
          [
            0.6503525123000145,
            0.3011201920940487
          ],
          [
            0.6620198917885622,
            0.30386848906595526
          ],
          [
            0.6747479421397049,
            0.3066167860378621
          ],
          [
            0.6779299547274906,
            0.3079909345238153
          ],
          [
            0.6821726381778717,
            0.3079909345238153
          ],
          [
            0.6779299547274906,
            0.3079909345238153
          ],
          [
            0.6736872712771099,
            0.3079909345238153
          ],
          [
            0.6620198917885622,
            0.3052426375519088
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            0.895367481559515,
            0.8947523380258947
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.8529406470557055,
            0.926357753202822
          ]
        ]
      }
    ]
  },
  "objects": [
    {
      "name": "bench",
      "possible_names": [
        "bench"
      ],
      "box": [
        0.3,
        0.42105263157894735,
        0.8421875,
        0.9271255060728745
      ]
    }
  ],
  "scene": "A serene outdoor setting features a bicycle leaning against a column and a white chair with a cane resting on it amidst soft natural light and muted colors creating a calm atmosphere",
  "overall_past": "Before the current scene, the elderly man likely completed a quiet bicycle ride along the tree-lined pathway, perhaps enjoying the gentle breeze and the soft light filtering through the leaves. He may have paused to rest, leaning his bicycle against the column as he settled into the white chair, using his cane for support. The thoughtful expression suggests he was reflecting on a memory—perhaps of a past journey, a loved one, or a moment from his life that the peaceful setting evoked. The presence of the bicycle and the calm atmosphere imply this was not just a physical break, but a deliberate pause to reconnect with the stillness and beauty of the moment.",
  "overall_past_clean": "The figure had moved steadily along the winding path, the rhythm of their motion steady and deliberate, before coming to a halt, setting down their means of transport with care, and allowing themselves to settle into stillness as the surrounding quiet settled over them like a familiar embrace.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual may slowly rise from the white chair, using the cane for support, and walk toward the bicycle leaning against the column. As he reaches it, he might pause to adjust his balance, glance around the peaceful surroundings one last time, and then mount the bicycle, beginning a slow ride down the tree-lined pathway. This suggests a continuation of a quiet, reflective journey—perhaps a return home or a continuation of a daily ritual—where the stillness of the moment gives way to gentle motion, symbolizing resilience and the quiet rhythm of life.",
  "overall_future_clean": "The figure pedals forward with steady resolve, the wheels humming softly against the path as the trees lean in to whisper secrets, each breath a rhythm, each turn a quiet defiance against stillness, carrying the weight of silence into the unfolding light.",
  "future_scene_ok": false
}