{
  "image_path": "./ref_datasets/hico_det/images/train/train_00023771.jpg",
  "image_id": "train_00023771",
  "width": 591,
  "height": 287,
  "split": "train",
  "source": "zhimeng/hico_det",
  "dataset_index": 23771,
  "annotations": {
    "objects": "[{'id': 386, 'bbox_human': [28, 548, 43, 266], 'bbox_object': [248, 386, 106, 204], 'connection': 1, 'invis': 0}]",
    "positive_captions": "[('laptop', 'read')]",
    "negative_captions": "[('laptop', 'repair'), ('laptop', 'type_on'), ('laptop', 'no_interaction')]",
    "ambiguous_captions": "[('laptop', 'hold'), ('laptop', 'open')]",
    "positive_objects": "[385]",
    "negative_objects": "[386, 387, 388]",
    "ambiguous_objects": "[383, 384]",
    "size": "[591, 287, 3]"
  },
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "male",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a white shirt, blue jeans, and white headphones. He also has a yellow bracelet on his wrist.",
        "clothing": [
          {
            "possible_names": [
              "shirt",
              "t-shirt"
            ],
            "name": "shirt",
            "type": "top",
            "color": [
              "white"
            ]
          },
          {
            "possible_names": [
              "jeans",
              "pants"
            ],
            "name": "jeans",
            "type": "bottom",
            "color": [
              "blue"
            ]
          },
          {
            "possible_names": [
              "headphones",
              "earphones"
            ],
            "name": "headphones",
            "type": "accessory",
            "color": [
              "white"
            ]
          },
          {
            "possible_names": [
              "bracelet"
            ],
            "name": "bracelet",
            "type": "accessory",
            "color": [
              "yellow"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "laptop",
              "computer"
            ],
            "name": "laptop",
            "position": "body"
          },
          {
            "standalone": false,
            "possible_names": [
              "socket",
              "power outlet"
            ],
            "name": "socket",
            "position": "foot"
          }
        ],
        "description": "An adult male is lying down, wearing a white shirt, blue jeans, and white headphones. He has a yellow bracelet on his wrist. He is using a laptop placed on his body and has a power cord plugged into an outlet near his foot.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to be focused on something, possibly listening to music or engaged in work, as indicated by the headphones and laptop setup. There is no strong emotional expression visible.",
        "meaningful": true,
        "story": "The individual seems to be relaxing while working or enjoying some leisure activity. He is lying down with a laptop on his lap and headphones on, suggesting he might be listening to music, watching a video, or perhaps even working remotely in a comfortable setting.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "A person is reclining on the ground with a laptop resting on their lap and headphones on, suggesting they might be engaged in some form of digital entertainment or work. Their legs are extended with feet plugged into an electrical outlet, which humorously implies they are recharging themselves like a device. The individual appears relaxed and content, possibly enjoying a moment of leisure or productivity, indicating a playful take on modern technology's role in daily life.",
        "intention": "The individual is humorously portraying themselves as a device in need of charging to highlight the pervasive integration of technology into everyday life",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.15854612989128286,
            0.2637991290474603
          ],
          [
            0.1597415752851188,
            0.30238294435295077
          ],
          [
            0.16384265833152273,
            0.33866127359742487
          ],
          [
            0.1693431811831785,
            0.37190439500519146
          ],
          [
            0.17901569603432888,
            0.39459655366767515
          ],
          [
            0.18931046458929668,
            0.4146775681916726
          ],
          [
            0.20043311068364494,
            0.42960266903183725
          ],
          [
            0.21023975860562508,
            0.4395607492115558
          ],
          [
            0.22282590179129846,
            0.4359542596037558
          ],
          [
            0.2239427410925187,
            0.41433819874772504
          ],
          [
            0.2237322905053832,
            0.3959470590351232
          ],
          [
            0.22547330296151963,
            0.3797078415076492
          ],
          [
            0.22790123985849317,
            0.3610769967762257
          ],
          [
            0.2290515465122045,
            0.3386385107348961
          ],
          [
            0.22666191426572924,
            0.31505845232707697
          ],
          [
            0.2261047812801414,
            0.2953898580350824
          ],
          [
            0.22869676445197273,
            0.26764798959491853
          ],
          [
            0.20183757586498782,
            0.26762040756780037
          ],
          [
            0.20779391386268622,
            0.24887108885868087
          ],
          [
            0.21091061731107516,
            0.24610728087740907
          ],
          [
            0.21685126221407605,
            0.23791533907353432
          ],
          [
            0.2205504593078082,
            0.23580281327410443
          ],
          [
            0.22556478273531425,
            0.24673795344047492
          ],
          [
            0.2265365663749284,
            0.2478893008500323
          ],
          [
            0.22661584743935906,
            0.25182464432514623
          ],
          [
            0.22733662593528964,
            0.2542600769377158
          ],
          [
            0.22742456210705575,
            0.2645009384041345
          ],
          [
            0.2247813584178088,
            0.2699157198369058
          ],
          [
            0.22888837207594095,
            0.2867832971841557
          ],
          [
            0.23308903807339704,
            0.30471314144941514
          ],
          [
            0.2358598887761895,
            0.3223936879379706
          ],
          [
            0.21980157104816764,
            0.3327060849468408
          ],
          [
            0.22456395421478811,
            0.33404875205131596
          ],
          [
            0.22711437740330537,
            0.33874808691697905
          ],
          [
            0.22842153063251514,
            0.3377553845828537
          ],
          [
            0.22803149535686518,
            0.3403214359235977
          ],
          [
            0.20581725187165625,
            0.2699923479717249
          ],
          [
            0.2087683059871269,
            0.2686928938490173
          ],
          [
            0.2145847420142646,
            0.26759184575781053
          ],
          [
            0.21404021553351218,
            0.27325372615223686
          ],
          [
            0.2134201343952241,
            0.27530829665552864
          ],
          [
            0.20837815821617447,
            0.2709714017025922
          ],
          [
            0.22572104574143098,
            0.27433344687674993
          ],
          [
            0.22573865125627082,
            0.2742667191060637
          ],
          [
            0.2272876272000983,
            0.27641166888284946
          ],
          [
            0.22565728902874402,
            0.27872437799433797
          ],
          [
            0.22623185878621804,
            0.2760353069390866
          ],
          [
            0.22487190307440147,
            0.27684518862506413
          ],
          [
            0.21198193820052483,
            0.36164055421258634
          ],
          [
            0.21869868819541274,
            0.3615935474203973
          ],
          [
            0.2272512490316552,
            0.3611164615188682
          ],
          [
            0.22707401268258026,
            0.36275190141676905
          ],
          [
            0.22660318468687238,
            0.36678589535566514
          ],
          [
            0.22527643618215995,
            0.374192119653454
          ],
          [
            0.22490558838654118,
            0.3717871400596729
          ],
          [
            0.22507744605396576,
            0.3724448477943006
          ],
          [
            0.22568695966477606,
            0.37625201060559516
          ],
          [
            0.22486281204776887,
            0.38091832906704987
          ],
          [
            0.2198287597565885,
            0.3763238765399452
          ],
          [
            0.2157342541699021,
            0.3678748898389863
          ],
          [
            0.21148999624273065,
            0.36186492449018476
          ],
          [
            0.21769054748022473,
            0.3608037740689359
          ],
          [
            0.22466373754809785,
            0.36893913910838727
          ],
          [
            0.22526435699905498,
            0.37215918412310617
          ],
          [
            0.22593688907212958,
            0.3711313918907883
          ],
          [
            0.22525242546603444,
            0.3727060168937049
          ],
          [
            0.22488833441952158,
            0.37559154580753795
          ],
          [
            0.21662812075062826,
            0.3640703929485285
          ]
        ],
        "visibility": [
          1.8673864538021334e-12,
          2.177747774112504e-06,
          5.550454443437047e-05,
          1.3544471533927238e-13,
          3.293603547378332e-15,
          6.577683818627389e-14,
          3.0429681377577585e-18,
          1.081571796371101e-14,
          0.1260870397090912,
          1.9917870304198004e-06,
          0.00043633917812258005,
          0.00012683810200542212,
          4.378595974685595e-08,
          3.867199893647921e-09,
          2.440788456764542e-14,
          4.659126556783022e-11,
          9.382805643554093e-10,
          4.822706036605728e-12,
          0.002727077342569828,
          0.9990460276603699,
          3.0288647145937375e-09,
          3.0736690970201153e-10,
          3.695342456921935e-05,
          0.00017730840772856027,
          4.463357461403916e-11,
          1.0998905963788275e-06,
          0.40004804730415344,
          0.011180169880390167,
          0.9804297685623169
        ],
        "headpose": {
          "pitch": -0.3734147662176481,
          "yaw": -59.73236070702516,
          "roll": 2.5057007873526635
        },
        "attributes": {
          "5 oClock Shadow": 0.3456949293613434,
          "Arched Eyebrows": 0.0037418280262500048,
          "Attractive": 0.051526401191949844,
          "Bags Under Eyes": 0.08740422874689102,
          "Bald": 0.062221329659223557,
          "Bangs": 6.6278785197937395e-06,
          "Big Lips": 0.04311368241906166,
          "Big Nose": 0.10868041217327118,
          "Black Hair": 0.08505377918481827,
          "Blond Hair": 0.0025390887167304754,
          "Blurry": 0.3558887541294098,
          "Brown Hair": 0.006781418342143297,
          "Bushy Eyebrows": 0.17004014551639557,
          "Chubby": 0.008893203921616077,
          "Double Chin": 0.002124043181538582,
          "Eyeglasses": 0.006776782684028149,
          "Goatee": 0.03301797807216644,
          "Gray Hair": 0.010539006441831589,
          "Heavy Makeup": 8.352072472916916e-05,
          "High Cheekbones": 0.022229354828596115,
          "Male": 0.9996688365936279,
          "Mouth Slightly Open": 0.037646908313035965,
          "Mustache": 0.028834136202931404,
          "Narrow Eyes": 0.25528794527053833,
          "No Beard": 0.45461007952690125,
          "Oval Face": 0.030035650357604027,
          "Pale Skin": 0.00834601279348135,
          "Pointy Nose": 0.2532084882259369,
          "Receding Hairline": 0.2954052984714508,
          "Rosy Cheeks": 5.7605819165473804e-05,
          "Sideburns": 0.1082397997379303,
          "Smiling": 0.012024412862956524,
          "Straight Hair": 0.051366012543439865,
          "Wavy Hair": 0.007105881813913584,
          "Wearing Earrings": 0.0014486477011814713,
          "Wearing Hat": 0.0009242485975846648,
          "Wearing Lipstick": 0.00010114054748555645,
          "Wearing Necklace": 0.0016160676022991538,
          "Wearing Necktie": 0.12817448377609253,
          "Young": 0.62931889295578
        },
        "age": [
          0.0003662496746983379,
          0.007581319194287062,
          0.9076775312423706,
          0.878211498260498,
          0.9522030353546143,
          0.21147778630256653,
          0.011347068473696709,
          2.9216960683697835e-05
        ],
        "race": [
          0.5343911051750183,
          0.13217319548130035,
          0.8939277529716492,
          0.19810675084590912,
          0.6185281872749329
        ],
        "gender": [
          0.9972503781318665,
          0.005468273535370827
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 96.65971994400024,
          "disgust": 2.3872884225006885e-08,
          "fear": 0.0001387276142850169,
          "happy": 0.28024057392030954,
          "sad": 3.0598968267440796,
          "surprise": 2.0012158403327097e-16,
          "neutral": 3.8822185466358405e-07
        },
        "dominant_emotion": "angry",
        "region": {
          "x": 0,
          "y": 0,
          "w": 60,
          "h": 95,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 26,
        "gender": {
          "Woman": 0.019026815425604582,
          "Man": 99.98098015785217
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 0.0002830559651556541,
          "indian": 1.5623870305716991,
          "black": 0.016454329306725413,
          "white": 2.947081997990608,
          "middle eastern": 94.27343606948853,
          "latino hispanic": 1.2003571726381779
        },
        "dominant_race": "middle eastern"
      },
      "hoi": [
        {
          "relationship": {
            "action": [
              [
                "thigh",
                "read"
              ]
            ],
            "negative_action": [
              "repair",
              "type on",
              "no interaction"
            ],
            "position": "thigh"
          },
          "object": 0
        }
      ]
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.059168439358472824,
        0.15739759802818298,
        0.9224512577056885,
        0.9112855195999146
      ]
    ],
    "face_boxes": [
      [
        0.16634607315063477,
        0.19533781707286835,
        0.23599112033843994,
        0.41895246505737305
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.15625140504586918,
            0.4934644173142802
          ],
          [
            0.1127712538500526,
            0.5121177051748548
          ],
          [
            0.09646619715162139,
            0.8292235988046234
          ],
          [
            0.23596501557153293,
            0.8627995169536578
          ],
          [
            0.19973155624168576,
            0.47481112945370557
          ],
          [
            0.266763456001903,
            0.6203067747661877
          ],
          [
            0.39720390958935275,
            0.6314987474825324
          ],
          [
            0.3609704502595056,
            0.7620717625065547
          ],
          [
            0.6091696466689586,
            0.7732637352228996
          ],
          [
            0.8464988052794574,
            0.7583411049344398
          ],
          [
            0.4026389284888298,
            0.6725359807757966
          ],
          [
            0.6019229548029892,
            0.6874586110642563
          ],
          [
            0.7975836351841638,
            0.7695330776507846
          ],
          [
            0.20878992107414757,
            0.2957395659921892
          ],
          [
            0.22509497777257878,
            0.29200890842007426
          ],
          [
            0.15081638614639212,
            0.3032008811364191
          ],
          [
            0.19610821030870104,
            0.29947022356430414
          ]
        ],
        "dw_hand_1": [
          [
            0.393580563656368,
            0.6613440080594518
          ],
          [
            0.3990155825558451,
            0.6650746656315667
          ],
          [
            0.38814554475689095,
            0.6464213777709921
          ],
          [
            0.38452219882390626,
            0.6426907201988772
          ],
          [
            0.3790871799244292,
            0.7210345292132906
          ],
          [
            0.3899572177233833,
            0.6426907201988772
          ],
          [
            0.38452219882390626,
            0.6613440080594518
          ],
          [
            0.38452219882390626,
            0.6911892686363712
          ],
          [
            0.38452219882390626,
            0.6911892686363712
          ],
          [
            0.393580563656368,
            0.6613440080594518
          ],
          [
            0.393580563656368,
            0.6837279534921413
          ],
          [
            0.393580563656368,
            0.6837279534921413
          ],
          [
            0.3863338717903986,
            0.6613440080594518
          ],
          [
            0.39720390958935275,
            0.6613440080594518
          ],
          [
            0.3827105258574139,
            0.6613440080594518
          ],
          [
            0.3827105258574139,
            0.6837279534921413
          ],
          [
            0.3827105258574139,
            0.6911892686363712
          ],
          [
            0.393580563656368,
            0.6538826929152219
          ],
          [
            0.38452219882390626,
            0.6613440080594518
          ],
          [
            0.3808988528909215,
            0.6911892686363712
          ],
          [
            0.3827105258574139,
            0.6949199262084861
          ]
        ],
        "dw_hand_2": [
          [
            0.23777668853802528,
            0.8665301745257726
          ],
          [
            0.25770509116944124,
            0.8404155715209681
          ],
          [
            0.27763349380085717,
            0.8105703109440487
          ],
          [
            0.2957502234657807,
            0.8068396533719339
          ],
          [
            0.3138669531307043,
            0.8068396533719339
          ],
          [
            0.3011852423652578,
            0.8217622836603936
          ],
          [
            0.3229253179631661,
            0.8217622836603936
          ],
          [
            0.3356070287286126,
            0.8254929412325085
          ],
          [
            0.3464770665275667,
            0.8292235988046234
          ],
          [
            0.30299691533175016,
            0.847876886665198
          ],
          [
            0.32473699092965846,
            0.851607544237313
          ],
          [
            0.34104204762808965,
            0.851607544237313
          ],
          [
            0.3555354313600285,
            0.8590688593815428
          ],
          [
            0.2993735693987654,
            0.8739914896700025
          ],
          [
            0.3211136449966737,
            0.8777221472421174
          ],
          [
            0.3337953557621202,
            0.8777221472421174
          ],
          [
            0.3464770665275667,
            0.8814528048142324
          ],
          [
            0.29393855049928835,
            0.900106092674807
          ],
          [
            0.3102436071977196,
            0.900106092674807
          ],
          [
            0.31930197203018135,
            0.896375435102692
          ],
          [
            0.32836033686264315,
            0.900106092674807
          ]
        ],
        "dw_face": [
          [
            0.16349809691183861,
            0.29200890842007426
          ],
          [
            0.16349809691183861,
            0.31439285385276383
          ],
          [
            0.165309769878331,
            0.33304614171333846
          ],
          [
            0.16712144284482333,
            0.355430087146028
          ],
          [
            0.1725564617443004,
            0.37035271743448767
          ],
          [
            0.17799148064377748,
            0.3890060052950623
          ],
          [
            0.18523817250974692,
            0.4001979780114071
          ],
          [
            0.1942965373422087,
            0.4076592931556369
          ],
          [
            0.20335490217467048,
            0.41885126587198174
          ],
          [
            0.21241326700713228,
            0.4225819234440966
          ],
          [
            0.2196599588731017,
            0.4151206082998668
          ],
          [
            0.22147163183959406,
            0.39646732043929217
          ],
          [
            0.22509497777257878,
            0.3740833750066026
          ],
          [
            0.22509497777257878,
            0.355430087146028
          ],
          [
            0.22690665073907113,
            0.3367767992854534
          ],
          [
            0.22690665073907113,
            0.31439285385276383
          ],
          [
            0.22690665073907113,
            0.2957395659921892
          ],
          [
            0.19791988327519341,
            0.2808169357037295
          ],
          [
            0.20516657514116285,
            0.27335562055949963
          ],
          [
            0.2106015940406399,
            0.27335562055949963
          ],
          [
            0.21422493997362463,
            0.27708627813161457
          ],
          [
            0.2196599588731017,
            0.2808169357037295
          ],
          [
            0.22509497777257878,
            0.28454759327584445
          ],
          [
            0.22509497777257878,
            0.28454759327584445
          ],
          [
            0.22690665073907113,
            0.28454759327584445
          ],
          [
            0.22690665073907113,
            0.2808169357037295
          ],
          [
            0.22690665073907113,
            0.28454759327584445
          ],
          [
            0.2232833048060864,
            0.29947022356430414
          ],
          [
            0.22690665073907113,
            0.3106621962806489
          ],
          [
            0.23052999667205584,
            0.32185416899699365
          ],
          [
            0.23415334260504056,
            0.33304614171333846
          ],
          [
            0.21784828590660935,
            0.3442381144296832
          ],
          [
            0.22147163183959406,
            0.34796877200179815
          ],
          [
            0.22509497777257878,
            0.34796877200179815
          ],
          [
            0.2287183237055635,
            0.34796877200179815
          ],
          [
            0.23234166963854821,
            0.3442381144296832
          ],
          [
            0.20154322920817813,
            0.29947022356430414
          ],
          [
            0.2069782481076552,
            0.2957395659921892
          ],
          [
            0.2106015940406399,
            0.2957395659921892
          ],
          [
            0.21241326700713228,
            0.29947022356430414
          ],
          [
            0.20878992107414757,
            0.3032008811364191
          ],
          [
            0.20516657514116285,
            0.3032008811364191
          ],
          [
            0.2232833048060864,
            0.29947022356430414
          ],
          [
            0.22509497777257878,
            0.2957395659921892
          ],
          [
            0.22509497777257878,
            0.29947022356430414
          ],
          [
            0.22509497777257878,
            0.29947022356430414
          ],
          [
            0.22509497777257878,
            0.29947022356430414
          ],
          [
            0.22509497777257878,
            0.29947022356430414
          ],
          [
            0.2106015940406399,
            0.37035271743448767
          ],
          [
            0.21784828590660935,
            0.3666220598623728
          ],
          [
            0.2232833048060864,
            0.36289140229025785
          ],
          [
            0.22509497777257878,
            0.36289140229025785
          ],
          [
            0.22509497777257878,
            0.36289140229025785
          ],
          [
            0.22509497777257878,
            0.37035271743448767
          ],
          [
            0.2232833048060864,
            0.3740833750066026
          ],
          [
            0.2232833048060864,
            0.37781403257871754
          ],
          [
            0.22509497777257878,
            0.3815446901508325
          ],
          [
            0.2232833048060864,
            0.3815446901508325
          ],
          [
            0.21784828590660935,
            0.3815446901508325
          ],
          [
            0.21422493997362463,
            0.37781403257871754
          ],
          [
            0.21241326700713228,
            0.37035271743448767
          ],
          [
            0.21784828590660935,
            0.37035271743448767
          ],
          [
            0.2232833048060864,
            0.37035271743448767
          ],
          [
            0.2232833048060864,
            0.37035271743448767
          ],
          [
            0.2232833048060864,
            0.3740833750066026
          ],
          [
            0.2232833048060864,
            0.3740833750066026
          ],
          [
            0.2232833048060864,
            0.3740833750066026
          ],
          [
            0.21603661294011697,
            0.3740833750066026
          ]
        ],
        "dw_foot_1": [
          [
            0.8700505538438581,
            0.5195790203190847
          ],
          [
            0.8519338241789345,
            0.549424280896004
          ],
          [
            0.8428754593464727,
            0.8366849139488532
          ]
        ],
        "dw_foot_2": [
          [
            0.8917906294417663,
            0.5158483627469698
          ],
          [
            0.8972256483412434,
            0.5718082263286937
          ],
          [
            0.8664272079108734,
            0.7956476806555891
          ]
        ]
      }
    ]
  },
  "objects": [
    {
      "name": "laptop",
      "possible_names": [
        "laptop"
      ],
      "box": [
        0.4196277495769882,
        0.3693379790940767,
        0.6531302876480541,
        0.710801393728223
      ]
    }
  ],
  "scene": "A person is reclining with a laptop on their lap and headphones connected to it while their feet are plugged into an electrical outlet suggesting a humorous take on charging oneself through technology amidst a stark white background with blue jeans and white shirt as the main colors and objects in view",
  "overall_past": "Before the current scene, the individual likely realized their laptop was running low on battery while they were in the middle of an important task or immersive digital experience—perhaps a long work session, a streaming marathon, or an online meeting. Frustrated by the dwindling charge and unwilling to move or search for a charger, they improvised by using their own body as a power source, plugging their feet into the outlet in a humorous, exaggerated attempt to stay connected and powered. This act reflects a satirical commentary on how deeply reliant modern people are on technology, to the point of treating themselves like devices in need of constant charging.",
  "overall_past_clean": "The device had been steadily losing power through hours of uninterrupted use, the screen flickering with warnings that grew more urgent with each passing minute, until the low battery alert became an insistent, inescapable presence demanding immediate attention.",
  "past_scene_ok": false,
  "overall_future": "After the current scene, the laptop might suddenly shut down due to a power surge from the unconventional charging method, causing the person to jolt awake in surprise—only to realize the outlet was not designed to power human beings, leading to a comical moment of self-awareness and laughter as they unplug their feet and check the laptop’s battery, which is now at 100%.",
  "overall_future_clean": "The device powers down abruptly with a sharp click, sending a jolt through the body, followed by a stunned pause before erupting into laughter at the absurdity of the situation, hands flying to unplug the connection while the screen confirms a full charge.",
  "future_scene_ok": false
}