{
  "image_path": "./ref_datasets/hico_det/images/train/train_00020812.jpg",
  "image_id": "train_00020812",
  "width": 640,
  "height": 441,
  "split": "train",
  "source": "zhimeng/hico_det",
  "dataset_index": 20812,
  "annotations": {
    "objects": "[{'id': 386, 'bbox_human': [25, 430, 1, 441], 'bbox_object': [190, 479, 282, 418], 'connection': 1, 'invis': 0}]",
    "positive_captions": "[('laptop', 'read')]",
    "negative_captions": "[('laptop', 'open'), ('laptop', 'repair'), ('laptop', 'no_interaction')]",
    "ambiguous_captions": "[('laptop', 'hold'), ('laptop', 'type_on')]",
    "positive_objects": "[385]",
    "negative_objects": "[384, 386, 388]",
    "ambiguous_objects": "[383, 387]",
    "size": "[640, 441, 3]"
  },
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a dark gray long-sleeved top and dark pants. She has a wristband on her left wrist and is wearing stud earrings.",
        "clothing": [
          {
            "possible_names": [
              "sweater",
              "shirt",
              "blouse"
            ],
            "name": "sweater",
            "type": "top",
            "color": [
              "dark gray"
            ]
          },
          {
            "possible_names": [
              "pants",
              "jeans"
            ],
            "name": "pants",
            "type": "bottom",
            "color": [
              "dark"
            ]
          },
          {
            "possible_names": [
              "wristband",
              "bracelet"
            ],
            "name": "wristband",
            "type": "accessory",
            "color": [
              "silver"
            ]
          },
          {
            "possible_names": [
              "earrings"
            ],
            "name": "earrings",
            "type": "accessory",
            "color": [
              "silver"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "laptop",
              "computer"
            ],
            "name": "laptop",
            "position": "body"
          }
        ],
        "description": "The person is an adult female sitting in a classroom or lecture hall. She appears neutral in emotion and is holding a laptop on her lap. She is wearing a dark gray sweater, dark pants, a silver wristband, and silver stud earrings. The laptop is in contact with her body as she uses it.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to be focused on something, possibly the laptop screen, with a neutral expression that suggests concentration rather than strong emotion.",
        "meaningful": true,
        "story": "The person seems to be engaged in work or study at a public space, such as a library or conference room, using a laptop. The setting suggests a professional or academic environment.",
        "race": "black",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is seated comfortably in a wooden chair, focused on the laptop resting on their lap, suggesting they might be engaged in work or study. Their hand is raised near their face, possibly indicating deep thought or concentration as they interact with the content on the screen. The presence of a pen in their other hand implies they may be taking notes or preparing to write something down. Their expression appears calm and attentive, reflecting a sense of dedication to the task at hand. The setting, which looks like a classroom or lecture hall, supports the idea that they could be a student or an attendee at a seminar, fully immersed in the learning process.",
        "intention": "The individual is deeply engaged in processing information with the intent to understand and retain knowledge through active note-taking and thoughtful reflection",
        "intention_ok": false
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.23870044010026112,
            0.2203285579044996
          ],
          [
            0.24261329770088197,
            0.2580194165878864
          ],
          [
            0.2467259319765227,
            0.2960463602024643
          ],
          [
            0.2525977632829121,
            0.33175016662083595
          ],
          [
            0.26604309592928205,
            0.35846817281047694
          ],
          [
            0.2822852381638118,
            0.3784840737958537
          ],
          [
            0.3015255536351885,
            0.39095830901911777
          ],
          [
            0.3196222645895822,
            0.3979180314064335
          ],
          [
            0.3368876951081412,
            0.3999097334129894
          ],
          [
            0.3471355216843741,
            0.3880338634840678
          ],
          [
            0.35447000946317403,
            0.3727480935015492
          ],
          [
            0.36127905249595643,
            0.3498056505658613
          ],
          [
            0.3655254364013672,
            0.33011297381036214
          ],
          [
            0.37024515356336324,
            0.3044411057131477
          ],
          [
            0.37130830458232333,
            0.2749864444170409
          ],
          [
            0.3712730016027178,
            0.2503394411727762
          ],
          [
            0.3720085782664163,
            0.22159709071587852
          ],
          [
            0.28660888246127536,
            0.21284275623367255
          ],
          [
            0.2976810412747519,
            0.19683616880386595
          ],
          [
            0.3089449588741575,
            0.19555243698184377
          ],
          [
            0.32081417441368104,
            0.19936394838210175
          ],
          [
            0.33203192608697074,
            0.2027972718446742
          ],
          [
            0.34945666704859046,
            0.20180972587108456
          ],
          [
            0.354551408120564,
            0.19618455993731432
          ],
          [
            0.35886724846703666,
            0.19299817000309702
          ],
          [
            0.36596849901335576,
            0.18674249374098018
          ],
          [
            0.37045546429497855,
            0.19579422354196166
          ],
          [
            0.3408158285277231,
            0.23587426994084
          ],
          [
            0.3438639419419425,
            0.25276995245831896
          ],
          [
            0.3460415380341666,
            0.269162428120328
          ],
          [
            0.3473770609923771,
            0.2871935613957817
          ],
          [
            0.3304604836872646,
            0.3012131906304886
          ],
          [
            0.33716710465294975,
            0.3002692662206019
          ],
          [
            0.3431864670344761,
            0.3037421393633893
          ],
          [
            0.34742144516536166,
            0.3018275746875957
          ],
          [
            0.3521559527942112,
            0.30076240759510653
          ],
          [
            0.2983280794961112,
            0.23898677467566154
          ],
          [
            0.3054335896457945,
            0.2350259071266068
          ],
          [
            0.3172305515834263,
            0.23223881710683947
          ],
          [
            0.32275845663888114,
            0.23912903526511284
          ],
          [
            0.3167527032749994,
            0.24290297245338274
          ],
          [
            0.3051477427993502,
            0.24376735403038052
          ],
          [
            0.3496524427618299,
            0.23669005768716936
          ],
          [
            0.3545446004186358,
            0.22865394701029362
          ],
          [
            0.36357161317552833,
            0.22788761316243214
          ],
          [
            0.366260016816003,
            0.23390471468011964
          ],
          [
            0.3641153608049665,
            0.23673806022122565
          ],
          [
            0.3548901200294495,
            0.23934234551793362
          ],
          [
            0.3154341867991856,
            0.3345769675835306
          ],
          [
            0.3267676055431366,
            0.3259227234914846
          ],
          [
            0.3397897175380161,
            0.31830362475030355
          ],
          [
            0.3442955221448626,
            0.3206049780417771
          ],
          [
            0.34799460768699647,
            0.3192186831346715
          ],
          [
            0.35378447515623906,
            0.32622318280179563
          ],
          [
            0.3560021000249045,
            0.3380159218024775
          ],
          [
            0.35308194075311927,
            0.3525204008205601
          ],
          [
            0.3475471258163452,
            0.3674276065857309
          ],
          [
            0.3415300624711173,
            0.37509755683555396
          ],
          [
            0.3326302119663784,
            0.3702697543832219
          ],
          [
            0.3233645720141275,
            0.35665248905450037
          ],
          [
            0.31727708790983467,
            0.3356466231548481
          ],
          [
            0.33154044321605136,
            0.33380242277589633
          ],
          [
            0.3427235305309296,
            0.3347005485754628
          ],
          [
            0.348344840322222,
            0.3369641126379984
          ],
          [
            0.3544000932148525,
            0.3364176201828097
          ],
          [
            0.3492163028035845,
            0.34581195261627484
          ],
          [
            0.3428788559777396,
            0.3485131299260136
          ],
          [
            0.3302720138004848,
            0.3456089766156067
          ]
        ],
        "visibility": [
          0.00011949860345339403,
          3.9847924426794634e-07,
          0.14621475338935852,
          1.660704640471522e-08,
          3.2074216615995965e-09,
          8.159146318575949e-07,
          3.483884256638703e-07,
          1.2634473467443286e-09,
          0.00010320845467504114,
          6.365996523527429e-05,
          5.495468258231995e-08,
          0.20805281400680542,
          0.004007014911621809,
          1.0204914815403754e-06,
          0.00033063211594708264,
          2.5936247993740835e-07,
          2.7553988957151887e-07,
          1.6715002004730195e-07,
          1.390533937994931e-10,
          0.99172443151474,
          1.5043087608912487e-10,
          2.4249477209234427e-13,
          6.500051148369823e-13,
          0.0031958550680428743,
          2.578697999016809e-15,
          1.5539027787485164e-14,
          6.945727992757611e-09,
          1.9527007566466636e-07,
          7.0277387465012e-08
        ],
        "headpose": {
          "pitch": -9.166513432223558,
          "yaw": -29.54581374558772,
          "roll": 3.6080431601910044
        },
        "attributes": {
          "5 oClock Shadow": 0.011749781668186188,
          "Arched Eyebrows": 0.08013489842414856,
          "Attractive": 0.027094140648841858,
          "Bags Under Eyes": 0.06391075253486633,
          "Bald": 3.785208900808357e-05,
          "Bangs": 0.006394653115421534,
          "Big Lips": 0.6314959526062012,
          "Big Nose": 0.17166367173194885,
          "Black Hair": 0.8012300133705139,
          "Blond Hair": 0.0003716919745784253,
          "Blurry": 0.08240808546543121,
          "Brown Hair": 0.01980501040816307,
          "Bushy Eyebrows": 0.019676022231578827,
          "Chubby": 0.07334665209054947,
          "Double Chin": 0.009762242436408997,
          "Eyeglasses": 0.000709504762198776,
          "Goatee": 0.0006209784187376499,
          "Gray Hair": 0.0006877747946418822,
          "Heavy Makeup": 0.04791755974292755,
          "High Cheekbones": 0.23986324667930603,
          "Male": 0.07836832851171494,
          "Mouth Slightly Open": 0.9749161005020142,
          "Mustache": 0.0007221515406854451,
          "Narrow Eyes": 0.08895709365606308,
          "No Beard": 0.9756964445114136,
          "Oval Face": 0.18040533363819122,
          "Pale Skin": 0.0004265272873453796,
          "Pointy Nose": 0.07046128064393997,
          "Receding Hairline": 0.20754610002040863,
          "Rosy Cheeks": 0.001487167552113533,
          "Sideburns": 0.0008531318744644523,
          "Smiling": 0.021337086334824562,
          "Straight Hair": 0.018730223178863525,
          "Wavy Hair": 0.38127753138542175,
          "Wearing Earrings": 0.5141394138336182,
          "Wearing Hat": 0.001985204638913274,
          "Wearing Lipstick": 0.1292612999677658,
          "Wearing Necklace": 0.03842153027653694,
          "Wearing Necktie": 0.0015501206507906318,
          "Young": 0.9601559638977051
        },
        "age": [
          0.052808210253715515,
          0.7541325688362122,
          0.9548483490943909,
          0.8023095726966858,
          0.3695870637893677,
          0.0032385741360485554,
          0.00021468846534844488,
          3.4216855056001805e-06
        ],
        "race": [
          0.00287922122515738,
          0.9885030388832092,
          0.2235109657049179,
          0.818273663520813,
          0.34611478447914124
        ],
        "gender": [
          0.048101454973220825,
          0.955333948135376
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 2.038089474964977e-07,
          "disgust": 8.00488336310735e-21,
          "fear": 0.009944813064066693,
          "happy": 3.448045460263671e-08,
          "sad": 0.017099954129662365,
          "surprise": 5.3579824604854664e-09,
          "neutral": 99.9729573726654
        },
        "dominant_emotion": "neutral",
        "region": {
          "x": 0,
          "y": 0,
          "w": 119,
          "h": 173,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 31,
        "gender": {
          "Woman": 95.86705565452576,
          "Man": 4.132940247654915
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 2.834970116662227e-06,
          "indian": 6.532282375792108e-05,
          "black": 99.99993443488684,
          "white": 1.3511012559160832e-09,
          "middle eastern": 1.517454447061656e-08,
          "latino hispanic": 1.011075017356063e-06
        },
        "dominant_race": "black"
      },
      "hoi": [
        {
          "relationship": {
            "action": [
              [
                "hand",
                "read"
              ]
            ],
            "negative_action": [
              "open",
              "repair",
              "no interaction"
            ],
            "position": "hand"
          },
          "object": 0
        }
      ]
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.04026374965906143,
        0.01192441489547491,
        0.6583569645881653,
        0.9924377202987671
      ]
    ],
    "face_boxes": [
      [
        0.2476120889186859,
        0.1306716948747635,
        0.3730267882347107,
        0.39424607157707214
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.26128553114831454,
            0.4628375814615193
          ],
          [
            0.17638789253930254,
            0.44495262796916657
          ],
          [
            0.09012093717853231,
            0.7867539613785749
          ],
          [
            0.30921161745985354,
            0.8682298606215151
          ],
          [
            0.3461831697573265,
            0.48072253495387207
          ],
          [
            0.44340465913216265,
            0.8225238683632804
          ],
          [
            0.40369447333117325,
            0.5562367830326946
          ],
          [
            0.1832344762980938,
            0.9397696745909261
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.354399070267876,
            0.9059869846609265
          ],
          [
            0.6200465201089781,
            0.9675907133568079
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.306472983956337,
            0.23828205427975693
          ],
          [
            0.3585070205231508,
            0.23828205427975693
          ],
          [
            0.23116056260963277,
            0.2581542248268157
          ],
          [
            0.37220018804073335,
            0.2502053566079921
          ]
        ],
        "dw_hand_1": [
          [
            0.3941092560688654,
            0.5443134807044595
          ],
          [
            0.3680922377854586,
            0.5164924419385776
          ],
          [
            0.34344453625380994,
            0.4866841861179897
          ],
          [
            0.33933658599853517,
            0.45886314735210754
          ],
          [
            0.33933658599853517,
            0.42309324036740203
          ],
          [
            0.35576838701963426,
            0.4409781938597548
          ],
          [
            0.35302975351611776,
            0.41713158920328447
          ],
          [
            0.348921803260843,
            0.4052082868750493
          ],
          [
            0.34344453625380994,
            0.39527220160152016
          ],
          [
            0.3680922377854586,
            0.4370037597503432
          ],
          [
            0.3653536042819421,
            0.41116993803916685
          ],
          [
            0.3612456540266673,
            0.4052082868750493
          ],
          [
            0.3571377037713924,
            0.4012338527656377
          ],
          [
            0.38178540530304106,
            0.4350165426956372
          ],
          [
            0.3776774550477664,
            0.41116993803916685
          ],
          [
            0.37220018804073335,
            0.4052082868750493
          ],
          [
            0.3680922377854586,
            0.4032210698203435
          ],
          [
            0.39547857282062376,
            0.4370037597503432
          ],
          [
            0.39137062256534894,
            0.41713158920328447
          ],
          [
            0.38589335555831594,
            0.41116993803916685
          ],
          [
            0.38178540530304106,
            0.4052082868750493
          ]
        ],
        "dw_hand_2": [
          [
            0.3133195677151283,
            0.870217077676221
          ],
          [
            0.33659795249501867,
            0.8543193412385739
          ],
          [
            0.3585070205231508,
            0.8364343877462211
          ],
          [
            0.38178540530304106,
            0.8344471706915155
          ],
          [
            0.4064331068346897,
            0.8443832559650447
          ],
          [
            0.38863198906183244,
            0.8245110854179859
          ],
          [
            0.41738764084875585,
            0.8304727365821035
          ],
          [
            0.4365580753733713,
            0.8463704730197508
          ],
          [
            0.4516205596427124,
            0.8602809924026914
          ],
          [
            0.3900013058135907,
            0.8364343877462211
          ],
          [
            0.4201262743522724,
            0.8423960389103387
          ],
          [
            0.4420353423804045,
            0.8582937753479859
          ],
          [
            0.45709782664974535,
            0.8722042947309266
          ],
          [
            0.38726267231007416,
            0.8543193412385739
          ],
          [
            0.41464900734523946,
            0.8582937753479859
          ],
          [
            0.43381944186985494,
            0.870217077676221
          ],
          [
            0.45025124289095403,
            0.8801531629497502
          ],
          [
            0.3804160885512829,
            0.8781659458950442
          ],
          [
            0.40095583982765676,
            0.8781659458950442
          ],
          [
            0.41601832409699746,
            0.8841275970591618
          ],
          [
            0.42971149161458017,
            0.8900892482232794
          ]
        ],
        "dw_face": [
          [
            0.2393764631201824,
            0.23629483722505115
          ],
          [
            0.24211509662369882,
            0.2621286589362273
          ],
          [
            0.2434844133754571,
            0.28796248064740365
          ],
          [
            0.24896168038249017,
            0.31379630235857975
          ],
          [
            0.25580826414128144,
            0.3356556899603443
          ],
          [
            0.26813211490710576,
            0.3555278605074028
          ],
          [
            0.28182528242468835,
            0.3714255969450498
          ],
          [
            0.29825708344578744,
            0.38334889927328497
          ],
          [
            0.31468888446688653,
            0.3932849845468141
          ],
          [
            0.3311206854879856,
            0.3932849845468141
          ],
          [
            0.3448138530055681,
            0.3793744651638732
          ],
          [
            0.35302975351611776,
            0.3575150775621086
          ],
          [
            0.3612456540266673,
            0.3356556899603443
          ],
          [
            0.3667229210337003,
            0.31180908530387397
          ],
          [
            0.37083087128897513,
            0.2859752635926976
          ],
          [
            0.37220018804073335,
            0.2601414418815215
          ],
          [
            0.37083087128897513,
            0.23430762017034537
          ],
          [
            0.2845639159282049,
            0.2184098837326984
          ],
          [
            0.29551844994227083,
            0.2124482325685808
          ],
          [
            0.306472983956337,
            0.21046101551387505
          ],
          [
            0.3160582012186447,
            0.21046101551387505
          ],
          [
            0.32701273523271085,
            0.2144354496232866
          ],
          [
            0.3516604367643595,
            0.21642266667799262
          ],
          [
            0.3571377037713924,
            0.2124482325685808
          ],
          [
            0.3612456540266673,
            0.21046101551387505
          ],
          [
            0.3667229210337003,
            0.208473798459169
          ],
          [
            0.37083087128897513,
            0.2124482325685808
          ],
          [
            0.34070590275029344,
            0.24225648838916874
          ],
          [
            0.34344453625380994,
            0.25616700777210966
          ],
          [
            0.3461831697573265,
            0.2700775271550509
          ],
          [
            0.348921803260843,
            0.2859752635926976
          ],
          [
            0.328382051984469,
            0.2998857829756388
          ],
          [
            0.3352286357432604,
            0.30187300003034456
          ],
          [
            0.34344453625380994,
            0.30187300003034456
          ],
          [
            0.348921803260843,
            0.30187300003034456
          ],
          [
            0.354399070267876,
            0.2978985659209328
          ],
          [
            0.2927798164387544,
            0.24225648838916874
          ],
          [
            0.3023650337010622,
            0.23828205427975693
          ],
          [
            0.31195025096337003,
            0.23828205427975693
          ],
          [
            0.3187968347221613,
            0.24424370544387453
          ],
          [
            0.31058093421161176,
            0.2482181395532863
          ],
          [
            0.3023650337010622,
            0.2482181395532863
          ],
          [
            0.348921803260843,
            0.24424370544387453
          ],
          [
            0.354399070267876,
            0.23828205427975693
          ],
          [
            0.3612456540266673,
            0.23828205427975693
          ],
          [
            0.3667229210337003,
            0.24225648838916874
          ],
          [
            0.3612456540266673,
            0.24623092249858056
          ],
          [
            0.35576838701963426,
            0.24623092249858056
          ],
          [
            0.31195025096337003,
            0.3356556899603443
          ],
          [
            0.32427410172919435,
            0.32373238763210915
          ],
          [
            0.33933658599853517,
            0.31777073646799153
          ],
          [
            0.34344453625380994,
            0.31777073646799153
          ],
          [
            0.3475524865090847,
            0.31777073646799153
          ],
          [
            0.35302975351611776,
            0.32571960468681493
          ],
          [
            0.35302975351611776,
            0.33764290701505006
          ],
          [
            0.3502911200126012,
            0.34956620934328525
          ],
          [
            0.3475524865090847,
            0.36148951167152044
          ],
          [
            0.33933658599853517,
            0.3654639457809322
          ],
          [
            0.32701273523271085,
            0.36148951167152044
          ],
          [
            0.31742751797040303,
            0.35155342639799103
          ],
          [
            0.3133195677151283,
            0.3356556899603443
          ],
          [
            0.328382051984469,
            0.32770682174152066
          ],
          [
            0.34344453625380994,
            0.32571960468681493
          ],
          [
            0.348921803260843,
            0.3296940387962267
          ],
          [
            0.3516604367643595,
            0.33764290701505006
          ],
          [
            0.3461831697573265,
            0.34956620934328525
          ],
          [
            0.33933658599853517,
            0.35354064345269703
          ],
          [
            0.32427410172919435,
            0.34956620934328525
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "objects": [
    {
      "name": "laptop",
      "possible_names": [
        "laptop"
      ],
      "box": [
        0.296875,
        0.6394557823129252,
        0.7484375,
        0.9478458049886621
      ]
    }
  ],
  "scene": "A person is seated indoors using a silver laptop with a warm yellow wall and wooden chairs surrounding them creating an intimate setting for focused work or study.",
  "overall_past": "Before the current scene, the individual likely entered the room, chose a wooden chair near the center of the space, and settled in with their laptop and notebook. They may have opened their device, perhaps logging in or launching a document or presentation, while simultaneously retrieving a pen from a nearby pocket or bag. The warm yellow wall and the quiet, focused atmosphere suggest the room had already been prepared for study or a session—possibly a lecture or seminar—implying that the individual arrived just before the session began or shortly after it started, giving them time to get settled and begin engaging with the material.",
  "overall_past_clean": "The individual entered the room with purpose, moved to a central wooden chair, placed their device and notebook on the surface, powered on the device, and retrieved a writing instrument, all within moments of the session's commencement, establishing a focused presence in a space already set for quiet engagement.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to lower their hand from their face, pause briefly to reflect on the notes they’ve just written, and then begin typing a response or summary into the laptop—perhaps drafting a thought for a paper, recording key insights from a lecture, or preparing for a discussion. The calm and focused demeanor suggests a moment of synthesis, where ideas are being processed and organized, leading naturally to the next step of articulating or documenting their understanding.",
  "overall_future_clean": "The hand descends steadily, fingers releasing their grip as the mind settles into clarity, then moves with purpose to the keyboard, fingers striking keys in deliberate rhythm, shaping thoughts into structured words that flow onto the screen.",
  "future_scene_ok": true
}