{
  "image_path": "./ref_datasets/hico_det/images/test/test_00001615.jpg",
  "image_id": "test_00001615",
  "width": 640,
  "height": 439,
  "split": "test",
  "source": "zhimeng/hico_det",
  "dataset_index": 1615,
  "annotations": {
    "objects": "[{'id': 90, 'bbox_human': [203, 611, 77, 438], 'bbox_object': [396, 605, 254, 438], 'connection': 1, 'invis': 0}]",
    "positive_captions": "[('chair', 'sit_on')]",
    "negative_captions": "[('chair', 'carry'), ('chair', 'hold'), ('chair', 'lie_on'), ('chair', 'stand_on'), ('chair', 'no_interaction')]",
    "ambiguous_captions": "[]",
    "positive_objects": "[89]",
    "negative_objects": "[86, 87, 88, 90, 91]",
    "ambiguous_objects": "[]",
    "size": "[640, 439, 3]"
  },
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "male",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a casual outfit consisting of a white polo shirt and beige pants. He is barefoot.",
        "clothing": {
          "vague": false,
          "clothing": [
            {
              "possible_names": [
                "shirt",
                "tee",
                "t-shirt"
              ],
              "name": "t-shirt",
              "type": "top",
              "color": [
                "white"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "pants",
                "trousers",
                "jeans"
              ],
              "name": "pants",
              "type": "bottom",
              "color": [
                "beige",
                "light brown"
              ],
              "belonging_confident": true,
              "existence_confident": true
            }
          ]
        },
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "pen"
            ],
            "name": "pen",
            "position": "hand"
          },
          {
            "standalone": false,
            "possible_names": [
              "tablet",
              "clipboard"
            ],
            "name": "tablet",
            "position": "body"
          }
        ],
        "description": "The person is a male adult sitting in a director's chair under a stall with glass items displayed on tables behind him. He appears happy, holding a pen in one hand and a tablet on his lap. He is casually dressed in a white polo shirt, beige pants, and is barefoot.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a neutral expression, possibly engaged in thought or observation while seated.",
        "meaningful": true,
        "story": "The individual seems to be taking a break at an outdoor event, possibly a market or exhibition, as indicated by the display of glassware behind him. He might be a vendor, an attendee, or someone involved in organizing the event.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is seated on a director's chair, casually dressed in a white t-shirt and beige pants, holding a pen and a notepad, suggesting they might be taking notes or planning something related to the event setup around them which includes tables draped in white cloths and adorned with various glassware and decorative items. Their relaxed posture and focused gaze towards the left indicate they could be engaged in conversation with someone off-camera or observing the ongoing activities at the event. The setting appears to be an outdoor market or exhibition under a tent, and the individual seems to be involved in organizing or managing aspects of it, possibly motivated by a desire to ensure everything runs smoothly or to document details for future reference.",
        "intention": "The individual is actively overseeing event logistics ensuring seamless execution and maintaining detailed records for continuity and improvement",
        "intention_ok": false
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.7977969484669821,
            0.2557038879922109
          ],
          [
            0.7998391483511244,
            0.27460489674961375
          ],
          [
            0.7987852790525982,
            0.29745115498320274
          ],
          [
            0.7966516630990165,
            0.3182810961210956
          ],
          [
            0.7955819692994867,
            0.33531669014019255
          ],
          [
            0.7978475990039962,
            0.3572862104061486
          ],
          [
            0.7990471184253692,
            0.3724577994056451
          ],
          [
            0.7987167837364333,
            0.3902052656819834
          ],
          [
            0.8010276442127567,
            0.41494340210755404
          ],
          [
            0.8139758374009813,
            0.42181751171773707
          ],
          [
            0.8289302840828896,
            0.4139788333112007
          ],
          [
            0.8432157133306776,
            0.3982911623536745
          ],
          [
            0.8555945864745549,
            0.3790468781691904
          ],
          [
            0.8703681869166238,
            0.35416107817034437
          ],
          [
            0.8762572633368629,
            0.3261536791547284
          ],
          [
            0.8799612441233226,
            0.29684960659807913
          ],
          [
            0.8832967132329941,
            0.27114754377961586
          ],
          [
            0.7954250408070428,
            0.25150088304965923
          ],
          [
            0.7950253513242517,
            0.24006698029149134
          ],
          [
            0.7972715487437589,
            0.24401342089076092
          ],
          [
            0.8003199138811656,
            0.23764300020517684
          ],
          [
            0.8019334831408091,
            0.2345869531082168
          ],
          [
            0.8065075384719032,
            0.22764517700016554
          ],
          [
            0.8123127784047808,
            0.22401803322657676
          ],
          [
            0.8153219291142054,
            0.22407903032740434
          ],
          [
            0.8219460874795914,
            0.2242820610489552
          ],
          [
            0.8281187632254191,
            0.23745869732896163
          ],
          [
            0.8018435211053916,
            0.251866718437165
          ],
          [
            0.7952415898442269,
            0.27115603778093056
          ],
          [
            0.7880564918475492,
            0.28645632160706896
          ],
          [
            0.784558218451483,
            0.3025558445611141
          ],
          [
            0.7943225998963628,
            0.3251825168006318
          ],
          [
            0.7940220516707216,
            0.32327781730624544
          ],
          [
            0.7968203452016626,
            0.32162190639658467
          ],
          [
            0.7996008930461748,
            0.31729313313204577
          ],
          [
            0.8053073557359832,
            0.31659708006002596
          ],
          [
            0.7991645493677685,
            0.26362556135697124
          ],
          [
            0.7985533636595521,
            0.2612857138183425
          ],
          [
            0.7997776400830064,
            0.26120634130185566
          ],
          [
            0.7985700779727527,
            0.25687519471341996
          ],
          [
            0.7996033036283084,
            0.2591786037001903
          ],
          [
            0.8005286880901881,
            0.2618042672452421
          ],
          [
            0.8146836466022901,
            0.2590718130471068
          ],
          [
            0.8146852927548546,
            0.25246836050612664
          ],
          [
            0.8189781027180809,
            0.25568850599823345
          ],
          [
            0.8231350585818291,
            0.255723989867171
          ],
          [
            0.821257842012814,
            0.2561685509065677
          ],
          [
            0.815018624493054,
            0.25521218167660953
          ],
          [
            0.7964170843362808,
            0.3553689751220067
          ],
          [
            0.7954713393534932,
            0.35279647046333407
          ],
          [
            0.792943103824343,
            0.3419584459875214
          ],
          [
            0.7935908871037619,
            0.3394282328900164
          ],
          [
            0.7964521267584392,
            0.3393768763022356
          ],
          [
            0.8057170212268829,
            0.34182637854271053
          ],
          [
            0.8130016103386879,
            0.35264227578820756
          ],
          [
            0.8092212351305145,
            0.36051191447264513
          ],
          [
            0.8041564362389702,
            0.3679979312237566
          ],
          [
            0.796001347899437,
            0.3684470783100818
          ],
          [
            0.7969782909112317,
            0.3622654082524516
          ],
          [
            0.7997161641716957,
            0.3589080828546586
          ],
          [
            0.797771224805287,
            0.3553070188771231
          ],
          [
            0.7977656392114503,
            0.3532159063895983
          ],
          [
            0.7952824746923788,
            0.34903137946881413
          ],
          [
            0.8053980275988579,
            0.34706334077764944
          ],
          [
            0.8135300900254931,
            0.3534917651423794
          ],
          [
            0.8068225845694542,
            0.3591074242174451
          ],
          [
            0.7979608923196793,
            0.3577668352620515
          ],
          [
            0.7990148061088154,
            0.35383511194762285
          ]
        ],
        "visibility": [
          0.9943127632141113,
          0.9999972581863403,
          0.0779980719089508,
          0.0003839749551843852,
          0.0028502170462161303,
          0.0009082616888917983,
          1.868053089992827e-08,
          1.7194097381434403e-05,
          0.9998815059661865,
          0.9976582527160645,
          0.9784646034240723,
          1.4813892448728438e-05,
          8.903167326934636e-05,
          0.03451037406921387,
          1.1842695357699995e-06,
          0.9805924892425537,
          0.026906762272119522,
          0.16858486831188202,
          1.955074537818291e-07,
          1.8178188121442673e-11,
          3.921488784738858e-13,
          4.804355630233341e-15,
          0.0033058864064514637,
          1.7299170429474486e-10,
          5.362716022118408e-14,
          7.542690916295669e-10,
          1.433662987437856e-06,
          2.3829286419640994e-06,
          0.032682523131370544
        ],
        "headpose": {
          "pitch": 12.775529040597643,
          "yaw": 69.58682786792532,
          "roll": 14.06510034552096
        },
        "attributes": {
          "5 oClock Shadow": 0.05299906060099602,
          "Arched Eyebrows": 0.00014359028136823326,
          "Attractive": 0.061618655920028687,
          "Bags Under Eyes": 0.07894249260425568,
          "Bald": 6.030516885857651e-08,
          "Bangs": 0.19573266804218292,
          "Big Lips": 0.0443936288356781,
          "Big Nose": 0.023909403011202812,
          "Black Hair": 0.20779690146446228,
          "Blond Hair": 0.0014096373924985528,
          "Blurry": 0.11272378265857697,
          "Brown Hair": 0.1485167145729065,
          "Bushy Eyebrows": 0.005524937529116869,
          "Chubby": 0.000827325158752501,
          "Double Chin": 0.0002339356578886509,
          "Eyeglasses": 0.008172346279025078,
          "Goatee": 0.0010452962014824152,
          "Gray Hair": 0.000318746839184314,
          "Heavy Makeup": 0.00035086917341686785,
          "High Cheekbones": 0.13420136272907257,
          "Male": 0.9927206039428711,
          "Mouth Slightly Open": 0.8735359907150269,
          "Mustache": 0.0002503824362065643,
          "Narrow Eyes": 0.23874416947364807,
          "No Beard": 0.9539397954940796,
          "Oval Face": 0.0354958139359951,
          "Pale Skin": 0.001023563090711832,
          "Pointy Nose": 0.2143738865852356,
          "Receding Hairline": 5.78424078412354e-05,
          "Rosy Cheeks": 0.0001887691905722022,
          "Sideburns": 0.0004908028640784323,
          "Smiling": 0.23414164781570435,
          "Straight Hair": 0.009007390588521957,
          "Wavy Hair": 0.655899703502655,
          "Wearing Earrings": 0.0059061311185359955,
          "Wearing Hat": 0.0031525567173957825,
          "Wearing Lipstick": 0.0005551585927605629,
          "Wearing Necklace": 0.012500991113483906,
          "Wearing Necktie": 0.005174631252884865,
          "Young": 0.9601362943649292
        },
        "age": [
          0.0022754904348403215,
          0.7531953454017639,
          0.9892324209213257,
          0.7620033025741577,
          0.30541083216667175,
          0.002486814744770527,
          3.247923814342357e-05,
          1.2407221561261395e-07
        ],
        "race": [
          0.9565218687057495,
          0.008531203493475914,
          0.1400669366121292,
          0.4326555132865906,
          0.7931320071220398
        ],
        "gender": [
          0.959465503692627,
          0.05578799173235893
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 1.809197020795571e-07,
          "disgust": 5.873358181582475e-15,
          "fear": 1.6984822189001885e-06,
          "happy": 1.725186188083531e-05,
          "sad": 99.99997615814493,
          "surprise": 6.952421779468394e-14,
          "neutral": 1.3640069217622753e-09
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 75,
          "h": 114,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 32,
        "gender": {
          "Woman": 9.3674436211586,
          "Man": 90.63255786895752
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 0.01940579677466303,
          "indian": 0.013815733836963773,
          "black": 0.0017659669538261369,
          "white": 97.80684113502502,
          "middle eastern": 0.598128093406558,
          "latino hispanic": 1.5600426122546196
        },
        "dominant_race": "white"
      },
      "hoi": [
        {
          "relationship": {
            "action": [
              [
                "body",
                "sit on"
              ]
            ],
            "negative_action": [
              "carry",
              "hold",
              "lie on",
              "stand on",
              "no interaction"
            ],
            "position": "body"
          },
          "object": 0
        }
      ]
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.3132610023021698,
        0.17779360711574554,
        0.9552232623100281,
        0.991605818271637
      ]
    ],
    "face_boxes": [
      [
        0.7891994118690491,
        0.22221481800079346,
        0.8684597015380859,
        0.3973046541213989
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.8622480283698273,
            0.4694860319688754
          ],
          [
            0.8204150035873884,
            0.45220648338751857
          ],
          [
            0.7228046124283638,
            0.580278431696398
          ],
          [
            0.5819667623274857,
            0.5924757601067677
          ],
          [
            0.9040810531522665,
            0.4867655805502322
          ],
          [
            0.848303686775681,
            0.7103832680736726
          ],
          [
            0.683760455964754,
            0.7083503800052776
          ],
          [
            0.7409322565007541,
            0.7652712459203352
          ],
          [
            0.5220060934726563,
            0.8120276714934184
          ],
          [
            0.4048736240818268,
            0.9705929408282215
          ],
          [
            0.7981040570367541,
            0.8181263356986029
          ],
          [
            0.5136394885161686,
            0.7612054697835455
          ],
          [
            0.4034791899224123,
            0.9421325078706927
          ],
          [
            0.8036817936744127,
            0.2895754379159256
          ],
          [
            0.8190205694279736,
            0.29364121405271537
          ],
          [
            0.8580647258915836,
            0.324134535078639
          ],
          [
            0.8803756724422177,
            0.33023319928382383
          ]
        ],
        "dw_hand_1": [
          [
            0.676788285167681,
            0.7063174919368829
          ],
          [
            0.6628439435735345,
            0.7164819322788571
          ],
          [
            0.6461107336605588,
            0.7266463726208319
          ],
          [
            0.6349552603852417,
            0.744942365236386
          ],
          [
            0.6293775237475832,
            0.7652712459203352
          ],
          [
            0.6265886554287541,
            0.7408765890995962
          ],
          [
            0.6196164846316808,
            0.7673041339887303
          ],
          [
            0.6210109187910955,
            0.7856001266042846
          ],
          [
            0.6251942212693393,
            0.8038961192198387
          ],
          [
            0.6307719579069978,
            0.7490081413731761
          ],
          [
            0.6237997871099246,
            0.77543568626231
          ],
          [
            0.6265886554287541,
            0.7957645669462589
          ],
          [
            0.6321663920664126,
            0.8140605595618131
          ],
          [
            0.637744128704071,
            0.7530739175099657
          ],
          [
            0.6321663920664126,
            0.7795014623990997
          ],
          [
            0.6349552603852417,
            0.7998303430830487
          ],
          [
            0.6405329970229003,
            0.8140605595618131
          ],
          [
            0.648899601979388,
            0.7591725817151505
          ],
          [
            0.6447162995011443,
            0.7795014623990997
          ],
          [
            0.6475051678199735,
            0.7957645669462589
          ],
          [
            0.6502940361388028,
            0.8079618953566283
          ]
        ],
        "dw_hand_2": [
          [
            0.5708112890521686,
            0.6006073123803474
          ],
          [
            0.5540780791391928,
            0.5924757601067677
          ],
          [
            0.5373448692262173,
            0.5863770959015832
          ],
          [
            0.5247949617914855,
            0.5924757601067677
          ],
          [
            0.5150339226755831,
            0.6006073123803474
          ],
          [
            0.5234005276320708,
            0.5843442078331881
          ],
          [
            0.5094561860379245,
            0.5884099839699777
          ],
          [
            0.5024840152408514,
            0.6006073123803474
          ],
          [
            0.4955118444437783,
            0.610771752722322
          ],
          [
            0.5261893959509003,
            0.5945086481751625
          ],
          [
            0.5122450543567538,
            0.6026402004487423
          ],
          [
            0.5066673177190953,
            0.6128046407907167
          ],
          [
            0.5010895810814369,
            0.6229690811326916
          ],
          [
            0.5317671325885588,
            0.6046730885171374
          ],
          [
            0.5206116593132417,
            0.610771752722322
          ],
          [
            0.5164283568349977,
            0.6229690811326916
          ],
          [
            0.5136394885161686,
            0.6290677453378761
          ],
          [
            0.538739303385632,
            0.6148375288591117
          ],
          [
            0.5317671325885588,
            0.6189033049959015
          ],
          [
            0.5289782642697294,
            0.6270348572694812
          ],
          [
            0.5261893959509003,
            0.633133521474666
          ]
        ],
        "dw_face": [
          [
            0.8036817936744127,
            0.2855096617791358
          ],
          [
            0.8008929253555834,
            0.301772766326295
          ],
          [
            0.7981040570367541,
            0.3180358708734543
          ],
          [
            0.7967096228773395,
            0.33429897542061365
          ],
          [
            0.7981040570367541,
            0.35056207996777305
          ],
          [
            0.7981040570367541,
            0.3668251845149323
          ],
          [
            0.7981040570367541,
            0.3830882890620916
          ],
          [
            0.8036817936744127,
            0.3952856174724611
          ],
          [
            0.8148372669497299,
            0.3973185055408559
          ],
          [
            0.8245983060656321,
            0.39325272940406636
          ],
          [
            0.8357537793409493,
            0.38715406519888124
          ],
          [
            0.8455148184568518,
            0.37902251292530165
          ],
          [
            0.8552758575727543,
            0.3688580725833273
          ],
          [
            0.8608535942104127,
            0.35462785610456277
          ],
          [
            0.8664313308480713,
            0.34039763962579844
          ],
          [
            0.8692201991669005,
            0.32616742314703406
          ],
          [
            0.8734035016451445,
            0.3099043185998747
          ],
          [
            0.8036817936744127,
            0.27534522143716117
          ],
          [
            0.8050762278338274,
            0.2773781095055562
          ],
          [
            0.8050762278338274,
            0.2773781095055562
          ],
          [
            0.8050762278338274,
            0.2773781095055562
          ],
          [
            0.8050762278338274,
            0.2773781095055562
          ],
          [
            0.8092595303120712,
            0.2773781095055562
          ],
          [
            0.8148372669497299,
            0.2773781095055562
          ],
          [
            0.8190205694279736,
            0.279410997573951
          ],
          [
            0.8245983060656321,
            0.2814438856423459
          ],
          [
            0.8287816085438762,
            0.2855096617791358
          ],
          [
            0.8050762278338274,
            0.2895754379159256
          ],
          [
            0.7981040570367541,
            0.2977069901895052
          ],
          [
            0.7939207545585102,
            0.3058385424630848
          ],
          [
            0.7883430179208517,
            0.3160029828050594
          ],
          [
            0.7897374520802665,
            0.324134535078639
          ],
          [
            0.7925263203990957,
            0.3282003112154289
          ],
          [
            0.7981040570367541,
            0.33023319928382383
          ],
          [
            0.8008929253555834,
            0.33023319928382383
          ],
          [
            0.8050762278338274,
            0.3282003112154289
          ],
          [
            0.8036817936744127,
            0.2895754379159256
          ],
          [
            0.8036817936744127,
            0.2895754379159256
          ],
          [
            0.8036817936744127,
            0.2895754379159256
          ],
          [
            0.8036817936744127,
            0.2895754379159256
          ],
          [
            0.8036817936744127,
            0.2895754379159256
          ],
          [
            0.8036817936744127,
            0.2895754379159256
          ],
          [
            0.8148372669497299,
            0.29364121405271537
          ],
          [
            0.8176261352685591,
            0.2916083259843205
          ],
          [
            0.8204150035873884,
            0.29364121405271537
          ],
          [
            0.8245983060656321,
            0.29567410212111045
          ],
          [
            0.8204150035873884,
            0.2977069901895052
          ],
          [
            0.8162317011091444,
            0.2977069901895052
          ],
          [
            0.7981040570367541,
            0.35056207996777305
          ],
          [
            0.7967096228773395,
            0.3464963038309832
          ],
          [
            0.7967096228773395,
            0.34243052769419324
          ],
          [
            0.7967096228773395,
            0.34243052769419324
          ],
          [
            0.7981040570367541,
            0.34243052769419324
          ],
          [
            0.8078650961526567,
            0.3464963038309832
          ],
          [
            0.8162317011091444,
            0.35259496803616786
          ],
          [
            0.8106539644714859,
            0.3586936322413527
          ],
          [
            0.8050762278338274,
            0.36275940837814247
          ],
          [
            0.7981040570367541,
            0.3647922964465374
          ],
          [
            0.7967096228773395,
            0.36072652030974744
          ],
          [
            0.7967096228773395,
            0.35462785610456277
          ],
          [
            0.7981040570367541,
            0.35056207996777305
          ],
          [
            0.7981040570367541,
            0.34852919189937803
          ],
          [
            0.7994984911961687,
            0.3464963038309832
          ],
          [
            0.8078650961526567,
            0.34852919189937803
          ],
          [
            0.8148372669497299,
            0.35259496803616786
          ],
          [
            0.8078650961526567,
            0.3566607441729576
          ],
          [
            0.7994984911961687,
            0.3566607441729576
          ],
          [
            0.7981040570367541,
            0.35462785610456277
          ]
        ],
        "dw_foot_1": [
          [
            0.32539087699519265,
            0.9340009555971133
          ],
          [
            0.33794078442992437,
            0.954329836281062
          ],
          [
            0.4034791899224123,
            0.9665271646914317
          ]
        ],
        "dw_foot_2": [
          [
            0.323996442835778,
            0.9421325078706927
          ],
          [
            0.33515191611109507,
            0.9400996198022978
          ],
          [
            0.4034791899224123,
            0.9929547095805655
          ]
        ]
      }
    ]
  },
  "objects": [
    {
      "name": "chair",
      "possible_names": [
        "chair"
      ],
      "box": [
        0.61875,
        0.5785876993166287,
        0.9453125,
        0.9977220956719818
      ]
    }
  ],
  "scene": "A man sits on a wooden chair in front of tables draped with white cloths displaying an array of glassware and vases under a tented area with a mix of natural light and shadows creating a serene outdoor setting for what appears to be an art or craft fair showcasing intricate designs and craftsmanship in various glass pieces and decorative items arranged neatly for display and sale amidst a calm environment with soft beige tones and greenery peeking from the sides adding to the aesthetic appeal of the scene",
  "overall_past": "Before the current scene, the individual likely arrived at the venue earlier to oversee the setup of the display area, coordinating the arrangement of tables, positioning the glassware and decorative items with care, and ensuring the white cloths were properly draped to create a clean, cohesive aesthetic. They may have inspected each piece for quality and placement, possibly adjusting the lighting or greenery to enhance the serene atmosphere. This preparation suggests a deliberate effort to create an inviting and professional environment for the art fair, indicating that the individual is responsible for the event’s presentation and is now taking a moment to review the final details, perhaps jotting down observations or next steps for the day’s activities.",
  "overall_past_clean": "The individual arrived early to meticulously supervise the assembly of the display, ensuring every element was precisely positioned to achieve a harmonious and polished presentation, while making real-time adjustments to lighting, layout, and decorative accents to optimize the overall ambiance.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to rise from the chair, walk toward one of the display tables, and carefully adjust the placement of a glass vase to enhance its visual impact, ensuring it aligns perfectly with the overall aesthetic of the fair. This action would reflect a continued commitment to detail and presentation, possibly in preparation for an upcoming visitor or during a final walkthrough before the event opens to the public.",
  "overall_future_clean": "The individual strides purposefully forward, their hands moving with precision to reposition the display, aligning it flawlessly within the composition before stepping back to assess the final arrangement with unwavering focus.",
  "future_scene_ok": true
}