{
  "image_path": "./ref_datasets/hico_det/images/train/train_00023440.jpg",
  "image_id": "train_00023440",
  "width": 640,
  "height": 508,
  "split": "train",
  "source": "zhimeng/hico_det",
  "dataset_index": 23440,
  "annotations": {
    "objects": "[{'id': 384, 'bbox_human': [31, 493, 132, 364], 'bbox_object': [75, 287, 82, 283], 'connection': 1, 'invis': 0}, {'id': 386, 'bbox_human': [28, 499, 129, 362], 'bbox_object': [78, 282, 82, 277], 'connection': 1, 'invis': 0}, {'id': 388, 'bbox_human': [29, 491, 124, 355], 'bbox_object': [86, 280, 82, 273], 'connection': 1, 'invis': 0}]",
    "positive_captions": "[('laptop', 'hold'), ('laptop', 'read'), ('laptop', 'type_on')]",
    "negative_captions": "[('laptop', 'open'), ('laptop', 'repair'), ('laptop', 'no_interaction')]",
    "ambiguous_captions": "[]",
    "positive_objects": "[383, 385, 387]",
    "negative_objects": "[384, 386, 388]",
    "ambiguous_objects": "[]",
    "size": "[640, 508, 3]"
  },
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a black and white checkered dress over a black shirt.",
        "clothing": [
          {
            "possible_names": [
              "dress",
              "gown"
            ],
            "name": "dress",
            "type": "whole body",
            "color": [
              "black",
              "white"
            ]
          },
          {
            "possible_names": [
              "shirt",
              "t-shirt"
            ],
            "name": "shirt",
            "type": "top",
            "color": [
              "black"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "laptop",
              "computer"
            ],
            "name": "laptop",
            "position": "body"
          }
        ],
        "description": "The person is an adult female in the foreground, sitting on a couch with a neutral expression. She is wearing a black and white checkered dress over a black shirt. She is using a laptop that is resting on her lap. The scene appears casual and relaxed, with the person possibly engaged in leisure activities such as browsing or working on the laptop.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears calm and focused, possibly engaged in work or study on the laptop.",
        "meaningful": true,
        "story": "A young adult female is relaxing on a couch while working or browsing on her laptop. The setting suggests a casual home environment, indicating she might be spending leisure time productively.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "Sophie is lying on a bed covered with a colorful floral blanket, using a laptop placed on her lap while wearing a black and white checkered dress over a black top. Her posture suggests she is relaxed and engaged in whatever activity she is doing on the computer, possibly working, studying, or browsing the internet. The room around her appears to be a personal space with various items like books, a speaker, and other objects indicating a lived-in environment. Her expression seems calm and focused, suggesting she is comfortable and absorbed in her task, perhaps enjoying some leisure time or completing an important project. The handwritten date at the bottom indicates this moment was captured on August 24, 2010, adding a nostalgic element to the scene.",
        "intention": "The individual is engaged in a focused and relaxed activity on the laptop likely balancing productivity with personal comfort in a familiar environment",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.6307442584208081,
            0.30479397883699505
          ],
          [
            0.6234794884920121,
            0.3204647177920433
          ],
          [
            0.6151848350252423,
            0.3356545713004165
          ],
          [
            0.6095285368817194,
            0.3522618549076591
          ],
          [
            0.603874762569155,
            0.3704816875361216
          ],
          [
            0.6031332848327501,
            0.38923822398663105
          ],
          [
            0.6051622816494533,
            0.4040750655334095
          ],
          [
            0.6067272228854044,
            0.4206771713810375
          ],
          [
            0.614043310710362,
            0.4389793655601476
          ],
          [
            0.6249187086309705,
            0.4511931851690612
          ],
          [
            0.6395693370274136,
            0.45705970950818575
          ],
          [
            0.6564792313746043,
            0.4608629170901596
          ],
          [
            0.6726147745336805,
            0.4613032147908506
          ],
          [
            0.6884777716227941,
            0.45246915527618375
          ],
          [
            0.7002597672598703,
            0.44066046059332764
          ],
          [
            0.7117624146597726,
            0.4273951386171734
          ],
          [
            0.7217329527650561,
            0.4107500074684821
          ],
          [
            0.6349928953817913,
            0.29725971284947866
          ],
          [
            0.6435113395963397,
            0.2942204947412617
          ],
          [
            0.6479063753570828,
            0.30345525804601187
          ],
          [
            0.6528831375496729,
            0.31478969694122555
          ],
          [
            0.6575510071856635,
            0.32548138609887245
          ],
          [
            0.6769032835960388,
            0.3493265968876293
          ],
          [
            0.6868402148996081,
            0.3546560983958207
          ],
          [
            0.6944929795605795,
            0.35903006195351567
          ],
          [
            0.7007187392030444,
            0.3666412786101866
          ],
          [
            0.7030266497816358,
            0.3836504806951946
          ],
          [
            0.6562693106276648,
            0.35186752720544257
          ],
          [
            0.6491516091993877,
            0.36040011514292525
          ],
          [
            0.6429975850241525,
            0.37019820315229074
          ],
          [
            0.6359745881387165,
            0.37788369162144353
          ],
          [
            0.6288989893027714,
            0.3802642259072131
          ],
          [
            0.6313727864197323,
            0.38266701719758217
          ],
          [
            0.6336093268224171,
            0.39005056784579406
          ],
          [
            0.6396628737449646,
            0.3948760434934876
          ],
          [
            0.6448954560926983,
            0.40150365759739054
          ],
          [
            0.6325459693159375,
            0.3194996668329657
          ],
          [
            0.6383707829884121,
            0.3197772536422592
          ],
          [
            0.6488449748073306,
            0.33104435303347984
          ],
          [
            0.6482392221689224,
            0.3441574586926215
          ],
          [
            0.6418619441134589,
            0.33929333389140626
          ],
          [
            0.6341144250971931,
            0.3268364949489203
          ],
          [
            0.6691630039896284,
            0.37043203666588315
          ],
          [
            0.6749068890299116,
            0.3683080346029172
          ],
          [
            0.6857248255184718,
            0.3796075338453758
          ],
          [
            0.6878751405647823,
            0.3885737775549443
          ],
          [
            0.6822849214076996,
            0.3879741717243087
          ],
          [
            0.6725940082754407,
            0.3782708293541478
          ],
          [
            0.6160993058766637,
            0.3890691165580792
          ],
          [
            0.6212592090879168,
            0.39625244414176125
          ],
          [
            0.6265570125409534,
            0.4004554925538826
          ],
          [
            0.6291031041315625,
            0.40408177289973496
          ],
          [
            0.6313411112342562,
            0.4058736867121556
          ],
          [
            0.6384882573570524,
            0.4187614821207671
          ],
          [
            0.6470753874097552,
            0.4278208273468189
          ],
          [
            0.6376307193722044,
            0.4231495393274605
          ],
          [
            0.6296930496181761,
            0.421757891690369
          ],
          [
            0.6226319351366588,
            0.4136679408520762
          ],
          [
            0.6189018928578922,
            0.40661534147402034
          ],
          [
            0.6180512317589352,
            0.3978522000886726
          ],
          [
            0.6175254613161087,
            0.3917684225183236
          ],
          [
            0.6224214443138668,
            0.4010415036981366
          ],
          [
            0.6265656633036477,
            0.4088786031853898
          ],
          [
            0.6354702647243228,
            0.4209490487492393
          ],
          [
            0.6448636093309947,
            0.42629913860016383
          ],
          [
            0.6357422019754138,
            0.4178087743516714
          ],
          [
            0.627410255585398,
            0.40737055820340645
          ],
          [
            0.6215730552162443,
            0.3983303371510972
          ]
        ],
        "visibility": [
          1.0,
          0.9970099925994873,
          0.005605306010693312,
          1.2744196323244417e-11,
          0.9998629093170166,
          0.9696642160415649,
          1.4135568271456123e-08,
          4.948695533218972e-13,
          0.0003347942838445306,
          4.7175923513801885e-14,
          5.094051402920741e-07,
          1.6908034012885764e-06,
          7.427770086722481e-16,
          1.2869694501205231e-06,
          2.0949880719101088e-11,
          5.14994358269405e-09,
          5.717421978565507e-13,
          3.5686787726307845e-12,
          5.838745285868807e-13,
          8.74564396596833e-12,
          2.729362513775868e-08,
          2.3445919684894623e-12,
          2.13571388485434e-06,
          1.0971795642703876e-15,
          6.172297984651055e-17,
          3.6425553400817716e-17,
          3.64321029941439e-12,
          1.3690494293783217e-09,
          2.9692704810823465e-18
        ],
        "headpose": {
          "pitch": -2.0354943431897072,
          "yaw": 16.451921050039317,
          "roll": 34.54079597241516
        },
        "attributes": {
          "5 oClock Shadow": 8.993822848424315e-05,
          "Arched Eyebrows": 0.22362017631530762,
          "Attractive": 0.28949281573295593,
          "Bags Under Eyes": 0.0219663605093956,
          "Bald": 9.732798207551241e-05,
          "Bangs": 0.0002137366682291031,
          "Big Lips": 0.09102418273687363,
          "Big Nose": 0.08119365572929382,
          "Black Hair": 0.44762128591537476,
          "Blond Hair": 0.0012410890776664019,
          "Blurry": 0.006889356765896082,
          "Brown Hair": 0.03589710593223572,
          "Bushy Eyebrows": 0.000734178873244673,
          "Chubby": 0.10807636380195618,
          "Double Chin": 0.009783169254660606,
          "Eyeglasses": 0.00022401296882890165,
          "Goatee": 1.4192608432495035e-05,
          "Gray Hair": 0.0002787329431157559,
          "Heavy Makeup": 0.3458940088748932,
          "High Cheekbones": 0.41308948397636414,
          "Male": 0.002812801394611597,
          "Mouth Slightly Open": 0.00035653801751323044,
          "Mustache": 1.877438262454234e-05,
          "Narrow Eyes": 0.003393033752217889,
          "No Beard": 0.9998145699501038,
          "Oval Face": 0.4536550045013428,
          "Pale Skin": 0.017752772197127342,
          "Pointy Nose": 0.0733303353190422,
          "Receding Hairline": 0.11908258497714996,
          "Rosy Cheeks": 0.004592232871800661,
          "Sideburns": 5.203777618589811e-06,
          "Smiling": 0.2311110943555832,
          "Straight Hair": 0.17882443964481354,
          "Wavy Hair": 0.052164990454912186,
          "Wearing Earrings": 0.016636528074741364,
          "Wearing Hat": 0.00030269825947470963,
          "Wearing Lipstick": 0.6676444411277771,
          "Wearing Necklace": 0.015716133639216423,
          "Wearing Necktie": 0.0014190598158165812,
          "Young": 0.8792067170143127
        },
        "age": [
          0.34441807866096497,
          0.28532615303993225,
          0.07484234869480133,
          0.3936270475387573,
          0.7489165663719177,
          0.4979988932609558,
          0.0366266630589962,
          0.0007002651691436768
        ],
        "race": [
          0.3801364302635193,
          0.009356159716844559,
          0.8902987241744995,
          0.3841741383075714,
          0.9436519145965576
        ],
        "gender": [
          0.0031791755463927984,
          0.9973520040512085
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 5.714575479487394e-07,
          "disgust": 4.929963162421218e-12,
          "fear": 0.0003047807240363909,
          "happy": 4.185409843921661,
          "sad": 0.025645954883657396,
          "surprise": 5.834662530901369e-06,
          "neutral": 95.78863382339478
        },
        "dominant_emotion": "neutral",
        "region": {
          "x": 0,
          "y": 0,
          "w": 103,
          "h": 121,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 34,
        "gender": {
          "Woman": 98.62731099128723,
          "Man": 1.3726907782256603
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 0.0020222812963766046,
          "indian": 0.0007084096978360321,
          "black": 1.1664373289477226e-05,
          "white": 99.50154423713684,
          "middle eastern": 0.28731299098581076,
          "latino hispanic": 0.2084019361063838
        },
        "dominant_race": "white"
      },
      "hoi": [
        {
          "relationship": {
            "action": [
              [
                "thigh",
                "hold"
              ],
              [
                "thigh",
                "read"
              ],
              [
                "thigh",
                "type on"
              ]
            ],
            "negative_action": [
              "open",
              "repair",
              "no interaction"
            ],
            "position": "thigh"
          },
          "object": 0
        }
      ]
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.04263598844408989,
        0.25776147842407227,
        0.7647799253463745,
        0.767978310585022
      ]
    ],
    "face_boxes": [
      [
        0.6021604537963867,
        0.29282698035240173,
        0.710601806640625,
        0.4538087546825409
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.616919193810059,
            0.4778240017221355
          ],
          [
            0.546949101280835,
            0.42929126480015756
          ],
          [
            0.4243048941509592,
            0.4510814732141069
          ],
          [
            0.3488315359171894,
            0.4451386891012118
          ],
          [
            0.686889286339283,
            0.5263567386441135
          ],
          [
            0.5579556326899263,
            0.6511552050149139
          ],
          [
            0.4714757430470652,
            0.4946618900420055
          ],
          [
            0.47304810467693537,
            0.6769072695041267
          ],
          [
            0.2859370707223813,
            0.5342804507946406
          ],
          [
            0.20574662759900092,
            0.46098611340226553
          ],
          [
            0.5689621640990177,
            0.730392326520184
          ],
          [
            0.5658174408392774,
            0.762087175122292
          ],
          [
            0.322101388209396,
            0.7898201676491364
          ],
          [
            0.6381460758133066,
            0.3441113591819923
          ],
          [
            0.6774551165600619,
            0.37382527974646873
          ],
          [
            0.6145606513652536,
            0.3441113591819923
          ],
          [
            0.7089023491574657,
            0.42136755264963066
          ]
        ],
        "dw_hand_1": [
          [
            0.4651862965275845,
            0.49070003396674194
          ],
          [
            0.4447455953392717,
            0.4847572498538469
          ],
          [
            0.42587725578082924,
            0.4788144657409513
          ],
          [
            0.4085812778522572,
            0.4807953937785833
          ],
          [
            0.3928576615535551,
            0.48871910592911016
          ],
          [
            0.4054365545925167,
            0.4550433292893704
          ],
          [
            0.38499585340420417,
            0.45900518536463397
          ],
          [
            0.37084459873537234,
            0.4728716816280562
          ],
          [
            0.36298279058602123,
            0.4847572498538469
          ],
          [
            0.40700891622238694,
            0.4570242573270022
          ],
          [
            0.38656821503407424,
            0.46296704143989753
          ],
          [
            0.3755616836249828,
            0.4788144657409513
          ],
          [
            0.37084459873537234,
            0.4926809620043737
          ],
          [
            0.41329836274186765,
            0.4649479694775291
          ],
          [
            0.3944300231834251,
            0.4728716816280562
          ],
          [
            0.38656821503407424,
            0.48673817789147844
          ],
          [
            0.38342349177433377,
            0.49664281807963706
          ],
          [
            0.422732532521089,
            0.4788144657409513
          ],
          [
            0.4085812778522572,
            0.48673817789147844
          ],
          [
            0.399147108073036,
            0.49664281807963706
          ],
          [
            0.3944300231834251,
            0.5025856021925327
          ]
        ],
        "dw_hand_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_face": [
          [
            0.6239948211444748,
            0.3302448629185701
          ],
          [
            0.6161330129951239,
            0.3460922872196241
          ],
          [
            0.609843566475643,
            0.36193971152067805
          ],
          [
            0.6051264815860324,
            0.3758062077841003
          ],
          [
            0.6004093966964218,
            0.39165363208515447
          ],
          [
            0.6004093966964218,
            0.40948198442384026
          ],
          [
            0.6019817583262921,
            0.425329408724894
          ],
          [
            0.609843566475643,
            0.43919590498831645
          ],
          [
            0.6208500978847346,
            0.44910054517647535
          ],
          [
            0.6334289909236961,
            0.4550433292893704
          ],
          [
            0.6460078839626577,
            0.4570242573270022
          ],
          [
            0.6601591386314896,
            0.4550433292893704
          ],
          [
            0.6727380316704512,
            0.4510814732141069
          ],
          [
            0.6837445630795426,
            0.44117683302594823
          ],
          [
            0.6931787328587639,
            0.42929126480015756
          ],
          [
            0.7041852642678552,
            0.41740569657436716
          ],
          [
            0.7120470724172062,
            0.4055201283485767
          ],
          [
            0.6318566292938259,
            0.32232115076804296
          ],
          [
            0.6365737141834366,
            0.32232115076804296
          ],
          [
            0.6428631607029173,
            0.3262830068433065
          ],
          [
            0.6475802455925279,
            0.33222579095620186
          ],
          [
            0.6522973304821384,
            0.3361876470314652
          ],
          [
            0.6727380316704512,
            0.35401599937015094
          ],
          [
            0.6805998398198021,
            0.3579778554454145
          ],
          [
            0.686889286339283,
            0.36392063955830983
          ],
          [
            0.6931787328587639,
            0.37184435170883673
          ],
          [
            0.6978958177483744,
            0.3817489918969956
          ],
          [
            0.6538696921120086,
            0.3579778554454145
          ],
          [
            0.6491526072223982,
            0.36392063955830983
          ],
          [
            0.6428631607029173,
            0.37184435170883673
          ],
          [
            0.6381460758133066,
            0.3777871358217323
          ],
          [
            0.6287119060340854,
            0.3837299199346274
          ],
          [
            0.6318566292938259,
            0.3876917760098909
          ],
          [
            0.6350013525535664,
            0.38967270404752247
          ],
          [
            0.6397184374431768,
            0.393634560122786
          ],
          [
            0.6444355223327876,
            0.3975964161980496
          ],
          [
            0.6302842676639557,
            0.3381685750690972
          ],
          [
            0.6381460758133066,
            0.3381685750690972
          ],
          [
            0.6444355223327876,
            0.3441113591819923
          ],
          [
            0.6460078839626577,
            0.35401599937015094
          ],
          [
            0.6397184374431768,
            0.35203507133251943
          ],
          [
            0.6334289909236961,
            0.3460922872196241
          ],
          [
            0.6664485851509703,
            0.36986342367120517
          ],
          [
            0.6743103933003214,
            0.36986342367120517
          ],
          [
            0.6821722014496723,
            0.3758062077841003
          ],
          [
            0.686889286339283,
            0.3857108479722592
          ],
          [
            0.679027478189932,
            0.3837299199346274
          ],
          [
            0.6711656700405809,
            0.3777871358217323
          ],
          [
            0.6145606513652536,
            0.395615488160418
          ],
          [
            0.6208500978847346,
            0.3975964161980496
          ],
          [
            0.625567182774345,
            0.39957734423568136
          ],
          [
            0.6287119060340854,
            0.40155827227331314
          ],
          [
            0.6318566292938259,
            0.4055201283485767
          ],
          [
            0.6397184374431768,
            0.4134438404991038
          ],
          [
            0.6460078839626577,
            0.42334848068726244
          ],
          [
            0.6381460758133066,
            0.42334848068726244
          ],
          [
            0.6302842676639557,
            0.42136755264963066
          ],
          [
            0.6224224595146047,
            0.4154247685367354
          ],
          [
            0.6192777362548643,
            0.4114629124614718
          ],
          [
            0.6161330129951239,
            0.4035392003109449
          ],
          [
            0.6161330129951239,
            0.3975964161980496
          ],
          [
            0.6224224595146047,
            0.4035392003109449
          ],
          [
            0.6271395444042153,
            0.40750105638620826
          ],
          [
            0.6365737141834366,
            0.4154247685367354
          ],
          [
            0.6444355223327876,
            0.42136755264963066
          ],
          [
            0.6350013525535664,
            0.41740569657436716
          ],
          [
            0.625567182774345,
            0.40948198442384026
          ],
          [
            0.6208500978847346,
            0.4035392003109449
          ]
        ],
        "dw_foot_1": [
          [
            0.23404913693666457,
            0.7264304704449205
          ],
          [
            0.252917476495107,
            0.7799155274609777
          ],
          [
            0.30795013354056416,
            0.7977438797996635
          ]
        ],
        "dw_foot_2": [
          [
            0.1098325681769186,
            0.4134438404991038
          ],
          [
            0.1224114612158802,
            0.4055201283485767
          ],
          [
            0.20574662759900092,
            0.48871910592911016
          ]
        ]
      }
    ]
  },
  "objects": [
    {
      "name": "laptop",
      "possible_names": [
        "laptop"
      ],
      "box": [
        0.1171875,
        0.16141732283464566,
        0.4484375,
        0.5570866141732284
      ]
    }
  ],
  "scene": "A cozy indoor setting features a person lounging on a colorful floral-patterned couch with a laptop while surrounded by various household items and furniture including a patterned curtain a desk with a computer monitor and speakers and a shelf with books and other objects creating a casual and lived-in atmosphere with warm tones and personal touches throughout the space",
  "overall_past": "Before this scene, the individual likely returned home after a day out—perhaps running errands, meeting a friend, or attending a casual outing—then changed into her comfortable black and white checkered dress, signaling a transition from public or structured activities to personal downtime. She may have come in from a warm summer day, given the floral blanket and the cozy, sunlit atmosphere, and decided to settle in for a quiet moment of focused work or leisurely browsing. The laptop was probably already set up on the desk earlier, but she chose to move to the couch, drawn by its inviting comfort and the soft, warm lighting, possibly after a brief pause to grab a drink or a snack from the nearby desk area. The handwritten date suggests this moment was part of a routine or a special memory captured in the quiet rhythm of daily life.",
  "overall_past_clean": "After stepping through the door, the individual shed the day’s weight, shedding outer layers and routines, then moved with purpose through the space, pausing only to gather a drink before settling into a familiar rhythm of quiet focus, the day’s energy now channeled into a deliberate pause of stillness and intention.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to close the laptop, stretch slightly, and perhaps reach for a nearby book or drink, signaling a transition from focused activity to a more relaxed state—possibly preparing to unwind with reading or listening to music, as suggested by the presence of a speaker and books nearby. The warm, personal atmosphere implies a routine of balancing productivity with comfort, so the next moment may involve a brief pause in the day, savoring a quiet moment before continuing with evening activities.",
  "overall_future_clean": "The individual rises from the chair, closes the device with a soft click, stretches upward, then reaches for the book beside them, settling back into the seat with a deliberate calm, the faint hum of music beginning to fill the space as the room dims slightly.",
  "future_scene_ok": false
}