{
  "video_path": "./ref_datasets/part2/6894261001.mp4",
  "start_time": 0.0,
  "end_time": 4.56,
  "image_path": "./022793.jpg",
  "represents_multiple_types": false,
  "cross_video_duplicate": false,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/6894261001.mp4",
      "start_time": 0.0,
      "end_time": 4.56,
      "image_path": "./ref_datasets/extracted_frames/person_-5349479225449459111_1_6894261001.mp4_0.00_4.56.jpg",
      "type": "person"
    }
  ],
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "male",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a light beige zip-up jacket over a black turtleneck sweater. The jacket appears to be made of a soft material, possibly fleece or a similar fabric. The person also has on glasses with thin frames.",
        "clothing": [
          {
            "possible_names": [
              "light beige zip-up jacket",
              "beige fleece jacket"
            ],
            "name": "zip up jacket",
            "type": "top",
            "color": [
              "light beige"
            ]
          },
          {
            "possible_names": [
              "black turtleneck sweater",
              "black high-neck sweater"
            ],
            "name": "turtleneck sweater",
            "type": "top",
            "color": [
              "black"
            ]
          },
          {
            "possible_names": [
              "glasses",
              "eyeglasses"
            ],
            "name": "glasses",
            "type": "accessory",
            "color": [
              "silver"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "hand",
              "fingers"
            ],
            "name": "hand",
            "position": "head"
          }
        ],
        "description": "The person is an adult male who appears to be in a neutral emotional state. He is wearing a light beige zip-up jacket over a black turtleneck sweater and glasses with thin frames. His hand is raised to his head, possibly adjusting his hair or glasses. The background is dark, which contrasts with his light-colored jacket.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to be in a neutral state, possibly engaged in a conversation or deep in thought, as indicated by their hand gesture near the head.",
        "meaningful": true,
        "story": "The individual seems to be involved in an intellectual discussion or perhaps reflecting on something important. The setting suggests a formal or semi-formal environment, possibly a meeting or a seminar.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is wearing a beige jacket over a black turtleneck and appears to be engaged in a thoughtful or possibly concerned action as they touch their forehead with one hand while looking downward. Their expression suggests deep contemplation or concern, perhaps indicating they are processing information or dealing with a challenging situation. The setting seems informal, and the individual's posture and gesture imply a moment of introspection or decision-making, possibly discussing or considering something important with someone out of frame.",
        "intention": "The individual is deeply processing a significant decision or challenging situation requiring careful thought and internal reflection",
        "intention_ok": true
      },
      "hoi": [
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "right hand",
            "action": [
              "adjusting hair",
              "touching head"
            ]
          },
          "object": 0,
          "deleted": true
        }
      ],
      "without_face": false,
      "facex_detailing": {
        "landmarks": [
          [
            0.3706674074133237,
            0.41322307954695253
          ],
          [
            0.40724991162618,
            0.4376299292615856
          ],
          [
            0.41688644256856705,
            0.46056483216276733
          ],
          [
            0.430029731326633,
            0.4761748880403507
          ],
          [
            0.44153517815801835,
            0.49096170134485523
          ],
          [
            0.46385164161523185,
            0.5034716567143415
          ],
          [
            0.48980570071273377,
            0.5243667158913947
          ],
          [
            0.5120170540279813,
            0.534470668249962
          ],
          [
            0.5233391894234551,
            0.538796363777507
          ],
          [
            0.5549253437254164,
            0.5260914305068788
          ],
          [
            0.5795324398411645,
            0.4965919546192347
          ],
          [
            0.6087924586402045,
            0.4687240695733951
          ],
          [
            0.6240965876314375,
            0.44032411414742645
          ],
          [
            0.6207145174344381,
            0.4028803829467588
          ],
          [
            0.6203240268760257,
            0.36840908515156623
          ],
          [
            0.6030768944157494,
            0.34763437768226635
          ],
          [
            0.5996725042661031,
            0.31523935164250333
          ],
          [
            0.36107397543059455,
            0.39076421007005974
          ],
          [
            0.34220552378230623,
            0.38303721682892217
          ],
          [
            0.34134266210926906,
            0.3866507125509207
          ],
          [
            0.3499622775448693,
            0.38491717592439645
          ],
          [
            0.3622552697857221,
            0.38653555666395517
          ],
          [
            0.3673026813401116,
            0.37945103496967614
          ],
          [
            0.37816585252682366,
            0.37811712398610836
          ],
          [
            0.4041301959090763,
            0.3841341365159144
          ],
          [
            0.4136175877518124,
            0.3856450032923567
          ],
          [
            0.44488748841815523,
            0.38513098939196677
          ],
          [
            0.38557964745495055,
            0.413762184621599
          ],
          [
            0.3887343161635929,
            0.434637766631421
          ],
          [
            0.38094986610942416,
            0.45982756409727865
          ],
          [
            0.38487897879547545,
            0.4839983620022261
          ],
          [
            0.4251772595776452,
            0.4828114005168395
          ],
          [
            0.4307098110516866,
            0.4809332058235732
          ],
          [
            0.4309733331203461,
            0.4825415844649008
          ],
          [
            0.43827793134583365,
            0.4830444620084972
          ],
          [
            0.44475025600857204,
            0.4763990816923396
          ],
          [
            0.37732002950376936,
            0.41253548971506077
          ],
          [
            0.3695095530814595,
            0.41399060596459286
          ],
          [
            0.3766471250189675,
            0.4149723239359908
          ],
          [
            0.3802828199333615,
            0.4091017224179778
          ],
          [
            0.3835979234841135,
            0.40546009937506594
          ],
          [
            0.38389118512471515,
            0.4068963113152265
          ],
          [
            0.41871347460481856,
            0.41430149592507515
          ],
          [
            0.4146358337667253,
            0.41871486161947497
          ],
          [
            0.427709596686893,
            0.413876836393648
          ],
          [
            0.4371613363424937,
            0.4143291649597007
          ],
          [
            0.43083295093642343,
            0.41729599581530746
          ],
          [
            0.41660643849107953,
            0.41278539322779484
          ],
          [
            0.4550574445062213,
            0.4979843200188106
          ],
          [
            0.45371515187952255,
            0.5031745497139646
          ],
          [
            0.4395602289173338,
            0.495959290398935
          ],
          [
            0.4389677319261763,
            0.499592332031108
          ],
          [
            0.44068013661437566,
            0.49579863814074887
          ],
          [
            0.4679133978154924,
            0.49713972130472056
          ],
          [
            0.4772175868352254,
            0.49167083063227335
          ],
          [
            0.4724269294076496,
            0.4957294139969775
          ],
          [
            0.46412344541814593,
            0.5105385687580121
          ],
          [
            0.45322151978810626,
            0.5153325641287393
          ],
          [
            0.45450053181913164,
            0.509304953728528
          ],
          [
            0.45131558047400583,
            0.49861629680967856
          ],
          [
            0.4539495928419961,
            0.4985541302747393
          ],
          [
            0.45241392850875856,
            0.5062925004729715
          ],
          [
            0.45551463696691724,
            0.503041211318531
          ],
          [
            0.46613574392265744,
            0.49949771882699284
          ],
          [
            0.48357700837983025,
            0.4891957180491553
          ],
          [
            0.4632567008336385,
            0.49459962372599325
          ],
          [
            0.45090161595079636,
            0.5003017592046132
          ],
          [
            0.44634079701370666,
            0.49625133333583177
          ]
        ],
        "visibility": [
          0.9999980926513672,
          0.999994158744812,
          0.9787644147872925,
          0.19692416489124298,
          0.9994543194770813,
          0.9995439648628235,
          1.2315506126014952e-07,
          0.0009536489378660917,
          0.6434676051139832,
          0.7049931287765503,
          1.5915555096057687e-08,
          0.00015148127567954361,
          0.11454549431800842,
          4.3188699144769416e-11,
          0.9999964237213135,
          1.850347253196105e-08,
          2.1945427697289688e-09,
          0.005017368122935295,
          5.016084969611256e-07,
          0.000910082075279206,
          1.9737868786363086e-16,
          2.8018425268783176e-07,
          0.6002824306488037,
          0.21752102673053741,
          0.3719486892223358,
          0.9999967813491821,
          0.008777283132076263,
          0.0009979127207770944,
          3.006840961461421e-05
        ],
        "headpose": {
          "pitch": -53.668447044901555,
          "yaw": 59.8540268667106,
          "roll": -60.964267286107
        },
        "attributes": {
          "5 oClock Shadow": 0.04560299962759018,
          "Arched Eyebrows": 0.001198723097331822,
          "Attractive": 0.11040659993886948,
          "Bags Under Eyes": 0.027125345543026924,
          "Bald": 5.960491762380116e-06,
          "Bangs": 0.007504281587898731,
          "Big Lips": 0.039190515875816345,
          "Big Nose": 0.02339419350028038,
          "Black Hair": 0.0020122334826737642,
          "Blond Hair": 0.03177189081907272,
          "Blurry": 0.03974294662475586,
          "Brown Hair": 0.3870273232460022,
          "Bushy Eyebrows": 0.0002974004892166704,
          "Chubby": 0.0002980132703669369,
          "Double Chin": 4.00067656300962e-05,
          "Eyeglasses": 0.009570665657520294,
          "Goatee": 0.03441241756081581,
          "Gray Hair": 0.0022988806013017893,
          "Heavy Makeup": 0.00032561086118221283,
          "High Cheekbones": 0.007434094790369272,
          "Male": 0.9858418107032776,
          "Mouth Slightly Open": 0.004353497643023729,
          "Mustache": 0.012211565859615803,
          "Narrow Eyes": 0.06948895007371902,
          "No Beard": 0.6114471554756165,
          "Oval Face": 0.0038751554675400257,
          "Pale Skin": 0.001287460676394403,
          "Pointy Nose": 0.526242733001709,
          "Receding Hairline": 0.004346633329987526,
          "Rosy Cheeks": 0.00018067096243612468,
          "Sideburns": 0.007134934421628714,
          "Smiling": 0.0019883615896105766,
          "Straight Hair": 0.183716282248497,
          "Wavy Hair": 0.1200522780418396,
          "Wearing Earrings": 0.009810484014451504,
          "Wearing Hat": 0.0006188797415234149,
          "Wearing Lipstick": 0.0009868508204817772,
          "Wearing Necklace": 0.005315524525940418,
          "Wearing Necktie": 0.0039186072535812855,
          "Young": 0.6233590841293335
        },
        "age": [
          0.00016171409515663981,
          0.015067014843225479,
          0.6598694324493408,
          0.6329771280288696,
          0.9867135286331177,
          0.07381264865398407,
          0.005036307033151388,
          1.5360534462161013e-06
        ],
        "race": [
          0.9998708963394165,
          2.840061642928049e-05,
          0.934303343296051,
          0.007592880167067051,
          0.05940091237425804
        ],
        "gender": [
          0.9663580060005188,
          0.05143009498715401
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 1.9762217998504639,
          "disgust": 0.009013011731440201,
          "fear": 1.037793606519699,
          "happy": 0.03313525230623782,
          "sad": 96.75306677818298,
          "surprise": 4.910749584752239e-07,
          "neutral": 0.19076861208304763
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 573,
          "h": 918,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 34,
        "gender": {
          "Woman": 5.732986330986023,
          "Man": 94.26701664924622
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 0.423925047984725,
          "indian": 17.670798918104044,
          "black": 0.33758626618519616,
          "white": 24.039846544247453,
          "middle eastern": 37.846310478009045,
          "latino hispanic": 19.68153502721012
        },
        "dominant_race": "middle eastern"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.13761954009532928,
        0.20390786230564117,
        0.9990800619125366,
        0.9312605857849121
      ]
    ],
    "face_boxes": [
      [
        0.35269320011138916,
        0.3156667947769165,
        0.618501603603363,
        0.5401063561439514
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.7908141077186849,
            0.5756292699798942
          ],
          [
            0.6049329337913126,
            0.5840073747336865
          ],
          [
            0.29920731877918716,
            0.7631699225455523
          ],
          [
            0.22338736625618003,
            0.5040931447744369
          ],
          [
            0.9766952816460571,
            0.5672511652261019
          ],
          [
            0.9815868914862511,
            0.91010899053514
          ],
          [
            0.8984295242029531,
            0.8946417202204466
          ],
          [
            0.5902581042707306,
            0.973267010986805
          ],
          [
            0.28697829417870213,
            0.9178426256924868
          ],
          [
            0.24295380561695606,
            1.090560477539897
          ],
          [
            0.869079865161789,
            0.9913121596872807
          ],
          [
            0.3530150270213212,
            0.9333098960071802
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.38481049098258224,
            0.41773421885073186
          ],
          [
            0.4288349795443283,
            0.4074227053076029
          ],
          [
            0.6342825928324767,
            0.38035498225688935
          ],
          [
            0.6367283977525736,
            0.376488164678216
          ]
        ],
        "dw_hand_1": [
          [
            0.9033211340431471,
            0.8907749026417732
          ],
          [
            0.839730206120625,
            0.8611293012052774
          ],
          [
            0.7785850831181998,
            0.8314836997687817
          ],
          [
            0.6831986912344167,
            0.8276168821901083
          ],
          [
            0.6049329337913126,
            0.8366394565403461
          ],
          [
            0.7467896191569388,
            0.8198832470327616
          ],
          [
            0.6489574223530586,
            0.8173053686469793
          ],
          [
            0.5804748845903426,
            0.8327726389616728
          ],
          [
            0.5486794206290815,
            0.8482399092763663
          ],
          [
            0.7467896191569388,
            0.8469509700834751
          ],
          [
            0.6391742026726707,
            0.8508177876621484
          ],
          [
            0.5804748845903426,
            0.8649961187839508
          ],
          [
            0.5535710304692755,
            0.876596571519971
          ],
          [
            0.7541270339172298,
            0.877885510712862
          ],
          [
            0.6636322518736407,
            0.8804633890986443
          ],
          [
            0.6073787387114096,
            0.888197024255991
          ],
          [
            0.5755832747501486,
            0.8959306594133377
          ],
          [
            0.7614644486775208,
            0.9049532337635755
          ],
          [
            0.6978735207549988,
            0.9062421729564667
          ],
          [
            0.6489574223530586,
            0.9075311121493578
          ],
          [
            0.6073787387114096,
            0.908820051342249
          ]
        ],
        "dw_hand_2": [
          [
            0.24784541545715005,
            0.48604799607396126
          ],
          [
            0.2918699040188961,
            0.44609088109433653
          ],
          [
            0.3310027827404482,
            0.4100005836933851
          ],
          [
            0.3407860024208362,
            0.3893775566071272
          ],
          [
            0.3505692221012242,
            0.36230983355641366
          ],
          [
            0.26496604989782907,
            0.36746559032797815
          ],
          [
            0.2698576597380231,
            0.3391089280843735
          ],
          [
            0.30409892861938115,
            0.33266423211991786
          ],
          [
            0.3432318073409332,
            0.33008635373413564
          ],
          [
            0.24050800069685904,
            0.37004346871376037
          ],
          [
            0.2527370252973441,
            0.3391089280843735
          ],
          [
            0.30654473353947814,
            0.3313752929270267
          ],
          [
            0.3505692221012242,
            0.33008635373413564
          ],
          [
            0.23072478101647104,
            0.38293286064267157
          ],
          [
            0.25029122037724705,
            0.3584430159777403
          ],
          [
            0.30409892861938115,
            0.35070938082039355
          ],
          [
            0.3383401975007392,
            0.35070938082039355
          ],
          [
            0.22827897609637404,
            0.40097800934314726
          ],
          [
            0.2551828302174411,
            0.3867996782213449
          ],
          [
            0.2894240990987991,
            0.3816439214497805
          ],
          [
            0.3163279532198662,
            0.38035498225688935
          ]
        ],
        "dw_face": [
          [
            0.38481049098258224,
            0.41644527965784073
          ],
          [
            0.4043769303433583,
            0.4370683067440987
          ],
          [
            0.41905175986394033,
            0.4576913338303566
          ],
          [
            0.43128078446442536,
            0.4770254217237234
          ],
          [
            0.45084722382520137,
            0.4950705704241991
          ],
          [
            0.4728594681060744,
            0.5118267799317837
          ],
          [
            0.49731751730704443,
            0.5285829894393682
          ],
          [
            0.5315587861884025,
            0.5337387462109328
          ],
          [
            0.5658000550697605,
            0.5247161718606949
          ],
          [
            0.5927039091908276,
            0.5079599623531104
          ],
          [
            0.6122703485516036,
            0.4886258744597435
          ],
          [
            0.6293909829922826,
            0.4680028473734856
          ],
          [
            0.6391742026726707,
            0.4473798202872276
          ],
          [
            0.6367283977525736,
            0.42546785400807857
          ],
          [
            0.6220535682319916,
            0.40355588772892953
          ],
          [
            0.6098245436315066,
            0.38293286064267157
          ],
          [
            0.5927039091908276,
            0.3610208943635225
          ],
          [
            0.3676898565419032,
            0.40484482692182067
          ],
          [
            0.3676898565419032,
            0.40484482692182067
          ],
          [
            0.36524405162180623,
            0.40484482692182067
          ],
          [
            0.36524405162180623,
            0.40484482692182067
          ],
          [
            0.36524405162180623,
            0.40484482692182067
          ],
          [
            0.37258146638209727,
            0.40097800934314726
          ],
          [
            0.38481049098258224,
            0.39582225257158277
          ],
          [
            0.39948532050316427,
            0.3919554349929094
          ],
          [
            0.41660595494384334,
            0.3893775566071272
          ],
          [
            0.43617239430461935,
            0.38808861741423606
          ],
          [
            0.3872562959026793,
            0.41902315804362295
          ],
          [
            0.3897021008227763,
            0.43577936755120755
          ],
          [
            0.3872562959026793,
            0.4525355770587921
          ],
          [
            0.3872562959026793,
            0.4692917865663767
          ],
          [
            0.39948532050316427,
            0.4770254217237234
          ],
          [
            0.41660595494384334,
            0.4770254217237234
          ],
          [
            0.43128078446442536,
            0.47444754333794115
          ],
          [
            0.44350980906491033,
            0.4705807257592678
          ],
          [
            0.45084722382520137,
            0.46671390818059444
          ],
          [
            0.3872562959026793,
            0.41902315804362295
          ],
          [
            0.3872562959026793,
            0.41902315804362295
          ],
          [
            0.3872562959026793,
            0.41902315804362295
          ],
          [
            0.3872562959026793,
            0.41902315804362295
          ],
          [
            0.3872562959026793,
            0.41902315804362295
          ],
          [
            0.3872562959026793,
            0.41902315804362295
          ],
          [
            0.41660595494384334,
            0.41128952288627624
          ],
          [
            0.41905175986394033,
            0.40484482692182067
          ],
          [
            0.43128078446442536,
            0.4022669485360384
          ],
          [
            0.44350980906491033,
            0.4022669485360384
          ],
          [
            0.43617239430461935,
            0.4074227053076029
          ],
          [
            0.4263891746242313,
            0.4125784620791674
          ],
          [
            0.45573883366539536,
            0.4976484488099813
          ],
          [
            0.4484014189051044,
            0.49635950961709024
          ],
          [
            0.44350980906491033,
            0.49249269203841683
          ],
          [
            0.44350980906491033,
            0.49249269203841683
          ],
          [
            0.4484014189051044,
            0.4899148136526346
          ],
          [
            0.4655220533457834,
            0.4899148136526346
          ],
          [
            0.4850884927065594,
            0.49120375284552575
          ],
          [
            0.4801968828663654,
            0.49635950961709024
          ],
          [
            0.4728594681060744,
            0.5028042055815458
          ],
          [
            0.4630762484256864,
            0.5066710231602192
          ],
          [
            0.45818463858549235,
            0.5053820839673281
          ],
          [
            0.45818463858549235,
            0.5015152663886547
          ],
          [
            0.45573883366539536,
            0.4976484488099813
          ],
          [
            0.45573883366539536,
            0.4976484488099813
          ],
          [
            0.45573883366539536,
            0.49635950961709024
          ],
          [
            0.4704136631859774,
            0.49378163123130797
          ],
          [
            0.4826426877864624,
            0.49120375284552575
          ],
          [
            0.4704136631859774,
            0.49378163123130797
          ],
          [
            0.4606304435055894,
            0.4976484488099813
          ],
          [
            0.45818463858549235,
            0.4976484488099813
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "022793",
  "objects": [
    {
      "box": [
        0.16859781742095947,
        0.31601983308792114,
        0.361222505569458,
        0.5268704891204834
      ],
      "name": "hand",
      "possible_names": [
        "hand"
      ],
      "deleted": true
    }
  ],
  "mask_file": "./person_labeling/./022793.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A person wearing a beige jacket and black turtleneck is seated against a dark background with soft lighting creating an intimate atmosphere and blurred objects in the foreground suggesting a casual setting",
  "overall_past": "Before this scene, the individual likely had a conversation or received information that triggered a moment of deep reflection. The soft lighting and blurred foreground suggest a private, unstructured environment—possibly a quiet room or a casual gathering—where the exchange was meaningful but not formal. The act of touching the forehead while looking down indicates a reaction to something emotionally or mentally taxing, such as a difficult decision, a personal revelation, or news that challenged their perspective. It is plausible that they had just been told something unexpected or weighty—perhaps about a relationship, a personal responsibility, or a sudden change in circumstances—prompting this introspective pause as they processed the implications.",
  "overall_past_clean": "A sharp, unexpected revelation had just been delivered—something that shattered a long-held assumption, forcing a sudden confrontation with a truth too heavy to ignore, and the silence that followed was thick with the weight of irreversible change.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to slowly lower their hand from their forehead, take a deep breath, and then look up with a determined expression—perhaps preparing to speak or make a decision. The soft lighting and intimate atmosphere suggest a private, meaningful moment, and the gesture of touching the forehead implies a mental struggle or weighing of options. Given the casual yet introspective setting, it is plausible that they will now turn toward the unseen person or situation, offering a response—whether a confession, a commitment, or a hard-earned conclusion—marking a turning point in the conversation or internal journey.",
  "overall_future_clean": "The hand descends slowly, breath deepens, eyes lift with unwavering resolve, and a voice emerges—clear, steady, and unyielding—declaring a choice that shifts the course of everything.",
  "future_scene_ok": true
}