{
  "video_path": "./ref_datasets/part2/8090411011.mp4",
  "start_time": 0.0,
  "end_time": 1.32,
  "image_path": "./009528.jpg",
  "represents_multiple_types": true,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/8090411010.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/person_5022734288974257480_1_8090411010.mp4_0.00_6.08.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/8090411010.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/face_5022734288974257480_1_8090411010.mp4_0.00_6.08.jpg",
      "type": "face"
    },
    {
      "video_path": "./ref_datasets/part2/8090411011.mp4",
      "start_time": 0.0,
      "end_time": 1.32,
      "image_path": "./ref_datasets/extracted_frames/person_2248941331733770234_1_8090411011.mp4_0.00_1.32.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/8090411011.mp4",
      "start_time": 0.0,
      "end_time": 1.32,
      "image_path": "./ref_datasets/extracted_frames/face_2248941331733770234_1_8090411011.mp4_0.00_1.32.jpg",
      "type": "face"
    }
  ],
  "cross_video_duplicate": true,
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "senior",
        "gender": "male",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a plain white t-shirt with short sleeves. The shirt appears to be made of a lightweight fabric suitable for casual wear.",
        "clothing": [
          {
            "possible_names": [
              "t-shirt",
              "shirt",
              "tee"
            ],
            "name": "t shirt",
            "type": "top",
            "color": [
              "white"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "glasses",
              "eyeglasses",
              "spectacles"
            ],
            "name": "glasses",
            "position": "head"
          }
        ],
        "description": "The person is an older male with a neutral expression, wearing a plain white t-shirt and glasses. He is positioned against a dark background, which contrasts with his light-colored clothing. The glasses he wears have thin frames and rest on his nose. There are no other objects or accessories visible in the image.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a calm and composed expression, with no strong emotions displayed.",
        "meaningful": false,
        "story": "unknown",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person appears to be standing still against a dark background, wearing glasses and a white shirt, with a serious and contemplative expression on their face which suggests they might be deep in thought or focused on something important. Their posture is upright and steady indicating confidence or determination. The lighting highlights their facial features creating an intense atmosphere around them as if they are about to share significant information or insights. There are no other people or objects in the frame so their actions seem to be entirely self-contained and introspective possibly reflecting on past experiences or planning for future events.",
        "intention": "They are mentally preparing to reveal profound insights or make a decisive choice rooted in deep reflection",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.4205172676854093,
            0.41923468311627704
          ],
          [
            0.42561359922648023,
            0.4945788814907982
          ],
          [
            0.43140278543744764,
            0.5715865447407676
          ],
          [
            0.43956144713527656,
            0.6352552499089923
          ],
          [
            0.44978049714753277,
            0.6958305165881202
          ],
          [
            0.47101451435041236,
            0.7419594094866798
          ],
          [
            0.49663158364187254,
            0.7707499084018525
          ],
          [
            0.5219855628435494,
            0.793354428382147
          ],
          [
            0.548624780344629,
            0.8042208807809013
          ],
          [
            0.5756411833684331,
            0.7965023267836798
          ],
          [
            0.6009080089602205,
            0.7610908752395994
          ],
          [
            0.6232251653709164,
            0.7217772972016107
          ],
          [
            0.6388680459165943,
            0.662164925393604
          ],
          [
            0.6459268271686193,
            0.5877802542277745
          ],
          [
            0.6478570989923131,
            0.5184554477532705
          ],
          [
            0.6473180736315547,
            0.44363253144990833
          ],
          [
            0.650597467279863,
            0.36705191986901414
          ],
          [
            0.44054140577229517,
            0.3710530235653832
          ],
          [
            0.45340499878428364,
            0.30626115486735395
          ],
          [
            0.4753482754174148,
            0.2883738319079081
          ],
          [
            0.49840105457601125,
            0.2825857503073556
          ],
          [
            0.5204228544629186,
            0.2958462578909738
          ],
          [
            0.5518490624986316,
            0.28597262444950283
          ],
          [
            0.5730886286308865,
            0.26221387826261067
          ],
          [
            0.5950886696309031,
            0.2561390161514282
          ],
          [
            0.6160841655142759,
            0.27202739091146555
          ],
          [
            0.6303698251596981,
            0.32231358289718626
          ],
          [
            0.5348344629989262,
            0.37070660335677014
          ],
          [
            0.5354717516345575,
            0.4179818485464369
          ],
          [
            0.5366210293580338,
            0.46385688384373985
          ],
          [
            0.5381511525363758,
            0.5113012177603585
          ],
          [
            0.5137920255342853,
            0.5559577686446053
          ],
          [
            0.5260561629833723,
            0.5666950310979572
          ],
          [
            0.5397616171283319,
            0.5747881974492755
          ],
          [
            0.5545989584159811,
            0.5594602017175584
          ],
          [
            0.5669787379144949,
            0.547026150567191
          ],
          [
            0.4662500383015632,
            0.40243553207034155
          ],
          [
            0.4775185089210067,
            0.3863716539882478
          ],
          [
            0.49212403482933026,
            0.3806147793928782
          ],
          [
            0.5054499776237207,
            0.397041178317297
          ],
          [
            0.4910868336730012,
            0.4037942716053554
          ],
          [
            0.47942042217372327,
            0.40535568027269275
          ],
          [
            0.5688374639679462,
            0.38398298706327166
          ],
          [
            0.5815389160829666,
            0.36155358552932737
          ],
          [
            0.5939353187571408,
            0.3594980606010982
          ],
          [
            0.6059845237396821,
            0.3717398663361867
          ],
          [
            0.5943546525306518,
            0.3825263928799402
          ],
          [
            0.5821685188611017,
            0.38629878418786184
          ],
          [
            0.4962936420366869,
            0.6484464157195318
          ],
          [
            0.5124220420964665,
            0.6355931066331408
          ],
          [
            0.5294035841445748,
            0.6297193260419937
          ],
          [
            0.5420465481827335,
            0.634428216162182
          ],
          [
            0.5532285617600173,
            0.6249555911336627
          ],
          [
            0.5715442081047286,
            0.6317768074217297
          ],
          [
            0.5926531618844761,
            0.6457277820223855
          ],
          [
            0.5723322033009453,
            0.6574745734532674
          ],
          [
            0.5546963834483313,
            0.6621023830913363
          ],
          [
            0.5424258824398118,
            0.6676351638067336
          ],
          [
            0.5297887152619153,
            0.665432520139785
          ],
          [
            0.5128417182507263,
            0.6617253331910996
          ],
          [
            0.501132202195812,
            0.6471525918869745
          ],
          [
            0.5310124548951145,
            0.644210858572097
          ],
          [
            0.5412538777183624,
            0.6489896677789233
          ],
          [
            0.5530192372540105,
            0.6431381458327883
          ],
          [
            0.5852565807020582,
            0.6438465737161182
          ],
          [
            0.5537977992702892,
            0.6435391221727643
          ],
          [
            0.5413145381420433,
            0.6474750535828727
          ],
          [
            0.5284559214571434,
            0.6415217961583819
          ]
        ],
        "visibility": [
          0.01874484308063984,
          7.76718138695287e-08,
          0.9997839331626892,
          1.2787658952573278e-11,
          0.007928824983537197,
          0.999997615814209,
          1.667796189217565e-19,
          3.80115279530191e-11,
          0.9999911785125732,
          8.139513063554205e-09,
          0.9835968613624573,
          0.1429363489151001,
          0.9999010562896729,
          0.006950305309146643,
          2.9319226086954586e-05,
          3.0000793516116175e-11,
          0.0024259062483906746,
          5.113652150612324e-07,
          0.0009762699482962489,
          0.030799517408013344,
          2.3529830427831966e-12,
          2.6219132295564742e-17,
          1.2903765309602022e-05,
          5.21279579831363e-13,
          2.39360370716743e-13,
          5.321635601802932e-13,
          7.582726113675164e-12,
          5.145998644567884e-12,
          2.6800991981268396e-10
        ],
        "headpose": {
          "pitch": -2.015585408976178,
          "yaw": 0.22196471288272407,
          "roll": -4.149510675511997
        },
        "attributes": {
          "5 oClock Shadow": 0.2765377461910248,
          "Arched Eyebrows": 0.0049458215944468975,
          "Attractive": 0.027699586004018784,
          "Bags Under Eyes": 0.31927135586738586,
          "Bald": 0.10321776568889618,
          "Bangs": 0.00012245532707311213,
          "Big Lips": 0.17274214327335358,
          "Big Nose": 0.6399331092834473,
          "Black Hair": 0.0389123298227787,
          "Blond Hair": 0.0011932987254112959,
          "Blurry": 0.005771147087216377,
          "Brown Hair": 0.0007328988867811859,
          "Bushy Eyebrows": 0.0405404306948185,
          "Chubby": 0.16891314089298248,
          "Double Chin": 0.05719839781522751,
          "Eyeglasses": 0.03734169527888298,
          "Goatee": 0.3071466386318207,
          "Gray Hair": 0.05203121528029442,
          "Heavy Makeup": 0.0003489663649816066,
          "High Cheekbones": 0.16076865792274475,
          "Male": 0.9995090961456299,
          "Mouth Slightly Open": 0.0007998385699465871,
          "Mustache": 0.17590461671352386,
          "Narrow Eyes": 0.08069511502981186,
          "No Beard": 0.09558741003274918,
          "Oval Face": 0.14489714801311493,
          "Pale Skin": 0.002824063878506422,
          "Pointy Nose": 0.03241630643606186,
          "Receding Hairline": 0.02792232856154442,
          "Rosy Cheeks": 0.000678473908919841,
          "Sideburns": 0.2224739044904709,
          "Smiling": 0.01842757873237133,
          "Straight Hair": 0.009310012683272362,
          "Wavy Hair": 0.0025751828216016293,
          "Wearing Earrings": 0.004963797051459551,
          "Wearing Hat": 0.06783688068389893,
          "Wearing Lipstick": 0.0006119322497397661,
          "Wearing Necklace": 0.019337421283125877,
          "Wearing Necktie": 0.007572570350021124,
          "Young": 0.40544363856315613
        },
        "age": [
          0.004621726460754871,
          0.01755741983652115,
          0.07731794565916061,
          0.14359846711158752,
          0.53806072473526,
          0.8822585940361023,
          0.7344293594360352,
          0.6323094367980957
        ],
        "race": [
          0.30002155900001526,
          0.21605676412582397,
          0.7625349164009094,
          0.5834635496139526,
          0.5415859222412109
        ],
        "gender": [
          0.9904534816741943,
          0.015351307578384876
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 2.2153579223361565e-13,
          "disgust": 0.0,
          "fear": 1.5060363978136593e-05,
          "happy": 2.8637484172266462e-21,
          "sad": 99.99998807907104,
          "surprise": 8.467867512716234e-31,
          "neutral": 2.743969022894594e-16
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 946,
          "h": 1355,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 56,
        "gender": {
          "Woman": 0.8429365232586861,
          "Man": 99.15705919265747
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 1.3139057904481888,
          "indian": 2.330583520233631,
          "black": 0.1759115606546402,
          "white": 66.46225452423096,
          "middle eastern": 19.532382488250732,
          "latino hispanic": 10.184958577156067
        },
        "dominant_race": "white"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.23410004377365112,
        0.06670408695936203,
        0.8363650441169739,
        0.9868817329406738
      ]
    ],
    "face_boxes": [
      [
        0.4246978759765625,
        0.13676513731479645,
        0.6556621789932251,
        0.7808065414428711
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.5433647191524505,
            0.9849163880271297
          ],
          [
            0.3026076203584671,
            0.9836331167076299
          ],
          [
            0.13759432792663573,
            1.0041654578196255
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.784121817946434,
            0.9861996593466293
          ],
          [
            0.9153209111094475,
            1.040097054765618
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.4797940245270729,
            0.39589485237675326
          ],
          [
            0.5934097340703011,
            0.3753625112647576
          ],
          [
            0.4216336017847061,
            0.47802421682473606
          ],
          [
            0.6610381326079369,
            0.4523587904347414
          ]
        ],
        "dw_hand_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_hand_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_face": [
          [
            0.417575897872448,
            0.4087275655717506
          ],
          [
            0.4189284658432007,
            0.4728911315467371
          ],
          [
            0.42433873772621156,
            0.5370546975217236
          ],
          [
            0.43110157757997514,
            0.6012182634967101
          ],
          [
            0.44327468931674957,
            0.6628152868326973
          ],
          [
            0.46085807293653486,
            0.711579596973687
          ],
          [
            0.4865568643808365,
            0.7552108218366779
          ],
          [
            0.5163133597373962,
            0.7834427908656719
          ],
          [
            0.5487749910354615,
            0.7885758761436709
          ],
          [
            0.5825891903042794,
            0.7757431629486735
          ],
          [
            0.6109931176900864,
            0.739811566002681
          ],
          [
            0.6326342052221299,
            0.6936137985006908
          ],
          [
            0.646159884929657,
            0.6345833178037031
          ],
          [
            0.6529227247834206,
            0.5704197518287166
          ],
          [
            0.655627860724926,
            0.5062561858537301
          ],
          [
            0.6569804286956787,
            0.4420926198787436
          ],
          [
            0.655627860724926,
            0.37792905390375703
          ],
          [
            0.436511849462986,
            0.36252979806976027
          ],
          [
            0.4527426651120186,
            0.3419974569577646
          ],
          [
            0.47303118467330935,
            0.3368643716797657
          ],
          [
            0.4933197042346001,
            0.3368643716797657
          ],
          [
            0.5136082237958908,
            0.33943091431876515
          ],
          [
            0.5595955348014832,
            0.3265982011237678
          ],
          [
            0.5771789184212684,
            0.31633203056777
          ],
          [
            0.5961148700118065,
            0.31119894528977105
          ],
          [
            0.6164033895730973,
            0.3137654879287705
          ],
          [
            0.6353393411636352,
            0.33173128640176675
          ],
          [
            0.536601879298687,
            0.3881952244597549
          ],
          [
            0.5379544472694398,
            0.42669336404474684
          ],
          [
            0.5393070152401924,
            0.4651915036297387
          ],
          [
            0.5406595832109451,
            0.5062561858537301
          ],
          [
            0.5149607917666436,
            0.5550204959947199
          ],
          [
            0.5284864714741707,
            0.5575870386337194
          ],
          [
            0.5433647191524505,
            0.5575870386337194
          ],
          [
            0.5568903988599777,
            0.5524539533557205
          ],
          [
            0.5704160785675049,
            0.5473208680777215
          ],
          [
            0.4540952330827713,
            0.40359448029375167
          ],
          [
            0.4703260487318039,
            0.38562868182075544
          ],
          [
            0.4892620003223419,
            0.38306213918175597
          ],
          [
            0.5054928159713745,
            0.4010279376547522
          ],
          [
            0.4879094323515892,
            0.4112941082107501
          ],
          [
            0.4703260487318039,
            0.4138606508497495
          ],
          [
            0.5690635105967522,
            0.3881952244597549
          ],
          [
            0.5825891903042794,
            0.3676628833477592
          ],
          [
            0.6001725739240646,
            0.36252979806976027
          ],
          [
            0.6164033895730973,
            0.37792905390375703
          ],
          [
            0.6015251418948173,
            0.3907617670987544
          ],
          [
            0.5852943262457848,
            0.39332830973775385
          ],
          [
            0.5000825440883636,
            0.6422829457207015
          ],
          [
            0.5163133597373962,
            0.6294502325257042
          ],
          [
            0.5352493113279343,
            0.6217506046087059
          ],
          [
            0.5447172871232033,
            0.6217506046087059
          ],
          [
            0.555537830889225,
            0.6191840619697064
          ],
          [
            0.574473782479763,
            0.6217506046087059
          ],
          [
            0.5934097340703011,
            0.6320167751647037
          ],
          [
            0.5785314863920212,
            0.6474160309987005
          ],
          [
            0.5623006707429886,
            0.6551156589156989
          ],
          [
            0.546069855093956,
            0.6576822015546984
          ],
          [
            0.5298390394449234,
            0.6576822015546984
          ],
          [
            0.5149607917666436,
            0.6525491162766994
          ],
          [
            0.5054928159713745,
            0.6422829457207015
          ],
          [
            0.5244287675619126,
            0.6397164030817021
          ],
          [
            0.546069855093956,
            0.6371498604427026
          ],
          [
            0.5663583746552467,
            0.6320167751647037
          ],
          [
            0.5879994621872902,
            0.6320167751647037
          ],
          [
            0.5677109426259994,
            0.6345833178037031
          ],
          [
            0.546069855093956,
            0.6397164030817021
          ],
          [
            0.5257813355326653,
            0.6397164030817021
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "009528",
  "objects": [],
  "mask_file": "./person_labeling/./009528.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A dimly lit scene with a stark black background and soft lighting highlighting an individual wearing a white shirt creating a minimalist and contemplative atmosphere",
  "overall_past": "Before this scene, the person likely spent a prolonged period in quiet reflection or intense mental preparation—perhaps reviewing a pivotal decision, a personal failure, or a moment of profound realization. The seriousness in their expression, combined with the solitary, minimalist setting, suggests they were engaged in deep introspection, possibly after a significant life event or creative breakthrough. The white shirt and glasses may symbolize clarity or intellectual rigor, indicating they had been analyzing complex ideas or emotions. The stillness and focused posture imply that they had just reached a moment of resolution or clarity, preparing to act or speak with purpose—making this current scene the quiet culmination of an internal journey.",
  "overall_past_clean": "They had been locked in a relentless internal reckoning, dissecting every choice, every failure, every unspoken truth until the weight of it all coalesced into a single, undeniable conviction that demanded release.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the person is likely to begin speaking—perhaps delivering a profound insight, a personal revelation, or a carefully considered decision. The intense, focused expression, upright posture, and solitary, contemplative setting suggest a moment of internal clarity preceding an outward expression of thought. Given the minimalist and dramatic lighting, the scene feels like a threshold: the silence before a breakthrough. The most plausible next event is that the person slowly raises their head, takes a deep breath, and begins to speak—voice calm but resonant—sharing a truth they’ve been reflecting on, possibly about purpose, change, or a pivotal life choice. This moment marks the transition from introspection to action or communication.",
  "overall_future_clean": "The air shifts as they lift their gaze, breath steadying, then a voice emerges—clear, unwavering, cutting through the stillness like a blade through silence, declaring a truth long held in the quiet.",
  "future_scene_ok": true
}