{
  "video_path": "./ref_datasets/part2/8724518003.mp4",
  "start_time": 0.0,
  "end_time": 6.08,
  "image_path": "./031193.jpg",
  "represents_multiple_types": false,
  "cross_video_duplicate": false,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/8724518003.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/face_-7277223048544915781_1_8724518003.mp4_0.00_6.08.jpg",
      "type": "face"
    }
  ],
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "senior",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a plain, light beige t-shirt with a round neckline. The shirt appears to be made of a soft material and fits loosely on the body.",
        "clothing": [
          {
            "possible_names": [
              "t-shirt",
              "shirt",
              "tee"
            ],
            "name": "t shirt",
            "type": "top",
            "color": [
              "light beige"
            ]
          }
        ],
        "objects": [],
        "description": "The person is an older female with short, light-colored hair. She is wearing a plain, light beige t-shirt with a round neckline. Her expression is neutral, and she is positioned against a dark blue background. There are no additional objects or accessories visible.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a neutral expression, neither smiling nor frowning, suggesting a calm or indifferent state.",
        "meaningful": false,
        "story": "unknown",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person appears to be standing still against a plain dark background, wearing a light-colored top. Their expression is neutral, possibly indicating a calm demeanor or a moment of reflection. The individual's posture suggests they might be engaged in a formal setting or participating in an interview, as there are no visible interactions with other people or objects around them. The simplicity of the scene focuses attention on the person, highlighting their presence and possibly conveying a sense of seriousness or contemplation.",
        "intention": "The individual is deliberately presenting a composed and focused image likely to convey professionalism and sincerity in a formal or evaluative context",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.43813985808187034,
            0.3646749619453672
          ],
          [
            0.44657958023266736,
            0.42893108224111887
          ],
          [
            0.4575888120536027,
            0.4852692959800599
          ],
          [
            0.46726651662694557,
            0.5340352760420906
          ],
          [
            0.4792900202030848,
            0.5817151658118718
          ],
          [
            0.49786641630843015,
            0.6213612974636138
          ],
          [
            0.5204643977922387,
            0.6462857885966226
          ],
          [
            0.540848502199099,
            0.6614972771160186
          ],
          [
            0.5628657643101178,
            0.6619113704514882
          ],
          [
            0.5861740764563105,
            0.646865625419314
          ],
          [
            0.6059189459109413,
            0.6180198894606697
          ],
          [
            0.6242963911000905,
            0.5798449906091842
          ],
          [
            0.6383173524269036,
            0.5252390978828309
          ],
          [
            0.6417753992968106,
            0.4682928926414914
          ],
          [
            0.6414787341408166,
            0.40872239139344957
          ],
          [
            0.6405991930181959,
            0.35274886157777574
          ],
          [
            0.6435751487401181,
            0.28444138661263485
          ],
          [
            0.45579496756961035,
            0.3633926332943023
          ],
          [
            0.4669334512478339,
            0.3314875668949551
          ],
          [
            0.4853617150303242,
            0.3253826335309044
          ],
          [
            0.5035738624366266,
            0.3230752284564669
          ],
          [
            0.5231360581237823,
            0.3329430456199343
          ],
          [
            0.5534493156758669,
            0.32362162707343933
          ],
          [
            0.5693354328562106,
            0.30249881384864685
          ],
          [
            0.5868352265097201,
            0.2899984014412713
          ],
          [
            0.603780159377493,
            0.28546079349896264
          ],
          [
            0.6199260434202318,
            0.30525920287011166
          ],
          [
            0.5376220529682801,
            0.3666924727341485
          ],
          [
            0.5393941877409816,
            0.407733069241993
          ],
          [
            0.5442315304119671,
            0.44751966065830656
          ],
          [
            0.5458869729191065,
            0.49269252939829755
          ],
          [
            0.5319734305043572,
            0.5084054462493413
          ],
          [
            0.5400282160595192,
            0.5149711079067654
          ],
          [
            0.5494861123734154,
            0.5215997858652993
          ],
          [
            0.5586265683440226,
            0.5060769794479248
          ],
          [
            0.5654394742034907,
            0.4931694942807394
          ],
          [
            0.48246827469639747,
            0.37797043645192707
          ],
          [
            0.49184093420626596,
            0.3666360427462866
          ],
          [
            0.5039240521977523,
            0.36592107793641465
          ],
          [
            0.5148093055468053,
            0.37905903581588984
          ],
          [
            0.5024181232604731,
            0.3833525159056224
          ],
          [
            0.49286874628991684,
            0.3823284286355215
          ],
          [
            0.5660485784589713,
            0.358561922349627
          ],
          [
            0.5747376182615491,
            0.33893432286050584
          ],
          [
            0.5850550712618445,
            0.3335589503485059
          ],
          [
            0.5964881816014116,
            0.33611801049065965
          ],
          [
            0.5873667344650519,
            0.3497540673566243
          ],
          [
            0.5783996789084216,
            0.3545135110143631
          ],
          [
            0.5206859005182716,
            0.5625063882933723
          ],
          [
            0.5324615087676128,
            0.5588409722797454
          ],
          [
            0.5433017201139592,
            0.5557029438397242
          ],
          [
            0.5538735895700353,
            0.5563911532598829
          ],
          [
            0.5623724280656981,
            0.5483443190181065
          ],
          [
            0.5762696419842541,
            0.545865259662507
          ],
          [
            0.59119468852545,
            0.5391541200970846
          ],
          [
            0.5778956521202677,
            0.5590857032745604
          ],
          [
            0.5645272042020224,
            0.5706428735975235
          ],
          [
            0.5550269256844851,
            0.5752285881647988
          ],
          [
            0.5464643033587241,
            0.577019196843344
          ],
          [
            0.5332902775096175,
            0.5735814790877084
          ],
          [
            0.5261312691478192,
            0.5634822241843693
          ],
          [
            0.5455942101710076,
            0.5607239823492746
          ],
          [
            0.5548590605280229,
            0.5635279182403807
          ],
          [
            0.5621487995543117,
            0.5562179308088998
          ],
          [
            0.5862532337196171,
            0.5411168896962726
          ],
          [
            0.5626283541371646,
            0.557721443781777
          ],
          [
            0.5529652219764623,
            0.5619689644329131
          ],
          [
            0.5447335546487011,
            0.5587745301307194
          ]
        ],
        "visibility": [
          0.9992807507514954,
          1.7431113519705832e-05,
          2.8355159997772716e-07,
          5.275563406265116e-12,
          0.7685797810554504,
          0.9990764856338501,
          1.8931378686914968e-10,
          1.6802618324485152e-11,
          0.9984645843505859,
          1.3814696053771058e-09,
          1.750219050391763e-17,
          3.7936017174833303e-13,
          0.0005214384873397648,
          7.246671253520465e-13,
          6.561895133927464e-05,
          2.0583019732287706e-16,
          5.0112570343374685e-11,
          8.876162582716063e-10,
          8.765574221400943e-18,
          1.4115973945294513e-09,
          5.88572857689489e-28,
          6.5103355124149746e-21,
          1.4919103705324233e-05,
          8.623064786661416e-06,
          2.0590737367107495e-14,
          3.453444593755849e-15,
          3.807784945371925e-15,
          2.152422315563978e-15,
          4.032290126798621e-12
        ],
        "headpose": {
          "pitch": -13.025817053864529,
          "yaw": -1.4007955994716872,
          "roll": -9.605824369449607
        },
        "attributes": {
          "5 oClock Shadow": 0.004826598800718784,
          "Arched Eyebrows": 0.0011502737179398537,
          "Attractive": 0.11011400073766708,
          "Bags Under Eyes": 0.5867490172386169,
          "Bald": 0.00026178741245530546,
          "Bangs": 0.00025401372113265097,
          "Big Lips": 0.03738566115498543,
          "Big Nose": 0.2776351273059845,
          "Black Hair": 6.840727292001247e-05,
          "Blond Hair": 0.5170185565948486,
          "Blurry": 5.3546959861705545e-06,
          "Brown Hair": 0.0058325654827058315,
          "Bushy Eyebrows": 0.001693753176368773,
          "Chubby": 0.10031141340732574,
          "Double Chin": 0.068398617208004,
          "Eyeglasses": 0.00765701849013567,
          "Goatee": 3.887460843543522e-05,
          "Gray Hair": 0.2974851429462433,
          "Heavy Makeup": 0.001674850471317768,
          "High Cheekbones": 0.2925432622432709,
          "Male": 0.9193882942199707,
          "Mouth Slightly Open": 0.011761697940528393,
          "Mustache": 5.443197096610675e-06,
          "Narrow Eyes": 0.04202007129788399,
          "No Beard": 0.9990031123161316,
          "Oval Face": 0.24395638704299927,
          "Pale Skin": 0.023763634264469147,
          "Pointy Nose": 0.0415215902030468,
          "Receding Hairline": 0.03374563157558441,
          "Rosy Cheeks": 0.004606121219694614,
          "Sideburns": 5.6744365792837925e-06,
          "Smiling": 0.03520938754081726,
          "Straight Hair": 0.6871864795684814,
          "Wavy Hair": 0.015363970771431923,
          "Wearing Earrings": 0.006022405344992876,
          "Wearing Hat": 1.911963408929296e-05,
          "Wearing Lipstick": 0.007789792492985725,
          "Wearing Necklace": 0.006806512828916311,
          "Wearing Necktie": 0.005721079185605049,
          "Young": 0.3139064311981201
        },
        "age": [
          0.009962375275790691,
          0.10363008081912994,
          0.006884360685944557,
          0.036919448524713516,
          0.7563230395317078,
          0.9022564888000488,
          0.5480673909187317,
          0.10973048955202103
        ],
        "race": [
          0.9999496936798096,
          6.146651139715686e-05,
          0.5822287797927856,
          0.004157493356615305,
          0.015149720013141632
        ],
        "gender": [
          0.48124459385871887,
          0.4932588040828705
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 42.16639995574951,
          "disgust": 2.48290366045012e-07,
          "fear": 0.03412811201997101,
          "happy": 27.986299991607666,
          "sad": 22.472110390663147,
          "surprise": 0.0004095176791452104,
          "neutral": 7.340653240680695
        },
        "dominant_emotion": "angry",
        "region": {
          "x": 0,
          "y": 0,
          "w": 1234,
          "h": 1529,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 67,
        "gender": {
          "Woman": 70.65319418907166,
          "Man": 29.346802830696106
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 9.786965508851164e-10,
          "indian": 3.635864667065475e-11,
          "black": 4.450660175092591e-15,
          "white": 100.0,
          "middle eastern": 5.759938304095158e-06,
          "latino hispanic": 3.821331517883664e-06
        },
        "dominant_race": "white"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.2596713900566101,
        0.026339689269661903,
        0.8372580409049988,
        0.9855049252510071
      ]
    ],
    "face_boxes": [
      [
        0.4436672329902649,
        0.1917332261800766,
        0.6446979641914368,
        0.6640076041221619
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.5565120321114857,
            0.8571777078337793
          ],
          [
            0.33632537261644996,
            0.8429341340351527
          ],
          [
            0.29003613169988,
            1.4150510149466544
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.7766986916065216,
            0.871421281632406
          ],
          [
            0.8142305085659027,
            1.4150510149466544
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.5002143066724141,
            0.3871397724791012
          ],
          [
            0.585286425113678,
            0.361026553848286
          ],
          [
            0.4414144601027172,
            0.4274965649085434
          ],
          [
            0.6465883928140004,
            0.3562786959154104
          ]
        ],
        "dw_hand_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_hand_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_face": [
          [
            0.4414144601027172,
            0.3871397724791012
          ],
          [
            0.4476697629292805,
            0.4346183518078567
          ],
          [
            0.4551761263211567,
            0.4820969311366122
          ],
          [
            0.4651846108436585,
            0.5295755104653674
          ],
          [
            0.47644415593147277,
            0.5723062318612473
          ],
          [
            0.49646112497647593,
            0.6102890953242515
          ],
          [
            0.5152270334561665,
            0.6411501718879424
          ],
          [
            0.5402482447624206,
            0.6601416036194445
          ],
          [
            0.5665205166339874,
            0.6601416036194445
          ],
          [
            0.5915417279402415,
            0.6435241008543803
          ],
          [
            0.6115586969852448,
            0.6079151663578138
          ],
          [
            0.62782248433431,
            0.5699323028948095
          ],
          [
            0.6378309688568116,
            0.5200797945996163
          ],
          [
            0.6440862716833751,
            0.47260121527086085
          ],
          [
            0.6440862716833751,
            0.42037477800923007
          ],
          [
            0.6453373322486877,
            0.37052226971403696
          ],
          [
            0.6415841505527496,
            0.32304369038528147
          ],
          [
            0.4651846108436585,
            0.37764405661335027
          ],
          [
            0.47894627706209825,
            0.36340048281472365
          ],
          [
            0.4939590038458507,
            0.3562786959154104
          ],
          [
            0.5089717306296031,
            0.3562786959154104
          ],
          [
            0.5239844574133555,
            0.358652624881848
          ],
          [
            0.5565120321114857,
            0.34678298004965946
          ],
          [
            0.5702736983299256,
            0.3372872641839081
          ],
          [
            0.5865374856789906,
            0.3301654772845948
          ],
          [
            0.6028012730280558,
            0.32541761935171953
          ],
          [
            0.6178139998118083,
            0.33253940625103284
          ],
          [
            0.5427503658930461,
            0.3800179855797879
          ],
          [
            0.5452524870236714,
            0.41562692007635443
          ],
          [
            0.5490056687196097,
            0.4512358545729209
          ],
          [
            0.551507789850235,
            0.4868447890694874
          ],
          [
            0.5339929419358571,
            0.5082101497674275
          ],
          [
            0.5440014264583588,
            0.512958007700303
          ],
          [
            0.5540099109808605,
            0.5153319366667408
          ],
          [
            0.564018395503362,
            0.5058362208009897
          ],
          [
            0.572775819460551,
            0.4963405049352388
          ],
          [
            0.4826994587580364,
            0.39663548834485257
          ],
          [
            0.4939590038458507,
            0.3800179855797879
          ],
          [
            0.5089717306296031,
            0.37764405661335027
          ],
          [
            0.5214823362827301,
            0.3918876304119769
          ],
          [
            0.5089717306296031,
            0.3990094173112902
          ],
          [
            0.49521006441116333,
            0.4037572752441659
          ],
          [
            0.5652694560686748,
            0.37764405661335027
          ],
          [
            0.5752779405911763,
            0.3562786959154104
          ],
          [
            0.5890396068096161,
            0.3491569090160971
          ],
          [
            0.6040523335933685,
            0.358652624881848
          ],
          [
            0.5927927885055542,
            0.3728961986804746
          ],
          [
            0.5790311222871144,
            0.37764405661335027
          ],
          [
            0.5214823362827301,
            0.565184444961934
          ],
          [
            0.5364950630664825,
            0.5580626580626207
          ],
          [
            0.5502567292849223,
            0.5556887290961828
          ],
          [
            0.5577630926767985,
            0.553314800129745
          ],
          [
            0.5652694560686748,
            0.5509408711633074
          ],
          [
            0.5802821828524272,
            0.5461930132304317
          ],
          [
            0.5952949096361797,
            0.5414451552975562
          ],
          [
            0.585286425113678,
            0.5604365870290583
          ],
          [
            0.572775819460551,
            0.5746801608276849
          ],
          [
            0.560265213807424,
            0.5818019477269982
          ],
          [
            0.5465035475889842,
            0.5818019477269982
          ],
          [
            0.5339929419358571,
            0.5770540897941228
          ],
          [
            0.5252355179786682,
            0.5675583739283716
          ],
          [
            0.5414993053277333,
            0.565184444961934
          ],
          [
            0.5590141532421112,
            0.565184444961934
          ],
          [
            0.5752779405911763,
            0.5556887290961828
          ],
          [
            0.5915417279402415,
            0.5461930132304317
          ],
          [
            0.5752779405911763,
            0.5556887290961828
          ],
          [
            0.5590141532421112,
            0.565184444961934
          ],
          [
            0.5414993053277333,
            0.5675583739283716
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "031193",
  "objects": [],
  "mask_file": "./person_labeling/./031193.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "The image features a person against a solid dark blue background wearing a light beige long-sleeved shirt with no other notable objects present in the scene.",
  "overall_past": "Before the current scene, the person likely finished a conversation or a session—such as an interview, a formal discussion, or a recorded statement—where they were actively engaged in communication. The neutral expression and still posture suggest a pause after speaking or listening, indicating a moment of reflection following the exchange. The plain dark background and lack of props or other people reinforce the idea that this is a deliberate, focused setting, possibly for a professional or introspective purpose, such as a job interview, a media appearance, or a personal interview. Thus, the most plausible event before this scene is that the person had just concluded a meaningful verbal exchange and is now taking a brief moment to collect their thoughts.",
  "overall_past_clean": "They had just concluded a tense, high-stakes conversation, their voice steady and deliberate as they delivered the final words, leaving the air charged with unspoken weight before falling into silence.",
  "past_scene_ok": true,
  "overall_future": "Based on the description, the person is standing still in a formal, isolated setting with a neutral expression, suggesting a moment of pause or introspection. The lack of interaction or environmental cues implies a controlled, possibly staged environment—such as an interview, audition, or official recording. Given the calm and serious tone, the most plausible next event is:\n\n**The person begins to speak, likely in response to a question or prompt, marking the start of a dialogue or formal presentation.**\n\nThis follows naturally from the stillness and focus on the individual, indicating that the scene is leading into a moment of communication or expression.",
  "overall_future_clean": "A steady voice emerges, clear and deliberate, cutting through the silence as the individual begins to articulate thoughts with purpose and precision.",
  "future_scene_ok": true
}