{
  "video_path": "./ref_datasets/part2/6721814001.mp4",
  "start_time": 0.0,
  "end_time": 2.0,
  "image_path": "./005779.jpg",
  "represents_multiple_types": true,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/6721814001.mp4",
      "start_time": 0.0,
      "end_time": 2.0,
      "image_path": "./ref_datasets/extracted_frames/person_3154341143363873500_1_6721814001.mp4_0.00_2.00.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/6721814001.mp4",
      "start_time": 0.0,
      "end_time": 2.0,
      "image_path": "./ref_datasets/extracted_frames/face_3154341143363873500_1_6721814001.mp4_0.00_2.00.jpg",
      "type": "face"
    }
  ],
  "cross_video_duplicate": false,
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a dark gray headwrap, a black sweater, and a green jacket. She also has large hoop earrings.",
        "clothing": [
          {
            "possible_names": [
              "headwrap",
              "turban"
            ],
            "name": "headwrap",
            "type": "headwear",
            "color": [
              "dark gray"
            ]
          },
          {
            "possible_names": [
              "sweater",
              "knit top"
            ],
            "name": "sweater",
            "type": "top",
            "color": [
              "black"
            ]
          },
          {
            "possible_names": [
              "jacket",
              "coat"
            ],
            "name": "jacket",
            "type": "top",
            "color": [
              "green"
            ]
          },
          {
            "possible_names": [
              "earrings",
              "hoop earrings"
            ],
            "name": "earrings",
            "type": "accessory",
            "color": [
              "silver"
            ]
          }
        ],
        "objects": [],
        "description": "The person is an adult female with a neutral expression. She is wearing a dark gray headwrap, a black sweater, and a green jacket. She also has large silver hoop earrings. The background consists of trees with autumn leaves.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a calm and composed expression, suggesting a neutral emotional state.",
        "meaningful": false,
        "story": "unknown",
        "race": "black",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person in the green bounding box appears to be standing outdoors, possibly in a park or garden setting, as indicated by the tree branches and leaves in the background. They are wearing a dark head covering and large hoop earrings, suggesting a sense of personal style and cultural expression. Their posture is upright and they seem to be looking directly at the camera, which could indicate that they are engaged in a conversation or being interviewed. The calm and composed expression on their face suggests confidence and a willingness to communicate, possibly motivated by a desire to share their thoughts or experiences with an audience. The overall scene conveys a sense of tranquility and connection with nature, enhancing the impression of a thoughtful and reflective moment.",
        "intention": "They intend to share their thoughts or experiences with an audience in a confident and reflective manner",
        "intention_ok": false
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.3656825170586152,
            0.32036053997183606
          ],
          [
            0.362883702918355,
            0.35663444541749495
          ],
          [
            0.36006367040931114,
            0.400284655131991
          ],
          [
            0.36087146094068884,
            0.44335054168625476
          ],
          [
            0.36363451620563864,
            0.4883210869062515
          ],
          [
            0.37290762551128864,
            0.531163735474859
          ],
          [
            0.3853840058403356,
            0.562190760695745
          ],
          [
            0.39815547382459043,
            0.5885693095033131
          ],
          [
            0.4163800266837435,
            0.6040588850066775
          ],
          [
            0.44366526923009325,
            0.604234917012472
          ],
          [
            0.46632371747067997,
            0.5851774476823353
          ],
          [
            0.49445817688746113,
            0.5707489327778892
          ],
          [
            0.5186891539820604,
            0.5452436230012349
          ],
          [
            0.5362390478540744,
            0.5016446286723727
          ],
          [
            0.5434500107275587,
            0.45112788199432313
          ],
          [
            0.550612207768219,
            0.39304058965709476
          ],
          [
            0.5576522542962007,
            0.3309632464770287
          ],
          [
            0.36405543694272635,
            0.27663071491415536
          ],
          [
            0.3708568037487566,
            0.23548698044485517
          ],
          [
            0.3835604929697833,
            0.2337906676861975
          ],
          [
            0.39978882148861883,
            0.22835093027069459
          ],
          [
            0.4125205505506268,
            0.24187425022560455
          ],
          [
            0.4376859872734973,
            0.23543166019140724
          ],
          [
            0.45861658225102087,
            0.2190229045493262
          ],
          [
            0.4795014887515988,
            0.2179250910641655
          ],
          [
            0.49956158181386334,
            0.233848851800911
          ],
          [
            0.5172044733805317,
            0.2665389451242629
          ],
          [
            0.41924514758533665,
            0.28494261879296534
          ],
          [
            0.41642281218831034,
            0.3098799532841123
          ],
          [
            0.4121084720827639,
            0.333084914230165
          ],
          [
            0.4075361469760537,
            0.35669828565820816
          ],
          [
            0.3969033695225205,
            0.4071936965698288
          ],
          [
            0.40444502505872937,
            0.40994212036094974
          ],
          [
            0.41256165376731324,
            0.4137913885570707
          ],
          [
            0.42627753149718045,
            0.4098900219514257
          ],
          [
            0.4385046049686415,
            0.40832389555280163
          ],
          [
            0.375563070770087,
            0.3122032368703494
          ],
          [
            0.3812046180479228,
            0.29440097406743065
          ],
          [
            0.3972554703243077,
            0.29184485856029724
          ],
          [
            0.40757704503568154,
            0.3070001975884514
          ],
          [
            0.39579622919804286,
            0.3086362260674673
          ],
          [
            0.3836035656942321,
            0.3103767854826791
          ],
          [
            0.45510062109678984,
            0.3054624234163572
          ],
          [
            0.46708276781386565,
            0.28717619192505645
          ],
          [
            0.4817522258098636,
            0.28256064991629315
          ],
          [
            0.4932629728955882,
            0.2959427576452967
          ],
          [
            0.48299707780991274,
            0.2998739800046361
          ],
          [
            0.4661525344210012,
            0.30226900331557743
          ],
          [
            0.3890576712254967,
            0.47344867350563163
          ],
          [
            0.39724214537335295,
            0.45000648938474197
          ],
          [
            0.406842818696584,
            0.4335245382218134
          ],
          [
            0.41352746139413543,
            0.4380102995842223
          ],
          [
            0.42196503780516126,
            0.4342769700383383
          ],
          [
            0.44050193202814886,
            0.4522276524513487
          ],
          [
            0.461460756616933,
            0.47779596717584705
          ],
          [
            0.4409917342476547,
            0.4791666589086018
          ],
          [
            0.42626122151102336,
            0.4838768992632155
          ],
          [
            0.4147342772755239,
            0.48587348787557505
          ],
          [
            0.40689645700954963,
            0.48439024639508077
          ],
          [
            0.39741903178926025,
            0.48004328684201314
          ],
          [
            0.39360814710546815,
            0.46874115381922044
          ],
          [
            0.40377555654517244,
            0.4618952366567793
          ],
          [
            0.4135918499369707,
            0.4573594054532429
          ],
          [
            0.42626427835119624,
            0.45939312880001376
          ],
          [
            0.45516348121953865,
            0.47572396355015895
          ],
          [
            0.42644171869116165,
            0.4611398455169466
          ],
          [
            0.41640523022839,
            0.4603442648573527
          ],
          [
            0.4048909031519933,
            0.4613845147310741
          ]
        ],
        "visibility": [
          1.0,
          0.9999982118606567,
          0.9650646448135376,
          5.731140845455229e-05,
          1.0,
          0.999998927116394,
          0.7694504261016846,
          0.0007418766035698354,
          0.9721320271492004,
          1.0769869732030202e-05,
          1.5102324724125538e-08,
          3.584946898627095e-05,
          1.9456995232758345e-06,
          1.2232608526119293e-07,
          5.544555460801348e-05,
          1.4505409318132934e-08,
          2.1770918401387007e-12,
          7.362991327752866e-10,
          1.0544896553166261e-11,
          1.0472568368058432e-09,
          8.190241934907371e-15,
          1.0471102564452844e-18,
          1.7672782348654437e-08,
          1.8091707687517555e-08,
          8.077898187841655e-20,
          3.691712036907838e-17,
          2.083701050245579e-12,
          1.2120557607637919e-15,
          1.1220330461900456e-16
        ],
        "headpose": {
          "pitch": 9.768030263180009,
          "yaw": 17.72640361331243,
          "roll": 2.5950460649987774
        },
        "attributes": {
          "5 oClock Shadow": 0.012311821803450584,
          "Arched Eyebrows": 0.0102311996743083,
          "Attractive": 0.07020814716815948,
          "Bags Under Eyes": 0.3506847620010376,
          "Bald": 0.0007826120126992464,
          "Bangs": 0.00010068759729620069,
          "Big Lips": 0.29234227538108826,
          "Big Nose": 0.6890645623207092,
          "Black Hair": 0.22851230204105377,
          "Blond Hair": 0.0002611031522974372,
          "Blurry": 0.00015936499403323978,
          "Brown Hair": 0.0016965564573183656,
          "Bushy Eyebrows": 0.11946620047092438,
          "Chubby": 0.8517704010009766,
          "Double Chin": 0.17059257626533508,
          "Eyeglasses": 0.006052528508007526,
          "Goatee": 0.0002386211126577109,
          "Gray Hair": 0.0004877025494351983,
          "Heavy Makeup": 0.018395904451608658,
          "High Cheekbones": 0.43081343173980713,
          "Male": 0.8012208342552185,
          "Mouth Slightly Open": 0.2207322120666504,
          "Mustache": 0.00012387119932100177,
          "Narrow Eyes": 0.4295058250427246,
          "No Beard": 0.991560161113739,
          "Oval Face": 0.2352955937385559,
          "Pale Skin": 0.0107321348041296,
          "Pointy Nose": 0.002853483660146594,
          "Receding Hairline": 0.009415190666913986,
          "Rosy Cheeks": 0.0010052132420241833,
          "Sideburns": 0.00031166651751846075,
          "Smiling": 0.3189040720462799,
          "Straight Hair": 0.09928885847330093,
          "Wavy Hair": 0.002744352212175727,
          "Wearing Earrings": 0.15564343333244324,
          "Wearing Hat": 0.08521914482116699,
          "Wearing Lipstick": 0.011947204358875751,
          "Wearing Necklace": 0.009912579320371151,
          "Wearing Necktie": 0.003330919425934553,
          "Young": 0.977458655834198
        },
        "age": [
          0.5057992339134216,
          0.9744815230369568,
          0.9259445667266846,
          0.5586309432983398,
          0.03281671553850174,
          0.0005717662279494107,
          4.6503122575813904e-05,
          1.8101460455000051e-06
        ],
        "race": [
          0.14214752614498138,
          0.12448999285697937,
          0.789505660533905,
          0.9042646288871765,
          0.3208814859390259
        ],
        "gender": [
          0.554050862789154,
          0.42716163396835327
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 3.6448538303375244,
          "disgust": 9.291373430642125e-05,
          "fear": 0.1535471179522574,
          "happy": 1.0627941228449345,
          "sad": 2.973475120961666,
          "surprise": 0.052765716100111604,
          "neutral": 92.11246967315674
        },
        "dominant_emotion": "neutral",
        "region": {
          "x": 0,
          "y": 0,
          "w": 770,
          "h": 1008,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 26,
        "gender": {
          "Woman": 67.67270565032959,
          "Man": 32.32729136943817
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 4.4655922800302505,
          "indian": 5.586804449558258,
          "black": 3.3427219837903976,
          "white": 26.712021231651306,
          "middle eastern": 9.82334315776825,
          "latino hispanic": 50.06951689720154
        },
        "dominant_race": "latino hispanic"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.10908982902765274,
        0.00830842088907957,
        0.8325385451316833,
        0.9868117570877075
      ]
    ],
    "face_boxes": [
      [
        0.35175320506095886,
        0.12821142375469208,
        0.5525319576263428,
        0.595100462436676
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.4496280813382732,
            0.8467394314697486
          ],
          [
            0.20387866838110813,
            0.863831673900145
          ],
          [
            0.1174261061681641,
            1.0319053911323741
          ],
          [
            0.013362836837768555,
            0.9834773709129182
          ],
          [
            0.6953774942954383,
            0.8296471890393523
          ],
          [
            0.8106475772460303,
            1.0205105628454436
          ],
          [
            0.9339225270681909,
            0.9635364214107892
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.3879906064271927,
            0.328274744414397
          ],
          [
            0.47764511538876425,
            0.3254260373426644
          ],
          [
            0.35437016556660345,
            0.39949242120771467
          ],
          [
            0.5640976776017083,
            0.4194333707098435
          ]
        ],
        "dw_hand_1": [
          [
            0.9339225270681909,
            0.9293519365499969
          ],
          [
            0.9339225270681909,
            0.9037135729044026
          ],
          [
            0.9339225270681909,
            0.8752265021870757
          ],
          [
            0.9339225270681909,
            0.8267984819676196
          ],
          [
            0.9339225270681909,
            0.8211010678241544
          ],
          [
            0.9339225270681909,
            0.8296471890393523
          ],
          [
            0.9339225270681909,
            0.8267984819676196
          ],
          [
            0.9339225270681909,
            0.8211010678241544
          ],
          [
            0.9339225270681909,
            0.823949774895887
          ],
          [
            0.9339225270681909,
            0.8695290880436103
          ],
          [
            0.9339225270681909,
            0.8324958961110854
          ],
          [
            0.9339225270681909,
            0.8609829668284119
          ],
          [
            0.9339225270681909,
            0.8666803809718777
          ],
          [
            0.9339225270681909,
            0.8951674516892046
          ],
          [
            0.9339225270681909,
            0.8752265021870757
          ],
          [
            0.9339225270681909,
            0.8809239163305409
          ],
          [
            0.9339225270681909,
            0.8951674516892046
          ],
          [
            0.9339225270681909,
            0.9122596941196006
          ],
          [
            0.9339225270681909,
            0.9037135729044026
          ],
          [
            0.9339225270681909,
            0.892318744617472
          ],
          [
            0.9339225270681909,
            0.883772623402274
          ]
        ],
        "dw_hand_2": [
          [
            0.013362836837768555,
            0.9293519365499969
          ],
          [
            0.013362836837768555,
            0.90086486583267
          ],
          [
            0.013362836837768555,
            0.8780752092588083
          ],
          [
            0.013362836837768555,
            0.8609829668284119
          ],
          [
            0.013362836837768555,
            0.8324958961110854
          ],
          [
            0.013362836837768555,
            0.8552855526849467
          ],
          [
            0.013362836837768555,
            0.8467394314697486
          ],
          [
            0.013362836837768555,
            0.8609829668284119
          ],
          [
            0.013362836837768555,
            0.8695290880436103
          ],
          [
            0.013362836837768555,
            0.872377795115343
          ],
          [
            0.013362836837768555,
            0.863831673900145
          ],
          [
            0.013362836837768555,
            0.8780752092588083
          ],
          [
            0.013362836837768555,
            0.892318744617472
          ],
          [
            0.013362836837768555,
            0.8951674516892046
          ],
          [
            0.013362836837768555,
            0.892318744617472
          ],
          [
            0.013362836837768555,
            0.8980161587609373
          ],
          [
            0.013362836837768555,
            0.9122596941196006
          ],
          [
            0.013362836837768555,
            0.9179571082630663
          ],
          [
            0.013362836837768555,
            0.9179571082630663
          ],
          [
            0.013362836837768555,
            0.9151084011913336
          ],
          [
            0.013362836837768555,
            0.9122596941196006
          ]
        ],
        "dw_face": [
          [
            0.3559711389409172,
            0.34536698684479317
          ],
          [
            0.35276919219228964,
            0.3937950070642492
          ],
          [
            0.35276919219228964,
            0.43937432021197226
          ],
          [
            0.35437016556660345,
            0.4821049262879629
          ],
          [
            0.36077405906385845,
            0.5248355323639536
          ],
          [
            0.3735818460583687,
            0.5590200172247459
          ],
          [
            0.39279352655013394,
            0.5875070879420728
          ],
          [
            0.415207153790527,
            0.5960532091572708
          ],
          [
            0.44082272777954745,
            0.5960532091572708
          ],
          [
            0.46483732839425396,
            0.5903557950138055
          ],
          [
            0.48885192900896074,
            0.5818096737986076
          ],
          [
            0.5128665296236674,
            0.5618687242964785
          ],
          [
            0.5320782101154328,
            0.5362303606508843
          ],
          [
            0.5448859971099429,
            0.49349975457489376
          ],
          [
            0.5512898906071981,
            0.453617855570636
          ],
          [
            0.5560928107301394,
            0.40803854242291265
          ],
          [
            0.5592947574787669,
            0.3653079363469222
          ],
          [
            0.3623750324381722,
            0.3054850878405354
          ],
          [
            0.37198087268405494,
            0.28839284541013926
          ],
          [
            0.3847886596785652,
            0.28269543126667374
          ],
          [
            0.3975964466730754,
            0.28269543126667374
          ],
          [
            0.41040423366758566,
            0.28839284541013926
          ],
          [
            0.44722662127680246,
            0.27984672419494105
          ],
          [
            0.46483732839425396,
            0.27414931005147575
          ],
          [
            0.48244803551170573,
            0.2713006029797431
          ],
          [
            0.5016597160034709,
            0.27699801712320843
          ],
          [
            0.5176694497466088,
            0.2969389666253374
          ],
          [
            0.4248129940364097,
            0.3254260373426644
          ],
          [
            0.421611047287782,
            0.34251827977306054
          ],
          [
            0.4184091005391545,
            0.3596105222034567
          ],
          [
            0.415207153790527,
            0.37670276463385305
          ],
          [
            0.4007983934217029,
            0.4165846636381108
          ],
          [
            0.41040423366758566,
            0.4165846636381108
          ],
          [
            0.42001007391346823,
            0.4165846636381108
          ],
          [
            0.4312168875336647,
            0.4165846636381108
          ],
          [
            0.44402467452817496,
            0.4165846636381108
          ],
          [
            0.3735818460583687,
            0.33966957270132786
          ],
          [
            0.38318768630425143,
            0.328274744414397
          ],
          [
            0.39599547329876167,
            0.3254260373426644
          ],
          [
            0.40720228691895793,
            0.336820865629595
          ],
          [
            0.39599547329876167,
            0.34536698684479317
          ],
          [
            0.3847886596785652,
            0.34536698684479317
          ],
          [
            0.4568324615226852,
            0.3339721585578624
          ],
          [
            0.4680392751428817,
            0.31972862319919887
          ],
          [
            0.48404900888601937,
            0.31972862319919887
          ],
          [
            0.49845776925484336,
            0.3339721585578624
          ],
          [
            0.48404900888601937,
            0.33966957270132786
          ],
          [
            0.46964024851719544,
            0.33966957270132786
          ],
          [
            0.3879906064271927,
            0.4821049262879629
          ],
          [
            0.3975964466730754,
            0.46216397678583393
          ],
          [
            0.41040423366758566,
            0.44792044142717047
          ],
          [
            0.4184091005391545,
            0.44792044142717047
          ],
          [
            0.42641396741072346,
            0.4450717343554378
          ],
          [
            0.44722662127680246,
            0.4564665626423686
          ],
          [
            0.46483732839425396,
            0.4764075121444976
          ],
          [
            0.45042856802542997,
            0.4849536333596956
          ],
          [
            0.4344188342822922,
            0.49349975457489376
          ],
          [
            0.4184091005391545,
            0.49634846164662644
          ],
          [
            0.40720228691895793,
            0.49634846164662644
          ],
          [
            0.3975964466730754,
            0.4906510475031609
          ],
          [
            0.3911925531758202,
            0.4821049262879629
          ],
          [
            0.4056013135446442,
            0.47071009800103214
          ],
          [
            0.4184091005391545,
            0.4650126838575666
          ],
          [
            0.44082272777954745,
            0.4650126838575666
          ],
          [
            0.46163538164562645,
            0.47355880507276477
          ],
          [
            0.4392217544052337,
            0.47071009800103214
          ],
          [
            0.4184091005391545,
            0.47071009800103214
          ],
          [
            0.4056013135446442,
            0.4764075121444976
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "005779",
  "objects": [],
  "mask_file": "./person_labeling/./005779.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A person stands outdoors with a backdrop of trees and autumn leaves wearing a green jacket and large hoop earrings against an overcast sky",
  "overall_past": "Before the current scene, the person likely arrived at the park or garden after a quiet walk through the autumnal woods, perhaps having chosen this serene location intentionally to reflect or prepare for a meaningful conversation. The dark head covering and large hoop earrings suggest they may have been getting ready for a public appearance, interview, or personal expression—possibly a cultural or artistic presentation. The calm, composed demeanor and direct gaze imply they had already gathered their thoughts, perhaps rehearsing or mentally preparing to share a story, perspective, or message. The overcast sky and falling leaves may mirror an introspective mood, indicating that the moment captured is a pause in a journey—both physical and emotional—where they’ve found stillness before speaking their truth.",
  "overall_past_clean": "They moved through the hushed woods with deliberate steps, each breath syncing with the rhythm of falling leaves, their mind sharpening with purpose as they carved space within themselves for what would come next.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the person is likely to begin speaking—perhaps sharing a personal story, reflection, or message related to nature, identity, or cultural heritage—given their confident posture, direct eye contact with the camera, and the thoughtful, tranquil atmosphere. The large hoop earrings and dark head covering may signal cultural or personal significance, suggesting the content of their speech could center on themes of belonging, resilience, or environmental awareness. The overcast sky and autumn setting reinforce a mood of introspection, making it plausible that they are delivering a meaningful statement or participating in a documentary-style interview, inviting viewers to reflect on deeper connections between self, culture, and the natural world.",
  "overall_future_clean": "The camera holds steady as a quiet breath escapes, then a voice emerges—clear, steady, and charged with purpose—beginning to unfold a story that weaves memory, land, and identity into a tapestry of truth that settles over the viewer like dusk.",
  "future_scene_ok": true
}