{
  "video_path": "./ref_datasets/part2/6323280000.mp4",
  "start_time": 0.0,
  "end_time": 6.066666666666666,
  "image_path": "./004203.jpg",
  "represents_multiple_types": true,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/6323280000.mp4",
      "start_time": 0.0,
      "end_time": 6.066666666666666,
      "image_path": "./ref_datasets/extracted_frames/person_7953131171088026259_1_6323280000.mp4_0.00_6.07.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/6323280000.mp4",
      "start_time": 0.0,
      "end_time": 6.066666666666666,
      "image_path": "./ref_datasets/extracted_frames/face_7953131171088026259_1_6323280000.mp4_0.00_6.07.jpg",
      "type": "face"
    }
  ],
  "cross_video_duplicate": false,
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "male",
        "emotion": "neutral",
        "clothing_description": "The person is dressed in an all-white outfit consisting of a loose-fitting hoodie and matching sweatpants. The hoodie has a drawstring at the neck and the sweatpants have a relaxed fit with a visible elastic waistband. He is also wearing white sneakers with thick soles.",
        "clothing": [
          {
            "possible_names": [
              "hoodie",
              "sweatshirt"
            ],
            "name": "hoodie",
            "type": "top",
            "color": [
              "white"
            ]
          },
          {
            "possible_names": [
              "sweatpants",
              "track pants"
            ],
            "name": "sweatpants",
            "type": "bottom",
            "color": [
              "white"
            ]
          },
          {
            "possible_names": [
              "sneakers",
              "athletic shoes"
            ],
            "name": "sneakers",
            "type": "footwear",
            "color": [
              "white"
            ]
          }
        ],
        "objects": [],
        "description": "A male adult is seated on a chair, wearing an all-white outfit that includes a loose-fitting hoodie and matching sweatpants, paired with white sneakers. His hair is styled in a curly fashion on top with a shaved side. He appears to be in a neutral emotional state, sitting with his hands clasped together. The setting features a wooden wall and floor, suggesting an indoor environment.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears calm and composed, with a neutral expression that does not convey strong emotions.",
        "meaningful": false,
        "story": "unknown",
        "race": "black",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is seated on a chair with hands clasped together, wearing an all-white outfit consisting of a hoodie, pants, and chunky sneakers, suggesting a casual yet stylish appearance. Their posture and direct gaze towards the camera indicate confidence and engagement, possibly for a photoshoot or interview setting. The wooden background and the chair's design contribute to a modern and minimalist aesthetic, enhancing the focus on the individual's attire and demeanor. The person's expression appears calm and composed, hinting at a relaxed state despite the formal setting, which could be motivated by comfort in the environment or familiarity with the situation.",
        "intention": "They are confidently showcasing their personal style and composure to make a strong visual impact in a professional yet relaxed setting",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.3566378517046807,
            0.28799034693344894
          ],
          [
            0.3710242105066461,
            0.3013888648212222
          ],
          [
            0.38535731179373606,
            0.3124633503612131
          ],
          [
            0.39797185703560156,
            0.32271454227156937
          ],
          [
            0.4114011835326593,
            0.33183291785618557
          ],
          [
            0.432109897619202,
            0.3409585413755849
          ],
          [
            0.45016447554820427,
            0.3490091885240483
          ],
          [
            0.46966740183098604,
            0.3557709519352232
          ],
          [
            0.4858714411498377,
            0.3568658493625532
          ],
          [
            0.5128305888049817,
            0.35019520899680046
          ],
          [
            0.5328672646845459,
            0.33571260099831435
          ],
          [
            0.5527659058886231,
            0.3186436715269727
          ],
          [
            0.5683128891483186,
            0.2997277960447329
          ],
          [
            0.5722515857724286,
            0.27778593649522265
          ],
          [
            0.566214012973523,
            0.25683196328048197
          ],
          [
            0.550935565668439,
            0.23694530228385702
          ],
          [
            0.5370228003887902,
            0.2160199978804615
          ],
          [
            0.3428594125957085,
            0.2793486414676798
          ],
          [
            0.3437227588639688,
            0.2736972760176286
          ],
          [
            0.3562989176423461,
            0.2722861389962158
          ],
          [
            0.36933110083537124,
            0.27226735895133714
          ],
          [
            0.3808245560794911,
            0.2702032619438666
          ],
          [
            0.406084319759929,
            0.2620898017526737
          ],
          [
            0.41880119010884925,
            0.252748771046754
          ],
          [
            0.43798023325110236,
            0.2464218478417024
          ],
          [
            0.4573144093392387,
            0.24138279653353883
          ],
          [
            0.4828679648972063,
            0.24051233391842938
          ],
          [
            0.40493525462175806,
            0.28098325887029724
          ],
          [
            0.4095665264224249,
            0.29162159096449614
          ],
          [
            0.41554678404141987,
            0.30188400640950674
          ],
          [
            0.4191434940963826,
            0.31438603370250867
          ],
          [
            0.4176352912156039,
            0.32097116279016646
          ],
          [
            0.42770866950352987,
            0.3209262686515493
          ],
          [
            0.43731112587388865,
            0.32006552975092617
          ],
          [
            0.44379799381765744,
            0.31421285829440293
          ],
          [
            0.4529121125816668,
            0.31061395009913084
          ],
          [
            0.3667316452851371,
            0.28906644278738114
          ],
          [
            0.37228359969520064,
            0.2851718834385143
          ],
          [
            0.3863596873150931,
            0.28265210661837564
          ],
          [
            0.3977494525530982,
            0.28477363453878624
          ],
          [
            0.3877657237980101,
            0.2876856035685965
          ],
          [
            0.3760441135082926,
            0.2893624599258016
          ],
          [
            0.4382760354450771,
            0.2725432110434797
          ],
          [
            0.44512219984064655,
            0.2660705397637295
          ],
          [
            0.45753439086139513,
            0.2616211689476456
          ],
          [
            0.4735941423625542,
            0.2582675136426198
          ],
          [
            0.46410813621743013,
            0.2651558503940967
          ],
          [
            0.450151831715826,
            0.2696116080041975
          ],
          [
            0.431710119742565,
            0.33512088247308774
          ],
          [
            0.4313869878255501,
            0.32917275356261855
          ],
          [
            0.4371632618090463,
            0.3269968517789883
          ],
          [
            0.44504373401561115,
            0.32514189715896336
          ],
          [
            0.4526571832952045,
            0.3228865694919867
          ],
          [
            0.4699516605763208,
            0.3220375708104777
          ],
          [
            0.48946916694363596,
            0.32086801247870816
          ],
          [
            0.4759010333863516,
            0.3295695241706978
          ],
          [
            0.46396798541936923,
            0.33684703913916436
          ],
          [
            0.45521366039596534,
            0.33963249941423
          ],
          [
            0.44588089326702096,
            0.3412532668028559
          ],
          [
            0.4380001988675859,
            0.3394067226576486
          ],
          [
            0.4324290618063911,
            0.33562551096214777
          ],
          [
            0.4418784378697633,
            0.3326184648155634
          ],
          [
            0.45066107661320415,
            0.3315659068092438
          ],
          [
            0.459153510306878,
            0.3294949780850272
          ],
          [
            0.48419344059373964,
            0.32202095079368775
          ],
          [
            0.4578391654150826,
            0.3279394277571035
          ],
          [
            0.4473020600263404,
            0.32998314443310456
          ],
          [
            0.43878652885477376,
            0.3320278514209869
          ]
        ],
        "visibility": [
          1.0,
          0.0007314489921554923,
          8.157794439966892e-08,
          1.871305421730085e-08,
          0.9997881054878235,
          0.9999990463256836,
          0.0008668896043673158,
          0.00016756101103965193,
          0.9999843835830688,
          0.0017386332619935274,
          5.581657965686437e-12,
          3.8693866870104145e-15,
          0.9997754693031311,
          6.466051999387545e-11,
          0.9922904372215271,
          1.1624074099103598e-12,
          9.643642551182552e-10,
          3.462704256662619e-08,
          1.5371605897873675e-12,
          8.71809788804967e-08,
          1.830368073885861e-26,
          3.588595456177733e-20,
          7.875167398196936e-07,
          0.0008389129652641714,
          1.090842172146722e-08,
          1.0318877002868376e-10,
          2.3360450726594983e-11,
          2.669050961148778e-13,
          0.0008833711035549641
        ],
        "headpose": {
          "pitch": -21.616496873958177,
          "yaw": 19.669582186897305,
          "roll": -30.67923241193256
        },
        "attributes": {
          "5 oClock Shadow": 0.07615037262439728,
          "Arched Eyebrows": 0.013127324171364307,
          "Attractive": 0.3044450283050537,
          "Bags Under Eyes": 0.3551853895187378,
          "Bald": 7.487853963539237e-07,
          "Bangs": 0.04699287191033363,
          "Big Lips": 0.4495588541030884,
          "Big Nose": 0.39428526163101196,
          "Black Hair": 0.4273706078529358,
          "Blond Hair": 0.0005232991534285247,
          "Blurry": 0.00033082443405874074,
          "Brown Hair": 0.11583541333675385,
          "Bushy Eyebrows": 0.04015641286969185,
          "Chubby": 0.016074953600764275,
          "Double Chin": 0.0031306424643844366,
          "Eyeglasses": 0.00043595460010692477,
          "Goatee": 0.0007166034774854779,
          "Gray Hair": 0.000822177913505584,
          "Heavy Makeup": 0.005429358221590519,
          "High Cheekbones": 0.24677982926368713,
          "Male": 0.9848767518997192,
          "Mouth Slightly Open": 0.033074233680963516,
          "Mustache": 0.000691091874614358,
          "Narrow Eyes": 0.04994624853134155,
          "No Beard": 0.9838336110115051,
          "Oval Face": 0.14279596507549286,
          "Pale Skin": 0.0008697754237800837,
          "Pointy Nose": 0.028136668726801872,
          "Receding Hairline": 0.004015074577182531,
          "Rosy Cheeks": 0.001308348379097879,
          "Sideburns": 0.00016100342327263206,
          "Smiling": 0.025684701278805733,
          "Straight Hair": 0.005675857421010733,
          "Wavy Hair": 0.8139327764511108,
          "Wearing Earrings": 0.021093325689435005,
          "Wearing Hat": 0.00047160012763924897,
          "Wearing Lipstick": 0.014913402497768402,
          "Wearing Necklace": 0.0031066490337252617,
          "Wearing Necktie": 0.020200343802571297,
          "Young": 0.9771472811698914
        },
        "age": [
          0.008610698394477367,
          0.9576654434204102,
          0.9900553226470947,
          0.7422258257865906,
          0.09864430874586105,
          0.00019852444529533386,
          6.290670171438251e-06,
          3.9527904505121114e-08
        ],
        "race": [
          0.17674638330936432,
          0.9444612860679626,
          0.13911402225494385,
          0.14051951467990875,
          0.7709925174713135
        ],
        "gender": [
          0.9281522035598755,
          0.08358155190944672
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 3.2468426525156246e-05,
          "disgust": 4.206501119652373e-09,
          "fear": 0.04103119135834277,
          "happy": 0.0007558784545835806,
          "sad": 99.95144605636597,
          "surprise": 2.137826998760417e-08,
          "neutral": 0.006739262607879937
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 670,
          "h": 862,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 26,
        "gender": {
          "Woman": 1.4373733662068844,
          "Man": 98.56262803077698
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 0.03598826006054878,
          "indian": 1.1696058325469494,
          "black": 98.62428903579712,
          "white": 0.007392458792310208,
          "middle eastern": 0.003773456046474166,
          "latino hispanic": 0.15895245596766472
        },
        "dominant_race": "black"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.03294781967997551,
        0.1434187889099121,
        0.9153922200202942,
        0.9594743847846985
      ]
    ],
    "face_boxes": [
      [
        0.3444339632987976,
        0.21596065163612366,
        0.551758348941803,
        0.3563649356365204
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.5423804828066527,
            0.35100049516558646
          ],
          [
            0.34407421440395053,
            0.35496913073956965
          ],
          [
            0.22107412387569217,
            0.5123916751742363
          ],
          [
            0.3089313313958767,
            0.5573695450127125
          ],
          [
            0.7406867512093549,
            0.34703185959160326
          ],
          [
            0.7934010757214657,
            0.5388492456674576
          ],
          [
            0.5298294531609121,
            0.5613381805866957
          ],
          [
            0.3867477151994687,
            0.5944101437032223
          ],
          [
            0.10560465113487823,
            0.587795751079917
          ],
          [
            0.2838292721043954,
            0.8523714560121298
          ],
          [
            0.6628703674057629,
            0.5957330222278834
          ],
          [
            0.798421487579762,
            0.6155762000977993
          ],
          [
            0.7005234563429849,
            0.8841205406039954
          ],
          [
            0.38172730334117244,
            0.28485656893253325
          ],
          [
            0.4570334812156163,
            0.2676591481119394
          ],
          [
            0.3591354499788393,
            0.28485656893253325
          ],
          [
            0.5574417183815416,
            0.24252445614337922
          ]
        ],
        "dw_hand_1": [
          [
            0.5248090413026159,
            0.5626610591113568
          ],
          [
            0.489666158294542,
            0.5507551523894072
          ],
          [
            0.4495028634281719,
            0.5375263671427966
          ],
          [
            0.41184977449095,
            0.5362034886181355
          ],
          [
            0.3867477151994687,
            0.5401721241921187
          ],
          [
            0.4193803922783944,
            0.5626610591113568
          ],
          [
            0.37670689148287617,
            0.56662969468534
          ],
          [
            0.34407421440395053,
            0.56662969468534
          ],
          [
            0.31897215511246924,
            0.5653068161606789
          ],
          [
            0.4168701863492463,
            0.5798584799319506
          ],
          [
            0.3666660677662837,
            0.587795751079917
          ],
          [
            0.3290129788290617,
            0.587795751079917
          ],
          [
            0.2988905076792842,
            0.587795751079917
          ],
          [
            0.4168701863492463,
            0.5930872651785613
          ],
          [
            0.37168647962457996,
            0.6010245363265276
          ],
          [
            0.334033390687358,
            0.6036702933758498
          ],
          [
            0.3039109195375804,
            0.6036702933758498
          ],
          [
            0.4193803922783944,
            0.6023474148511887
          ],
          [
            0.3867477151994687,
            0.607638928949833
          ],
          [
            0.35662524404969115,
            0.6102846859991551
          ],
          [
            0.3290129788290617,
            0.6116075645238161
          ]
        ],
        "dw_hand_2": [
          [
            0.31395174325417297,
            0.5613381805866957
          ],
          [
            0.34658442033309866,
            0.5520780309140683
          ],
          [
            0.38172730334117244,
            0.5401721241921187
          ],
          [
            0.4043191567035056,
            0.5401721241921187
          ],
          [
            0.41435998042009814,
            0.5454636382907629
          ],
          [
            0.34407421440395053,
            0.5520780309140683
          ],
          [
            0.36415586183713555,
            0.5560466664880515
          ],
          [
            0.38925792112861685,
            0.5626610591113568
          ],
          [
            0.41184977449095,
            0.56662969468534
          ],
          [
            0.334033390687358,
            0.5719212087839842
          ],
          [
            0.36415586183713555,
            0.5785356014072895
          ],
          [
            0.391768127057765,
            0.5825042369812727
          ],
          [
            0.4168701863492463,
            0.5825042369812727
          ],
          [
            0.3290129788290617,
            0.587795751079917
          ],
          [
            0.3591354499788393,
            0.5957330222278834
          ],
          [
            0.3867477151994687,
            0.5983787792772055
          ],
          [
            0.4043191567035056,
            0.5970559007525444
          ],
          [
            0.3265027728999136,
            0.5983787792772055
          ],
          [
            0.3516048321913949,
            0.6049931719005108
          ],
          [
            0.3691762736954318,
            0.607638928949833
          ],
          [
            0.3867477151994687,
            0.607638928949833
          ]
        ],
        "dw_face": [
          [
            0.3591354499788393,
            0.2835336904078722
          ],
          [
            0.37168647962457996,
            0.2980853541791439
          ],
          [
            0.3842375092703206,
            0.31131413942575453
          ],
          [
            0.40180895077435747,
            0.3232200461477041
          ],
          [
            0.42189059820754254,
            0.3338030743449926
          ],
          [
            0.4444824515698757,
            0.34306322401762007
          ],
          [
            0.46707430493220886,
            0.3523233736902475
          ],
          [
            0.4946865701528383,
            0.3536462522149086
          ],
          [
            0.5197886294443196,
            0.34703185959160326
          ],
          [
            0.5373600709483565,
            0.33644883139431475
          ],
          [
            0.5524213065232453,
            0.3232200461477041
          ],
          [
            0.5624621302398377,
            0.3086683823764324
          ],
          [
            0.567482542098134,
            0.2941167186051607
          ],
          [
            0.5649723361689859,
            0.27824217630922793
          ],
          [
            0.5574417183815416,
            0.2636905125379562
          ],
          [
            0.5499111005940971,
            0.24913884876668455
          ],
          [
            0.5398702768775046,
            0.23458718499541284
          ],
          [
            0.354115038120543,
            0.2822108118832111
          ],
          [
            0.3591354499788393,
            0.27824217630922793
          ],
          [
            0.3691762736954318,
            0.27824217630922793
          ],
          [
            0.37670689148287617,
            0.27691929778456686
          ],
          [
            0.3867477151994687,
            0.27691929778456686
          ],
          [
            0.4193803922783944,
            0.2676591481119394
          ],
          [
            0.43444162785328316,
            0.26236763401329516
          ],
          [
            0.4495028634281719,
            0.2570761199146509
          ],
          [
            0.4645640990030607,
            0.25178460581600665
          ],
          [
            0.4821355405070976,
            0.24913884876668455
          ],
          [
            0.41184977449095,
            0.28088793335855006
          ],
          [
            0.41435998042009814,
            0.29147096155583857
          ],
          [
            0.4193803922783944,
            0.3020539897531271
          ],
          [
            0.4244008041366906,
            0.3126370179504156
          ],
          [
            0.4193803922783944,
            0.3192514105737209
          ],
          [
            0.4294212159949869,
            0.320574289098382
          ],
          [
            0.4369518337824313,
            0.3192514105737209
          ],
          [
            0.4495028634281719,
            0.3152827749997377
          ],
          [
            0.45954368714476446,
            0.31131413942575453
          ],
          [
            0.37168647962457996,
            0.28882520450651644
          ],
          [
            0.37670689148287617,
            0.2835336904078722
          ],
          [
            0.38925792112861685,
            0.2822108118832111
          ],
          [
            0.39929874484520933,
            0.28485656893253325
          ],
          [
            0.391768127057765,
            0.28882520450651644
          ],
          [
            0.38172730334117244,
            0.2901480830311775
          ],
          [
            0.44197224564072757,
            0.27427354073524474
          ],
          [
            0.4495028634281719,
            0.2676591481119394
          ],
          [
            0.4620538930739126,
            0.2636905125379562
          ],
          [
            0.47711512864880135,
            0.26236763401329516
          ],
          [
            0.469584510861357,
            0.2689820266366005
          ],
          [
            0.4570334812156163,
            0.27295066221058367
          ],
          [
            0.43444162785328316,
            0.3351259528696537
          ],
          [
            0.4369518337824313,
            0.33248019582033156
          ],
          [
            0.44197224564072757,
            0.32983443877100943
          ],
          [
            0.4495028634281719,
            0.32851156024634837
          ],
          [
            0.4545232752864682,
            0.3271886817216873
          ],
          [
            0.4746049227196532,
            0.3245429246723652
          ],
          [
            0.4946865701528383,
            0.32189716762304305
          ],
          [
            0.48464574643624575,
            0.32851156024634837
          ],
          [
            0.4746049227196532,
            0.3351259528696537
          ],
          [
            0.4620538930739126,
            0.3390945884436369
          ],
          [
            0.45201306935732005,
            0.3390945884436369
          ],
          [
            0.44197224564072757,
            0.3377717099189758
          ],
          [
            0.4369518337824313,
            0.3351259528696537
          ],
          [
            0.4444824515698757,
            0.3338030743449926
          ],
          [
            0.45201306935732005,
            0.33248019582033156
          ],
          [
            0.47209471679050513,
            0.3271886817216873
          ],
          [
            0.489666158294542,
            0.3232200461477041
          ],
          [
            0.47209471679050513,
            0.32851156024634837
          ],
          [
            0.4545232752864682,
            0.33248019582033156
          ],
          [
            0.4444824515698757,
            0.3338030743449926
          ]
        ],
        "dw_foot_1": [
          [
            0.6955030444846886,
            0.9515873453617096
          ],
          [
            0.7708092223591325,
            0.9449729527384043
          ],
          [
            0.6427887199725779,
            0.8999950828999281
          ]
        ],
        "dw_foot_2": [
          [
            0.10560465113487823,
            0.8933806902766228
          ],
          [
            0.09305362148913758,
            0.8814747835546732
          ],
          [
            0.34658442033309866,
            0.8748603909313679
          ]
        ]
      }
    ]
  },
  "new_filename": "004203",
  "objects": [],
  "mask_file": "./person_labeling/./004203.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A person is seated on a modern wooden chair wearing an all-white outfit with sneakers against a backdrop of warm-toned wooden panels creating a minimalist and contemporary setting",
  "overall_past": "Before the current scene, the person likely arrived at the photography or filming location, removed any outer layers or accessories that didn’t align with the all-white aesthetic, and took a moment to compose themselves—perhaps adjusting their hoodie or sneakers, checking their posture in a mirror, or breathing deeply to center their focus. The calm, confident expression and poised posture suggest they had already gone through a brief preparation phase, possibly including a wardrobe check and mental readiness, indicating they were familiar with the setting or had been in similar situations before. This preparation helped them transition smoothly into the focused, engaged state captured in the image.",
  "overall_past_clean": "They stepped into the space with deliberate calm, shedding distractions and aligning their presence with purpose, their body and mind already synchronized in readiness.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the person is likely to begin speaking or sharing a personal story, possibly in the context of an interview or a creative presentation. The calm, composed expression combined with the direct gaze suggests readiness to communicate, while the minimalist, warm-toned setting enhances focus on the individual—ideal for a narrative-driven moment. Given the all-white outfit and modern aesthetic, this could be part of a brand feature, a personal manifesto, or a candid conversation about identity, lifestyle, or artistic vision. The next moment would likely involve the person opening their mouth to speak, delivering a thoughtful statement that aligns with the serene yet confident atmosphere.",
  "overall_future_clean": "The voice emerges, clear and steady, weaving a story that carries weight and authenticity, drawing listeners into a moment of connection and revelation.",
  "future_scene_ok": true
}