{
  "video_path": "./ref_datasets/part2/10210559001.mp4",
  "start_time": 0.0,
  "end_time": 6.08,
  "image_path": "./000341.jpg",
  "represents_multiple_types": true,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/10210559001.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/person_-3503444475010878883_1_10210559001.mp4_0.00_6.08.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/10210559001.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/face_-3503444475010878883_1_10210559001.mp4_0.00_6.08.jpg",
      "type": "face"
    }
  ],
  "cross_video_duplicate": false,
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a light-colored, possibly white or cream, long-sleeved top with a subtle pattern on the shoulders.",
        "clothing": {
          "vague": false,
          "clothing": [
            {
              "possible_names": [
                "shirt",
                "blouse",
                "top"
              ],
              "name": "shirt",
              "type": "top",
              "color": [
                "white"
              ],
              "belonging_confident": true,
              "existence_confident": true
            }
          ]
        },
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "hand gesture"
            ],
            "name": "hand gesture",
            "position": "hand"
          }
        ],
        "description": "The person appears to be an adult female with a neutral expression. She has light-colored hair and is wearing a light-colored, long-sleeved top with a subtle pattern on the shoulders. Her hand is extended forward, making a gesture as if she is pointing or reaching out. The background is plain and does not distract from the subject.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a calm and composed expression, with no strong emotions displayed.",
        "meaningful": false,
        "story": "unknown",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is extending their hand forward with an open palm facing towards the camera, suggesting a gesture of offering, greeting, or stopping. Their expression appears neutral to slightly serious, which could indicate they are focused on the interaction or the object they might be presenting. The simplicity of the background and their attire suggests a controlled environment, possibly for a professional or artistic purpose, where the emphasis is on the gesture and its meaning rather than the surroundings. The directness of the gesture implies a strong engagement with the viewer or another individual not visible in the frame, aiming to convey a clear message or initiate a connection.",
        "intention": "They are deliberately initiating a meaningful connection or conveying a clear message through a direct and intentional gesture",
        "intention_ok": true
      },
      "hoi": [
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "right hand",
            "action": [
              "pointing",
              "reaching out"
            ]
          },
          "object": 0,
          "deleted": true
        }
      ],
      "facex_detailing": {
        "landmarks": [
          [
            0.4366616376542619,
            0.3170261116570266
          ],
          [
            0.439174805085973,
            0.37621600586901266
          ],
          [
            0.444880988224343,
            0.4285159817448369
          ],
          [
            0.4512835002803643,
            0.4812974866735872
          ],
          [
            0.4618867710066427,
            0.5273554880152304
          ],
          [
            0.4791540768928826,
            0.5627879440469086
          ],
          [
            0.5009085160979468,
            0.5770303963353394
          ],
          [
            0.5232067202949631,
            0.5876937215290372
          ],
          [
            0.5450963218463585,
            0.5867204666137695
          ],
          [
            0.567262460976573,
            0.5792455004636573
          ],
          [
            0.5852337015260543,
            0.5549703275085126
          ],
          [
            0.6042816224175372,
            0.524377737726484
          ],
          [
            0.6162340241218252,
            0.47231616513438957
          ],
          [
            0.6212440478681986,
            0.42341287804659083
          ],
          [
            0.6207925048324147,
            0.3689672726171988
          ],
          [
            0.6223679571412504,
            0.31700715123030243
          ],
          [
            0.623442438231515,
            0.2592131391404167
          ],
          [
            0.46439056870959966,
            0.252834212527704
          ],
          [
            0.47766027180477977,
            0.22634929229342748
          ],
          [
            0.493060238858951,
            0.2201695088986997
          ],
          [
            0.5098370841172125,
            0.21570051047537062
          ],
          [
            0.5263398109735655,
            0.22739216275316068
          ],
          [
            0.5549320078987097,
            0.22159865987363947
          ],
          [
            0.5691908015536943,
            0.20097258198198187
          ],
          [
            0.5821670649041022,
            0.19236712094652592
          ],
          [
            0.5963074838343476,
            0.19373764026732673
          ],
          [
            0.608043405859332,
            0.21259595792760294
          ],
          [
            0.5411452653019556,
            0.2616447727516215
          ],
          [
            0.5419969255370753,
            0.29738743264208395
          ],
          [
            0.543747465774816,
            0.3339073995433787
          ],
          [
            0.5436594773782417,
            0.3704307497178436
          ],
          [
            0.5276794485149107,
            0.4044122279636443
          ],
          [
            0.5361477772904826,
            0.4104036758185694
          ],
          [
            0.5441991737544802,
            0.4148345889237822
          ],
          [
            0.5524885017657652,
            0.40599245148361046
          ],
          [
            0.5586285468723093,
            0.39683101763800976
          ],
          [
            0.4838720583356917,
            0.2800220077630704
          ],
          [
            0.49306761551581857,
            0.26072221994400024
          ],
          [
            0.5065386463621897,
            0.2603987414370138
          ],
          [
            0.5168159696539598,
            0.278309131740893
          ],
          [
            0.5054298752719271,
            0.27836544914220374
          ],
          [
            0.49475131682785495,
            0.2795322084868396
          ],
          [
            0.5630392745203738,
            0.2683119589374179
          ],
          [
            0.573237608020593,
            0.24753133124775356
          ],
          [
            0.5834519410771983,
            0.24190687455197493
          ],
          [
            0.5922822117073727,
            0.25304125004975253
          ],
          [
            0.5851341120765677,
            0.2591995590578311
          ],
          [
            0.5746729130124939,
            0.2643533883586762
          ],
          [
            0.5081448057234021,
            0.4720066426292298
          ],
          [
            0.5230996808802176,
            0.45018861880378125
          ],
          [
            0.5367475315662367,
            0.43922375938879754
          ],
          [
            0.5462266914213875,
            0.44094039460338613
          ],
          [
            0.5533043875059644,
            0.4358634642823032
          ],
          [
            0.5661756090952882,
            0.4444622879936582
          ],
          [
            0.5786950878599393,
            0.46407469965162734
          ],
          [
            0.5664551523181477,
            0.47355026101309156
          ],
          [
            0.554608846183068,
            0.48429074363102986
          ],
          [
            0.5446157578511962,
            0.4876117081869216
          ],
          [
            0.5352970517373511,
            0.48461262448124154
          ],
          [
            0.521566903218627,
            0.48006428360308295
          ],
          [
            0.5129502165863025,
            0.4688874527260109
          ],
          [
            0.5361296059730063,
            0.4592904694496639
          ],
          [
            0.5451575435165847,
            0.46195644171780376
          ],
          [
            0.5536624165251851,
            0.45967028885291367
          ],
          [
            0.5722940557170659,
            0.46225590838326347
          ],
          [
            0.5547729836710329,
            0.46265565150629273
          ],
          [
            0.5446011878084391,
            0.4625270401359235
          ],
          [
            0.5345924756256863,
            0.4592635442340185
          ]
        ],
        "visibility": [
          1.0,
          0.9506139159202576,
          4.788586920767557e-06,
          5.948015703967835e-16,
          0.9999948740005493,
          0.9998793601989746,
          1.3382641839143616e-07,
          9.883106139030318e-11,
          0.9999352693557739,
          4.828851274396584e-07,
          2.4798149492378683e-15,
          5.225572832925169e-15,
          3.289069994139027e-08,
          6.143180408813009e-10,
          2.266560853933508e-12,
          1.563476453338153e-13,
          9.613578650594784e-14,
          1.712694520710975e-13,
          1.810184019973692e-17,
          1.690335154833078e-12,
          2.6372702280092775e-25,
          7.352537046345369e-21,
          0.00010974420001730323,
          7.667014142498374e-05,
          9.040226541553922e-20,
          9.30314732097058e-18,
          9.574255832589529e-10,
          2.193865531949224e-12,
          1.688639339469944e-09
        ],
        "headpose": {
          "pitch": -3.8404108915098925,
          "yaw": -5.341469185685725,
          "roll": -3.941160877522635
        },
        "attributes": {
          "5 oClock Shadow": 2.8689462851616554e-05,
          "Arched Eyebrows": 0.042942486703395844,
          "Attractive": 0.12970413267612457,
          "Bags Under Eyes": 0.3649227023124695,
          "Bald": 0.00015361071564257145,
          "Bangs": 0.000496710417792201,
          "Big Lips": 0.4330592155456543,
          "Big Nose": 0.15089789032936096,
          "Black Hair": 9.781851258594543e-05,
          "Blond Hair": 0.8397710919380188,
          "Blurry": 9.751294419402257e-05,
          "Brown Hair": 0.0034222761169075966,
          "Bushy Eyebrows": 0.0032495264895260334,
          "Chubby": 0.04546814784407616,
          "Double Chin": 0.006221628747880459,
          "Eyeglasses": 0.0035723077598959208,
          "Goatee": 2.107976979459636e-05,
          "Gray Hair": 0.05442715436220169,
          "Heavy Makeup": 0.06153881549835205,
          "High Cheekbones": 0.06467660516500473,
          "Male": 0.009892416186630726,
          "Mouth Slightly Open": 0.6429247856140137,
          "Mustache": 6.707085958623793e-06,
          "Narrow Eyes": 0.1281699538230896,
          "No Beard": 0.999904990196228,
          "Oval Face": 0.19421473145484924,
          "Pale Skin": 0.1917758733034134,
          "Pointy Nose": 0.03683244436979294,
          "Receding Hairline": 0.10334691405296326,
          "Rosy Cheeks": 0.001687310403212905,
          "Sideburns": 1.6516972891622572e-06,
          "Smiling": 0.002955816453322768,
          "Straight Hair": 0.8337172865867615,
          "Wavy Hair": 0.018651457503437996,
          "Wearing Earrings": 0.005340012721717358,
          "Wearing Hat": 0.00011283502681180835,
          "Wearing Lipstick": 0.3972689211368561,
          "Wearing Necklace": 0.015008620917797089,
          "Wearing Necktie": 0.0019200543174520135,
          "Young": 0.904328465461731
        },
        "age": [
          0.09988658130168915,
          0.9613825678825378,
          0.6563834547996521,
          0.5052388310432434,
          0.2939544916152954,
          0.006485344376415014,
          0.000854475365485996,
          4.956524207955226e-06
        ],
        "race": [
          0.9996787309646606,
          0.0011019249213859439,
          0.5393704771995544,
          0.01060138363391161,
          0.01250634714961052
        ],
        "gender": [
          0.004298756830394268,
          0.9967237114906311
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 15.170368552207947,
          "disgust": 0.01171757685369812,
          "fear": 21.447855234146118,
          "happy": 2.3113982751965523,
          "sad": 54.572099447250366,
          "surprise": 0.07345677586272359,
          "neutral": 6.413105875253677
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 1101,
          "h": 1489,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 55,
        "gender": {
          "Woman": 91.41175150871277,
          "Man": 8.588247001171112
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 0.1862973684016027,
          "indian": 4.49951489053054e-07,
          "black": 2.1227446087812942e-09,
          "white": 99.81318118415103,
          "middle eastern": 0.0002372228154006108,
          "latino hispanic": 0.00027553491134775694
        },
        "dominant_race": "white"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.297567754983902,
        0.005838586017489433,
        0.7794028520584106,
        0.9879257082939148
      ]
    ],
    "face_boxes": [
      [
        0.44538000226020813,
        0.07329701632261276,
        0.6246312856674194,
        0.566670835018158
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.5437434969743092,
            0.7895253682950868
          ],
          [
            0.3558796583016714,
            0.7627895278767797
          ],
          [
            0.40493299395508237,
            0.9806371164703933
          ],
          [
            0.46964164949787984,
            0.8776546200443215
          ],
          [
            0.7316073356469471,
            0.8162612087133938
          ],
          [
            0.7472626555363338,
            0.9964805774590197
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.4967775373061498,
            0.28748569821798675
          ],
          [
            0.5781852007309597,
            0.2716422372293604
          ],
          [
            0.4383310097191069,
            0.3389769464310226
          ],
          [
            0.6272385363843707,
            0.31125088970092635
          ]
        ],
        "dw_hand_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_hand_2": [
          [
            0.4999086012840271,
            0.8895372157857911
          ],
          [
            0.46233583354949953,
            0.7608090952532013
          ],
          [
            0.4477242016527388,
            0.6954548186751174
          ],
          [
            0.450855265630616,
            0.6914939534279607
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.47486008946100866,
            0.8301242370784421
          ],
          [
            0.4633795215421253,
            0.85586986118496
          ],
          [
            0.5771415127383338,
            0.6043549179905153
          ],
          [
            0.5980152725908491,
            0.5726679960132626
          ],
          [
            0.5280881770849228,
            0.8538894285613817
          ],
          [
            0.5562677528858185,
            0.7528873647588883
          ],
          [
            0.5802725767162111,
            0.6281201094734551
          ],
          [
            0.603233712553978,
            0.574648428636841
          ],
          [
            0.5562677528858185,
            0.8538894285613817
          ],
          [
            0.5729667607678307,
            0.7806134214889844
          ],
          [
            0.58549101667934,
            0.6914939534279607
          ],
          [
            0.6011463365687264,
            0.6162375137319852
          ],
          [
            0.576097824745708,
            0.8479481306906469
          ],
          [
            0.58549101667934,
            0.8083394782190807
          ],
          [
            0.589665768649843,
            0.7548677973824665
          ],
          [
            0.5980152725908491,
            0.6974352512986958
          ]
        ],
        "dw_face": [
          [
            0.4404183857043585,
            0.29936829395945647
          ],
          [
            0.4425057616896099,
            0.34491824430175766
          ],
          [
            0.4477242016527388,
            0.3904681946440585
          ],
          [
            0.4539863296084934,
            0.4360181449863595
          ],
          [
            0.4644232095347511,
            0.47760723008150385
          ],
          [
            0.48007852942413753,
            0.51721588255307
          ],
          [
            0.49782122529877554,
            0.5469223719067444
          ],
          [
            0.5218260491291682,
            0.5687071307661059
          ],
          [
            0.5468745609521866,
            0.574648428636841
          ],
          [
            0.5719230727752049,
            0.5627658328953711
          ],
          [
            0.5917531446350945,
            0.5350397761652748
          ],
          [
            0.607408464524481,
            0.4974115563172869
          ],
          [
            0.6168016564581129,
            0.4518616059749861
          ],
          [
            0.6230637844138676,
            0.4063116556326849
          ],
          [
            0.6241074724064933,
            0.3587812726668057
          ],
          [
            0.6251511603991191,
            0.31125088970092635
          ],
          [
            0.6230637844138676,
            0.263720506735047
          ],
          [
            0.4644232095347511,
            0.27560310247651687
          ],
          [
            0.47694746544626027,
            0.2617400741114688
          ],
          [
            0.491559097343021,
            0.255798776240734
          ],
          [
            0.5061707292397817,
            0.255798776240734
          ],
          [
            0.5207823611365425,
            0.25777920886431216
          ],
          [
            0.5541803769005669,
            0.24985747836999894
          ],
          [
            0.567748320804702,
            0.24193574787568575
          ],
          [
            0.5813162647088368,
            0.2359944500049509
          ],
          [
            0.5948842086129719,
            0.2359944500049509
          ],
          [
            0.6084521525171068,
            0.24589661312284222
          ],
          [
            0.5395687450038062,
            0.2815444003472517
          ],
          [
            0.5416561209890577,
            0.31125088970092635
          ],
          [
            0.5437434969743092,
            0.340957379054601
          ],
          [
            0.5458308729595608,
            0.3706638684082754
          ],
          [
            0.5260008010996712,
            0.40037035776195
          ],
          [
            0.5353939930333032,
            0.4023507903855284
          ],
          [
            0.5458308729595608,
            0.4023507903855284
          ],
          [
            0.5552240648931926,
            0.3983899251383719
          ],
          [
            0.5646172568268246,
            0.3944290598912152
          ],
          [
            0.48007852942413753,
            0.29342699608872164
          ],
          [
            0.491559097343021,
            0.2795639677236736
          ],
          [
            0.5051270412471559,
            0.2775835351000952
          ],
          [
            0.5166076091660393,
            0.28946613084156514
          ],
          [
            0.5051270412471559,
            0.2973878613358783
          ],
          [
            0.491559097343021,
            0.29936829395945647
          ],
          [
            0.5593988168636959,
            0.2815444003472517
          ],
          [
            0.5687920087973277,
            0.2657009393586253
          ],
          [
            0.5823599527014626,
            0.2617400741114688
          ],
          [
            0.5948842086129719,
            0.27362266985293876
          ],
          [
            0.5834036406940883,
            0.2835248329708301
          ],
          [
            0.5719230727752049,
            0.2835248329708301
          ],
          [
            0.5145202331807879,
            0.46572463434003414
          ],
          [
            0.527044489092297,
            0.44988117335140776
          ],
          [
            0.5395687450038062,
            0.4399790102335162
          ],
          [
            0.5479182489448123,
            0.4399790102335162
          ],
          [
            0.5541803769005669,
            0.4379985776099379
          ],
          [
            0.5667046328120762,
            0.4439398754806727
          ],
          [
            0.5781852007309597,
            0.457802903845721
          ],
          [
            0.5698356967899534,
            0.47364636483434736
          ],
          [
            0.5604425048563215,
            0.48552896057581724
          ],
          [
            0.5489619369374382,
            0.48948982582297373
          ],
          [
            0.5353939930333032,
            0.48948982582297373
          ],
          [
            0.5249571131070455,
            0.4795876627050822
          ],
          [
            0.5186949851512909,
            0.46572463434003414
          ],
          [
            0.5333066170480516,
            0.4597833364692991
          ],
          [
            0.5479182489448123,
            0.457802903845721
          ],
          [
            0.5614861928489473,
            0.4558224712221426
          ],
          [
            0.5740104487604565,
            0.457802903845721
          ],
          [
            0.5614861928489473,
            0.4617637690928774
          ],
          [
            0.5479182489448123,
            0.46572463434003414
          ],
          [
            0.5333066170480516,
            0.46572463434003414
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "000341",
  "objects": [
    {
      "box": [
        0.3701774477958679,
        0.5155532956123352,
        0.6179421544075012,
        0.9227165579795837
      ],
      "name": "hand gesture",
      "possible_names": [
        "hand gesture"
      ],
      "deleted": true
    }
  ],
  "mask_file": "./person_labeling/./000341.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A minimalist scene with a neutral background and soft lighting highlights a person wearing a light-colored top extending their hand forward creating an intimate and focused atmosphere",
  "overall_past": "Before this scene, the person likely paused their movement or activity—perhaps after walking toward the camera or approaching a specific object or individual—just long enough to prepare the gesture of extending their hand. The neutral expression and focused posture suggest a moment of deliberate intention: they may have been in conversation, preparing to present something meaningful, or responding to a cue that required a clear, open gesture. The controlled environment implies this was not spontaneous, so prior to this moment, they likely rehearsed or mentally prepared for the interaction, possibly to initiate a connection, offer an item, or signal a pause in a process—such as a performance, a presentation, or a personal moment of exchange.",
  "overall_past_clean": "They halted their motion with deliberate precision, drawing a breath to center themselves, their body aligning into a poised stance as thoughts crystallized into purpose, every muscle tensing in anticipation of the gesture to come.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the person may gently place an object—such as a document, a small gift, or a symbolic item—into the viewer’s hand, completing the gesture of offering and deepening the sense of connection or exchange. This next action would naturally follow the open-palm gesture, maintaining the intimate and intentional atmosphere, and could signify a pivotal moment of trust, introduction, or transition in the narrative.",
  "overall_future_clean": "The moment the gesture is complete, a quiet stillness settles, as if time itself holds its breath, before the recipient slowly closes their fingers around the offering, their eyes meeting yours with a newfound understanding that shifts the course of everything.",
  "future_scene_ok": true
}