{
  "video_path": "./ref_datasets/part2/4718162001.mp4",
  "start_time": 0.0,
  "end_time": 5.36,
  "image_path": "./001315.jpg",
  "represents_multiple_types": true,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/4718162001.mp4",
      "start_time": 0.0,
      "end_time": 5.36,
      "image_path": "./ref_datasets/extracted_frames/person_3801147054497364452_1_4718162001.mp4_0.00_5.36.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/4718162001.mp4",
      "start_time": 0.0,
      "end_time": 5.36,
      "image_path": "./ref_datasets/extracted_frames/face_3801147054497364452_1_4718162001.mp4_0.00_5.36.jpg",
      "type": "face"
    }
  ],
  "cross_video_duplicate": false,
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "child",
        "gender": "female",
        "emotion": "complex",
        "clothing_description": "The person appears to be wearing a light blue top with a visible collar. The rest of the clothing is not fully visible in the image.",
        "clothing": {
          "vague": false,
          "clothing": [
            {
              "possible_names": [
                "earrings",
                "ear studs"
              ],
              "name": "earrings",
              "type": "accessory",
              "color": [
                "light blue"
              ],
              "belonging_confident": true,
              "existence_confident": true
            }
          ]
        },
        "objects": [],
        "description": "The person in the image is a child with blonde hair styled in braids. She has light blue eyes and is sticking her tongue out slightly. She is wearing a light blue top. The background is a solid light blue color. There are no other objects or people in the image.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The child appears to be making a playful expression by sticking out her tongue, which could indicate a sense of fun or mischief. However, the redness on her cheeks might suggest she is also feeling shy or embarrassed.",
        "meaningful": true,
        "story": "The child seems to be engaging in a playful moment, possibly posing for a photo in a lighthearted manner. The redness on her cheeks suggests she might be feeling shy or self-conscious despite her playful gesture.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "complex_emotion": "The person in the image appears to be expressing a playful and mischievous emotion. The act of sticking out the tongue suggests a sense of fun and perhaps a desire to engage in light-hearted behavior. This gesture often indicates a feeling of being carefree and enjoying the moment. The individual's eyes are wide open, which could imply curiosity or excitement. The overall expression seems to convey a sense of joy and spontaneity, as if the person is in a cheerful mood and wants to share their happiness with others.\n\nHowever, there might also be an underlying layer of rebellion or defiance in this expression. Sticking out the tongue can sometimes be seen as a way of challenging authority or norms, especially in certain cultural contexts. It may suggest that the person is feeling confident and unafraid to express themselves in unconventional ways. This could indicate a strong sense of self and a willingness to stand out from the crowd. The individual might be thinking about how they want to be perceived by others and using this gesture as a form of self-expression.\n\nAdditionally, the person's facial features, such as the slight blush on their cheeks, could hint at a sense of embarrassment or shyness. Despite the playful nature of the expression, there might be an element of vulnerability present. The individual might be feeling a mix of emotions, including excitement and nervousness. They could be trying to mask their true feelings with a playful demeanor, possibly as a way to cope with social anxiety or uncertainty. Overall, the emotion conveyed by the person in the image is multifaceted, combining elements of playfulness, confidence, and perhaps even a touch of vulnerability.",
        "complex_emotion_clean": "Playful joy mixed with confidence and defiance intertwined with underlying vulnerability and nervousness creates a complex emotional state of spontaneous self-expression and hidden uncertainty",
        "behaviour": "The person in the image is making a playful face by sticking out their tongue and looking directly at the camera with wide eyes, possibly to entertain or amuse someone watching them. Their hair is styled in two braids, suggesting they might be engaging in a casual or fun activity. The light blue background provides a simple setting that focuses attention on their expressive face, indicating that the intention behind this behavior could be to capture a moment of lightheartedness or to share a humorous expression with an audience. The overall appearance and action suggest a youthful and carefree attitude, likely aiming to evoke laughter or joy from viewers.",
        "intention": "The intention is to create a lighthearted moment and elicit amusement through an exaggerated expressive gesture",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.2909962998861114,
            0.29847288131713867
          ],
          [
            0.30268669338381315,
            0.38864609173366
          ],
          [
            0.3188429002558613,
            0.4811171804155623
          ],
          [
            0.3295163050061092,
            0.5718847002301898
          ],
          [
            0.3420385495202416,
            0.6639531680515834
          ],
          [
            0.36892626682778684,
            0.7514886174883161
          ],
          [
            0.4042916892295969,
            0.8300271034240723
          ],
          [
            0.4483441539840507,
            0.8925370488848005
          ],
          [
            0.5039906886273197,
            0.904872076851981
          ],
          [
            0.5611020683177881,
            0.8819300106593541
          ],
          [
            0.6098981355649553,
            0.8160725321088519
          ],
          [
            0.6526169237248334,
            0.7415390014648438
          ],
          [
            0.6820650046658037,
            0.6529344831194196
          ],
          [
            0.6970686703654272,
            0.5504424912588937
          ],
          [
            0.7016398847502257,
            0.44838268416268484
          ],
          [
            0.7081448744949219,
            0.34498551913670134
          ],
          [
            0.7142944427074066,
            0.2441034487315587
          ],
          [
            0.3091912395736602,
            0.19683895792279923
          ],
          [
            0.3274449244906594,
            0.13420861107962473
          ],
          [
            0.36355138263232745,
            0.11168667248317174
          ],
          [
            0.4061417874514258,
            0.11383392129625593
          ],
          [
            0.44693214354005506,
            0.13694857699530466
          ],
          [
            0.5274775986992088,
            0.11973433835165839
          ],
          [
            0.5661204272515274,
            0.08300670555659703
          ],
          [
            0.6065149467405198,
            0.07396401677812849
          ],
          [
            0.6477223062788002,
            0.09159695250647408
          ],
          [
            0.6769118875797306,
            0.1345059531075614
          ],
          [
            0.488817192996586,
            0.23286209787641252
          ],
          [
            0.48970937778774115,
            0.2984929765973772
          ],
          [
            0.4934213748534343,
            0.3611625943865095
          ],
          [
            0.4933159944734403,
            0.42682528495788574
          ],
          [
            0.4623341627552041,
            0.4951294830867222
          ],
          [
            0.4795973174872675,
            0.5020425660269601
          ],
          [
            0.4968248227877276,
            0.5117022309984479
          ],
          [
            0.5153129109697017,
            0.5008115087236676
          ],
          [
            0.5313535460154526,
            0.4877031190054758
          ],
          [
            0.362284363047885,
            0.2751926694597517
          ],
          [
            0.38306171001334277,
            0.2425239086151123
          ],
          [
            0.41293131247428916,
            0.24153910364423475
          ],
          [
            0.4421921720079679,
            0.27431895051683697
          ],
          [
            0.4131029578857124,
            0.28429222106933594
          ],
          [
            0.3847044102398546,
            0.2866687093462263
          ],
          [
            0.5425891823251732,
            0.25379858698163715
          ],
          [
            0.5689518338435195,
            0.21350407600402832
          ],
          [
            0.5958377356707518,
            0.20508490289960588
          ],
          [
            0.6216210220341705,
            0.2307940891810826
          ],
          [
            0.6010425939457491,
            0.2534211703709194
          ],
          [
            0.5738567252576883,
            0.25484515939440044
          ],
          [
            0.41588089033029974,
            0.6102579661778041
          ],
          [
            0.44397361206522745,
            0.5953183855329242
          ],
          [
            0.47295775526436046,
            0.5807595252990723
          ],
          [
            0.49343717778434176,
            0.5903940882001605
          ],
          [
            0.5157115326811825,
            0.5764944893973214
          ],
          [
            0.5462417017801531,
            0.5871483939034599
          ],
          [
            0.5796251251262479,
            0.6026762553623745
          ],
          [
            0.5493822351563722,
            0.6563184601919991
          ],
          [
            0.5174833383145077,
            0.6827900069100517
          ],
          [
            0.4958873954019509,
            0.6908200127737862
          ],
          [
            0.47301333371849197,
            0.6858761651175362
          ],
          [
            0.44286814959819565,
            0.6622002465384347
          ],
          [
            0.43097772317871985,
            0.6121365683419364
          ],
          [
            0.4752014413658929,
            0.6178915841238839
          ],
          [
            0.49544846177533536,
            0.6259105546133858
          ],
          [
            0.5118878216848575,
            0.6196119444710868
          ],
          [
            0.5662230431501354,
            0.6066901343209403
          ],
          [
            0.5129799981368706,
            0.6338857923235212
          ],
          [
            0.4941381388593332,
            0.6399046352931431
          ],
          [
            0.473403435050776,
            0.6312851224626813
          ]
        ],
        "visibility": [
          7.338553018598759e-07,
          5.5760843838614186e-15,
          2.7630458684924086e-13,
          3.269180569954116e-16,
          0.007837850600481033,
          0.0011885336134582758,
          4.753528300149856e-12,
          5.402523838958105e-16,
          1.0820414786394394e-08,
          4.221341514259975e-19,
          2.2692857042912e-16,
          2.423021652754312e-19,
          1.414615369288441e-10,
          4.693267042360505e-12,
          1.318591763554977e-10,
          4.644672555500487e-15,
          6.999938823026852e-12,
          4.3577481575497734e-13,
          1.7881982404235683e-20,
          3.341701568237987e-11,
          8.153041187541138e-18,
          2.6019845047256323e-18,
          1.8878231458074879e-06,
          2.244559489071867e-16,
          3.7744163350339477e-10,
          1.6959387902340983e-15,
          2.071565100990498e-14,
          3.5396493136725937e-13,
          4.1335799366715165e-11
        ],
        "headpose": {
          "pitch": -1.1198396099446208,
          "yaw": 3.6187725336034484,
          "roll": -3.010905547709589
        },
        "attributes": {
          "5 oClock Shadow": 0.03704693913459778,
          "Arched Eyebrows": 0.0015744217671453953,
          "Attractive": 0.042145390063524246,
          "Bags Under Eyes": 0.3221859633922577,
          "Bald": 3.539312456268817e-05,
          "Bangs": 0.0005073120119050145,
          "Big Lips": 0.1475294679403305,
          "Big Nose": 0.337693989276886,
          "Black Hair": 0.00042709975969046354,
          "Blond Hair": 0.41754278540611267,
          "Blurry": 2.4341896278201602e-05,
          "Brown Hair": 0.12378277629613876,
          "Bushy Eyebrows": 0.004384723491966724,
          "Chubby": 0.21323832869529724,
          "Double Chin": 0.04462480917572975,
          "Eyeglasses": 0.007111215963959694,
          "Goatee": 0.00214600027538836,
          "Gray Hair": 0.028456004336476326,
          "Heavy Makeup": 0.0021238988265395164,
          "High Cheekbones": 0.11214516311883926,
          "Male": 0.9053269028663635,
          "Mouth Slightly Open": 0.9914819002151489,
          "Mustache": 4.0233418985735625e-05,
          "Narrow Eyes": 0.037275005131959915,
          "No Beard": 0.9800961017608643,
          "Oval Face": 0.6070241928100586,
          "Pale Skin": 0.030427156016230583,
          "Pointy Nose": 0.006825719494372606,
          "Receding Hairline": 0.07510998845100403,
          "Rosy Cheeks": 0.0031926636584103107,
          "Sideburns": 0.0005426520947366953,
          "Smiling": 0.04883749410510063,
          "Straight Hair": 0.05513942241668701,
          "Wavy Hair": 0.3393101692199707,
          "Wearing Earrings": 0.009760684333741665,
          "Wearing Hat": 0.0005060618277639151,
          "Wearing Lipstick": 0.009294153191149235,
          "Wearing Necklace": 0.005756658967584372,
          "Wearing Necktie": 0.001184366294182837,
          "Young": 0.9580647349357605
        },
        "age": [
          0.6873158812522888,
          0.9950592517852783,
          0.5213548541069031,
          0.07668201625347137,
          0.013767754659056664,
          0.0016698500839993358,
          0.0001929282007040456,
          1.3215424587542657e-05
        ],
        "race": [
          0.996009349822998,
          0.004416096955537796,
          0.6941040754318237,
          0.023541973903775215,
          0.17005465924739838
        ],
        "gender": [
          0.03478100895881653,
          0.9667885899543762
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 0.005644865814247169,
          "disgust": 3.455342262315142e-09,
          "fear": 1.7208447679877281,
          "happy": 0.0686297775246203,
          "sad": 0.18564212368801236,
          "surprise": 5.36823533475399,
          "neutral": 92.65100359916687
        },
        "dominant_emotion": "neutral",
        "region": {
          "x": 0,
          "y": 0,
          "w": 2480,
          "h": 2159,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 34,
        "gender": {
          "Woman": 18.017898499965668,
          "Man": 81.98210597038269
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 38.69663178920746,
          "indian": 0.21261237561702728,
          "black": 0.09403115836903453,
          "white": 52.42012143135071,
          "middle eastern": 1.8672989681363106,
          "latino hispanic": 6.709306687116623
        },
        "dominant_race": "white"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.21980896592140198,
        0.0023840952198952436,
        0.7739591598510742,
        0.9853015542030334
      ]
    ],
    "face_boxes": [
      [
        0.304132342338562,
        0.008628219366073608,
        0.7079691886901855,
        0.9295174479484558
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.49916365051269523,
            1.0024642240465782
          ],
          [
            0.2643180362780889,
            1.003630787793931
          ],
          [
            0.1450508918762207,
            0.9779663853521666
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.7340092647473015,
            1.0012976602992252
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.3995694371461868,
            0.2663624994668834
          ],
          [
            0.588921398361524,
            0.2360318420357075
          ],
          [
            0.3048934565385183,
            0.41568265912805746
          ],
          [
            0.716795450091362,
            0.3713532367286465
          ]
        ],
        "dw_hand_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_hand_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_face": [
          [
            0.3061230147282282,
            0.287360646919236
          ],
          [
            0.3110412474870682,
            0.38535200169688155
          ],
          [
            0.32210727119445803,
            0.48567648396923285
          ],
          [
            0.33563241128126775,
            0.5860009662415844
          ],
          [
            0.3565349005063375,
            0.6793260660298183
          ],
          [
            0.3860442970593771,
            0.7633186558392288
          ],
          [
            0.4217014845609665,
            0.8356456081751101
          ],
          [
            0.4647360212008159,
            0.9033063055215795
          ],
          [
            0.5163774651686351,
            0.9219713254792263
          ],
          [
            0.5692484673261643,
            0.8846412855639328
          ],
          [
            0.6110534457763036,
            0.8146474607227575
          ],
          [
            0.6454810750881832,
            0.7399873808921702
          ],
          [
            0.6725313552618026,
            0.6489954085986422
          ],
          [
            0.6897451699177423,
            0.5440046713368791
          ],
          [
            0.7008111936251321,
            0.4413470615698219
          ],
          [
            0.7069589845736823,
            0.3363563243080588
          ],
          [
            0.7081885427633919,
            0.2313655870462957
          ],
          [
            0.32210727119445803,
            0.19636867462570798
          ],
          [
            0.3466984349886576,
            0.16137176220512028
          ],
          [
            0.3762078315416971,
            0.1450398697421795
          ],
          [
            0.4081763444741566,
            0.14270674224747337
          ],
          [
            0.4401448574066162,
            0.1497061247315909
          ],
          [
            0.5323617216348648,
            0.13104110477394443
          ],
          [
            0.5655597927570343,
            0.11004295732159179
          ],
          [
            0.5987578638792038,
            0.09604419235335672
          ],
          [
            0.6319559350013733,
            0.09837731984806242
          ],
          [
            0.6626948897441228,
            0.1263748497845326
          ],
          [
            0.49055674318472553,
            0.2523637344986483
          ],
          [
            0.49424541775385544,
            0.31302504936100045
          ],
          [
            0.4979340923229854,
            0.3736863642233522
          ],
          [
            0.4991636505126953,
            0.4366808065804101
          ],
          [
            0.45981778844197585,
            0.49500899394805653
          ],
          [
            0.4807202776670456,
            0.5043415039268798
          ],
          [
            0.5016227668921154,
            0.5090077589162914
          ],
          [
            0.5249843724966049,
            0.5020083764321739
          ],
          [
            0.5483459781010945,
            0.49500899394805653
          ],
          [
            0.3614531332651775,
            0.28269439192982415
          ],
          [
            0.3860442970593771,
            0.24769747950923648
          ],
          [
            0.41678325180212666,
            0.24536435201453077
          ],
          [
            0.4426039737860363,
            0.2780281369404128
          ],
          [
            0.4155536936124165,
            0.29669315689805925
          ],
          [
            0.387273855249087,
            0.3013594118874711
          ],
          [
            0.5458868617216747,
            0.2593631169827659
          ],
          [
            0.5692484673261643,
            0.2150336945833549
          ],
          [
            0.5999874220689139,
            0.20570118460453124
          ],
          [
            0.6294968186219533,
            0.2313655870462957
          ],
          [
            0.6036760966380437,
            0.2640293719721777
          ],
          [
            0.5753962582747141,
            0.2710287544562952
          ],
          [
            0.4192423681815465,
            0.620997878662172
          ],
          [
            0.45121088111400603,
            0.6046659861992313
          ],
          [
            0.48317939404646565,
            0.5999997312098194
          ],
          [
            0.5003932087024053,
            0.6023328587045254
          ],
          [
            0.5176070233583451,
            0.5976666037151137
          ],
          [
            0.5495755362908046,
            0.6023328587045254
          ],
          [
            0.581544049223264,
            0.620997878662172
          ],
          [
            0.5594120018084843,
            0.6629941735668773
          ],
          [
            0.5335912798245748,
            0.697991085987465
          ],
          [
            0.4991636505126953,
            0.7166561059451119
          ],
          [
            0.4647360212008159,
            0.7073235959662885
          ],
          [
            0.4389152992169063,
            0.6746598110404066
          ],
          [
            0.4290788336992264,
            0.6256641336515839
          ],
          [
            0.4659655793905258,
            0.6256641336515839
          ],
          [
            0.5003932087024053,
            0.6303303886409954
          ],
          [
            0.5360503962039948,
            0.623331006156878
          ],
          [
            0.5729371418952942,
            0.6256641336515839
          ],
          [
            0.5385095125834148,
            0.6489954085986422
          ],
          [
            0.4991636505126953,
            0.6653273010615832
          ],
          [
            0.4622769048213959,
            0.6559947910827597
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "001315",
  "objects": [],
  "mask_file": "./person_labeling/./001315.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A close-up shot features braided hair against a solid light blue background with no additional objects or cultural elements present",
  "overall_past": "Before the current scene, the individual likely engaged in a lighthearted interaction—perhaps a playful challenge or joke with someone nearby—prompting them to strike the exaggerated, tongue-out expression for comedic effect. The deliberate braiding of their hair suggests preparation or a deliberate choice to present a specific, cheerful image, indicating they may have been getting ready for a photo or video moment, possibly to share online or with friends. The simple, uncluttered background further supports the idea that this was a planned, intentional act focused solely on capturing a joyful, carefree expression.",
  "overall_past_clean": "A playful exchange erupted in a burst of laughter and teasing, sparking a spontaneous challenge that led to an immediate, exaggerated reaction as the individual leaned into the moment with deliberate flair.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to laugh or react to their own playful expression, possibly breaking into giggles or turning away briefly to compose themselves, as the exaggerated face and tongue-sticking-out gesture suggest a moment of spontaneous humor that could naturally lead to a burst of laughter or a shared joke with someone nearby.",
  "overall_future_clean": "A sudden, unrestrained burst of laughter erupts, followed by a quick, self-conscious turn away, hands rising briefly to the face before dropping as the moment settles into a shared, knowing smile.",
  "future_scene_ok": true
}