{
  "video_path": "./ref_datasets/part1/videvo__6009560_man_people_smartphone_h47ae58b0TolikV101071080p12000br001.mp4",
  "start_time": 0.0,
  "end_time": 3.92,
  "image_path": "./000112.jpg",
  "represents_multiple_types": true,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part1/videvo__6009560_man_people_smartphone_h47ae58b0TolikV101071080p12000br001.mp4",
      "start_time": 0.0,
      "end_time": 3.92,
      "image_path": "./ref_datasets/extracted_frames/person_-896353352527313715_1_videvo__6009560_man_people_smartphone_h47ae58b0TolikV101071080p12000br001.mp4_0.00_3.92.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part1/videvo__6009560_man_people_smartphone_h47ae58b0TolikV101071080p12000br001.mp4",
      "start_time": 0.0,
      "end_time": 3.92,
      "image_path": "./ref_datasets/extracted_frames/face_-896353352527313715_1_videvo__6009560_man_people_smartphone_h47ae58b0TolikV101071080p12000br001.mp4_0.00_3.92.jpg",
      "type": "face"
    }
  ],
  "cross_video_duplicate": false,
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "male",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a denim jacket over a white t-shirt. The denim jacket is blue with visible stitching and buttons. The person also has tattoos on their left arm and hand, and they are wearing rings on their fingers.",
        "clothing": [
          {
            "possible_names": [
              "denim jacket",
              "jean jacket"
            ],
            "name": "jacket",
            "type": "top",
            "color": [
              "blue"
            ]
          },
          {
            "possible_names": [
              "t-shirt",
              "tee"
            ],
            "name": "t shirt",
            "type": "top",
            "color": [
              "white"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "smartphone",
              "mobile phone"
            ],
            "name": "smartphone",
            "position": "hand"
          }
        ],
        "description": "The person is an adult male with a neutral expression, wearing a blue denim jacket over a white t-shirt. He has tattoos on his left arm and hand and is wearing rings on his fingers. He is holding a smartphone in his hand. The background is plain and light-colored.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to be focused on their phone, showing a neutral expression without any strong emotions.",
        "meaningful": true,
        "story": "The person seems to be engaged in an activity on their smartphone, possibly texting or browsing. The tattoos and rings suggest a personal style that embraces individuality.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is focused on their smartphone, holding it with both hands as they appear to be reading or interacting with something on the screen. Their gaze is directed downwards towards the device, suggesting concentration or interest in the content they are viewing. The individual's facial expression is neutral, possibly indicating engagement or curiosity. They have tattoos visible on their hand and arm, which may reflect personal style or artistic expression. The casual attire, consisting of a denim shirt over a white t-shirt, along with their hairstyle and glasses, contributes to an overall relaxed yet stylish appearance. The presence of rings on their fingers could imply a sense of personal identity or relationship status.",
        "intention": "The individual is deeply engaged in digital content seeking information connection or entertainment through focused interaction with their smartphone",
        "intention_ok": true
      },
      "hoi": [
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "right hand",
            "action": [
              [
                "right hand",
                "holding"
              ]
            ]
          },
          "object": 0
        }
      ],
      "facex_detailing": {
        "landmarks": [
          [
            0.3275759637444502,
            0.21507424778408474
          ],
          [
            0.33487949750962714,
            0.27935694512866793
          ],
          [
            0.34207179007076083,
            0.34308770913926384
          ],
          [
            0.3530669913050674,
            0.4027184683179098
          ],
          [
            0.37237196007654777,
            0.44369553762768943
          ],
          [
            0.3991789113552798,
            0.4751633348919096
          ],
          [
            0.42912079287426813,
            0.49291715924701995
          ],
          [
            0.45666043602284934,
            0.5009491140880282
          ],
          [
            0.4794388324731872,
            0.5022947599017431
          ],
          [
            0.4964037942034858,
            0.48418759164356057
          ],
          [
            0.5062552420865922,
            0.44588428830343574
          ],
          [
            0.5129547704543387,
            0.40541279883611775
          ],
          [
            0.5180886153663908,
            0.3650502931504022
          ],
          [
            0.5185960935694831,
            0.3197716323156205
          ],
          [
            0.5196617075375148,
            0.28012536820911227
          ],
          [
            0.5185926336617697,
            0.23939234680599636
          ],
          [
            0.5174943386089235,
            0.19956637185717388
          ],
          [
            0.38374915204587434,
            0.21066658648233566
          ],
          [
            0.4015639630101976,
            0.1786489373161679
          ],
          [
            0.420890020295268,
            0.1677773888148959
          ],
          [
            0.44229965656995773,
            0.16439909972841776
          ],
          [
            0.46310571758520036,
            0.17344500337328228
          ],
          [
            0.4846364224240894,
            0.17081187736420403
          ],
          [
            0.4953794170703207,
            0.16061298525522627
          ],
          [
            0.5072434406195367,
            0.1533784582501366
          ],
          [
            0.515911976141589,
            0.1504464386001466
          ],
          [
            0.521403564228898,
            0.16954845852322048
          ],
          [
            0.4766984163295655,
            0.21057437904297358
          ],
          [
            0.48042003597532,
            0.24028503137921528
          ],
          [
            0.4867929039256913,
            0.26694440841674805
          ],
          [
            0.4920143559575081,
            0.29367555323101224
          ],
          [
            0.4638783300206775,
            0.3287730973864359
          ],
          [
            0.4741097096176375,
            0.32975905092935714
          ],
          [
            0.48482062490213484,
            0.3342179154592847
          ],
          [
            0.4931098116295678,
            0.3267977351234072
          ],
          [
            0.4989869161730721,
            0.31598948297046486
          ],
          [
            0.4118300545073691,
            0.22639821635352242
          ],
          [
            0.42171832032146905,
            0.21976371416969906
          ],
          [
            0.4345306594456945,
            0.21346396870083278
          ],
          [
            0.442983176381815,
            0.22096682351733013
          ],
          [
            0.43374715958322796,
            0.22728009829445492
          ],
          [
            0.4233985003970918,
            0.2300128312337966
          ],
          [
            0.4841650099981399,
            0.21405245198143852
          ],
          [
            0.49240570160604663,
            0.20277244325668092
          ],
          [
            0.5033953839114734,
            0.20099381795005192
          ],
          [
            0.5090339052535239,
            0.2088617975749667
          ],
          [
            0.5045864759456544,
            0.21671443704574828
          ],
          [
            0.49493389754068284,
            0.21553940621633377
          ],
          [
            0.43406760532941135,
            0.3810158759828598
          ],
          [
            0.455913942129839,
            0.3808006975385878
          ],
          [
            0.47273945453621097,
            0.37353366897219703
          ],
          [
            0.4820558953852881,
            0.37411946720547146
          ],
          [
            0.4882635903500375,
            0.3683457828703381
          ],
          [
            0.49616682813281104,
            0.3670178708576021
          ],
          [
            0.5019063637370155,
            0.36584215315561447
          ],
          [
            0.49754759456430164,
            0.3848438376472109
          ],
          [
            0.4897250064781734,
            0.39589753226628377
          ],
          [
            0.48056192979926154,
            0.40094417238992364
          ],
          [
            0.4714308196590061,
            0.40101044518607
          ],
          [
            0.45437106773966834,
            0.39611970432220944
          ],
          [
            0.4386231191456318,
            0.38247716616070465
          ],
          [
            0.4715463504904792,
            0.3779808566683815
          ],
          [
            0.48109543252558934,
            0.3824921108427502
          ],
          [
            0.49164561253218425,
            0.37603259465051075
          ],
          [
            0.49922600707837517,
            0.36603231278676834
          ],
          [
            0.4908970126083919,
            0.3768403151678661
          ],
          [
            0.4809364272015435,
            0.3825058482942127
          ],
          [
            0.47114812263420647,
            0.37942108275398373
          ]
        ],
        "visibility": [
          4.70146277464778e-09,
          1.5005045497673564e-05,
          0.4519627094268799,
          1.990946643659619e-11,
          3.4267895188122566e-09,
          5.907725608267356e-06,
          2.478903338300192e-18,
          2.4540152895879963e-12,
          0.9852725863456726,
          2.2606849725548273e-08,
          0.32371237874031067,
          0.4947616755962372,
          0.997138500213623,
          0.19894957542419434,
          6.038624633220024e-06,
          1.3411753485570443e-08,
          0.011824597604572773,
          3.9781202332278554e-08,
          0.47066327929496765,
          0.9993730187416077,
          2.7491046239447314e-06,
          5.0694244357885054e-09,
          4.615766329152393e-07,
          1.8222831230096936e-11,
          1.3548394350859638e-10,
          4.926573815566826e-09,
          4.975366785231472e-09,
          3.4007850757689084e-08,
          3.106444182776613e-06
        ],
        "headpose": {
          "pitch": -7.666468140479004,
          "yaw": -28.273861767402092,
          "roll": -2.6553762721638536
        },
        "attributes": {
          "5 oClock Shadow": 0.6010434627532959,
          "Arched Eyebrows": 0.002556353574618697,
          "Attractive": 0.266217976808548,
          "Bags Under Eyes": 0.1119517982006073,
          "Bald": 0.026187969371676445,
          "Bangs": 5.1701488700928167e-05,
          "Big Lips": 0.2202952802181244,
          "Big Nose": 0.1965441107749939,
          "Black Hair": 0.05132868140935898,
          "Blond Hair": 0.013181809335947037,
          "Blurry": 0.001037230365909636,
          "Brown Hair": 0.0690787136554718,
          "Bushy Eyebrows": 0.05255260691046715,
          "Chubby": 0.12261700630187988,
          "Double Chin": 0.03253978118300438,
          "Eyeglasses": 0.12350877374410629,
          "Goatee": 0.5961222648620605,
          "Gray Hair": 0.023847363889217377,
          "Heavy Makeup": 0.00023778397007845342,
          "High Cheekbones": 0.029655708000063896,
          "Male": 0.9999408721923828,
          "Mouth Slightly Open": 0.059064529836177826,
          "Mustache": 0.09498360008001328,
          "Narrow Eyes": 0.20101872086524963,
          "No Beard": 0.018826713785529137,
          "Oval Face": 0.1080971285700798,
          "Pale Skin": 0.03789601847529411,
          "Pointy Nose": 0.2807547152042389,
          "Receding Hairline": 0.10794995725154877,
          "Rosy Cheeks": 0.0032346518710255623,
          "Sideburns": 0.8848487138748169,
          "Smiling": 0.044121671468019485,
          "Straight Hair": 0.1333332359790802,
          "Wavy Hair": 0.027234870940446854,
          "Wearing Earrings": 0.0026454320177435875,
          "Wearing Hat": 0.0013672580244019628,
          "Wearing Lipstick": 0.0002473033673595637,
          "Wearing Necklace": 0.0020405049435794353,
          "Wearing Necktie": 0.12712064385414124,
          "Young": 0.8522535562515259
        },
        "age": [
          0.0005808369605802,
          0.026808826252818108,
          0.9762333035469055,
          0.9730697870254517,
          0.650882363319397,
          0.029358357191085815,
          0.0003507858782541007,
          1.1914393326151185e-05
        ],
        "race": [
          0.9981300234794617,
          0.0014815269969403744,
          0.3490358591079712,
          0.0434318371117115,
          0.2663781940937042
        ],
        "gender": [
          0.9991517066955566,
          0.0023123358841985464
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 99.20493359595142,
          "disgust": 1.8908813776040934e-05,
          "fear": 0.01240171624227412,
          "happy": 7.664587430832764e-05,
          "sad": 0.12119052257034317,
          "surprise": 3.6700675798809235e-07,
          "neutral": 0.6613774619327463
        },
        "dominant_emotion": "angry",
        "region": {
          "x": 0,
          "y": 0,
          "w": 529,
          "h": 659,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 39,
        "gender": {
          "Woman": 0.14699033927172422,
          "Man": 99.85300302505493
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 6.4452457260166796e-09,
          "indian": 3.639630263840843e-09,
          "black": 4.27812624735624e-12,
          "white": 99.99908208847046,
          "middle eastern": 0.0007873348295106553,
          "latino hispanic": 0.00013027955674260738
        },
        "dominant_race": "white"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.15802495181560516,
        0.0011313428403809667,
        0.7456491589546204,
        0.9884973764419556
      ]
    ],
    "face_boxes": [
      [
        0.34059497714042664,
        0.01692606508731842,
        0.5246256589889526,
        0.4924134910106659
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.41749942170249094,
            0.705996103617173
          ],
          [
            0.22799629741244848,
            0.7390320190519813
          ],
          [
            0.3470759633514616,
            1.012432698512464
          ],
          [
            0.5775527361366484,
            0.8894023927552467
          ],
          [
            0.6070025459925334,
            0.6729601881823647
          ],
          [
            0.6915106960137685,
            1.0033193425304479
          ],
          [
            0.6530979005495708,
            0.9099074437147828
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.427742833826277,
            0.22868408405908053
          ],
          [
            0.5032879982391993,
            0.2127357110905526
          ],
          [
            0.3227478595574697,
            0.2696941859781529
          ],
          [
            0.5250552490022448,
            0.2195707280770646
          ]
        ],
        "dw_hand_1": [
          [
            0.6146851050853729,
            0.8643406638047024
          ],
          [
            0.6236480906936858,
            0.791433815948574
          ],
          [
            0.6262089437246323,
            0.7390320190519813
          ],
          [
            0.6415740619103114,
            0.704856934119421
          ],
          [
            0.6761455778280895,
            0.6752385271778688
          ],
          [
            0.6518174740340975,
            0.7321970020654691
          ],
          [
            0.6787064308590359,
            0.6957435781374051
          ],
          [
            0.6966324020756615,
            0.6729601881823647
          ],
          [
            0.7132779467768139,
            0.6478984592318207
          ],
          [
            0.6569391800959904,
            0.7504237140295016
          ],
          [
            0.6851085634364021,
            0.704856934119421
          ],
          [
            0.7017541081375546,
            0.6820735441643808
          ],
          [
            0.7171192263232338,
            0.6501767982273243
          ],
          [
            0.6633413126733567,
            0.7732071039845415
          ],
          [
            0.6863889899518754,
            0.7413103580474852
          ],
          [
            0.6979128285911347,
            0.7162486290969412
          ],
          [
            0.7132779467768139,
            0.6866302221553888
          ],
          [
            0.674865151312616,
            0.8073821889171019
          ],
          [
            0.6863889899518754,
            0.7823204599665576
          ],
          [
            0.6940715490447151,
            0.7640937480025256
          ],
          [
            0.6991932551066081,
            0.7413103580474852
          ]
        ],
        "dw_hand_2": [
          [
            0.5801135891675949,
            0.8780106977777266
          ],
          [
            0.5903570012913809,
            0.8028255109260938
          ],
          [
            0.600600413415167,
            0.7299186630699654
          ],
          [
            0.6287697967555788,
            0.6957435781374051
          ],
          [
            0.6569391800959904,
            0.6706818491868606
          ],
          [
            0.624928517209159,
            0.7094136121104292
          ],
          [
            0.6595000331269371,
            0.6638468322003486
          ],
          [
            0.6863889899518754,
            0.6342284252587964
          ],
          [
            0.7132779467768139,
            0.6160017132947642
          ],
          [
            0.6466957679722044,
            0.7527020530250053
          ],
          [
            0.6799868573745091,
            0.702578595123917
          ],
          [
            0.7081562407149209,
            0.6661251711958527
          ],
          [
            0.7337647710243862,
            0.6410634422453084
          ],
          [
            0.6620608861578835,
            0.805103849921598
          ],
          [
            0.6902302694982952,
            0.7549803920205095
          ],
          [
            0.7119975202613407,
            0.7162486290969412
          ],
          [
            0.7350451975398594,
            0.6797952051688767
          ],
          [
            0.6710238717661964,
            0.8529489688271825
          ],
          [
            0.6902302694982952,
            0.816495544899118
          ],
          [
            0.7017541081375546,
            0.7845987989620617
          ],
          [
            0.7158387998077606,
            0.7413103580474852
          ]
        ],
        "dw_face": [
          [
            0.33171084516578253,
            0.23096242305458464
          ],
          [
            0.3368325512276756,
            0.27425086396916115
          ],
          [
            0.3419542572895685,
            0.3175393048837375
          ],
          [
            0.35091724289788134,
            0.3608277457983138
          ],
          [
            0.36244108153714066,
            0.39955950872188223
          ],
          [
            0.3803670527537664,
            0.4314562546589385
          ],
          [
            0.4021343035168118,
            0.45651798360948276
          ],
          [
            0.4251819807953304,
            0.4747446955735148
          ],
          [
            0.4507905111047957,
            0.4838580515555309
          ],
          [
            0.47639904141426087,
            0.4838580515555309
          ],
          [
            0.49816629217730624,
            0.4610746616004908
          ],
          [
            0.5084097043010923,
            0.4223428986769224
          ],
          [
            0.516092263393932,
            0.3767761187668421
          ],
          [
            0.5224943959712982,
            0.3334876778522656
          ],
          [
            0.5263356755177181,
            0.29019923693768906
          ],
          [
            0.5250552490022448,
            0.24463245702760886
          ],
          [
            0.5212139694558249,
            0.20134401611303232
          ],
          [
            0.3906104648775524,
            0.2127357110905526
          ],
          [
            0.40725600957870484,
            0.1990656771175284
          ],
          [
            0.4251819807953304,
            0.19223066013101642
          ],
          [
            0.44182752549648285,
            0.19223066013101642
          ],
          [
            0.4584730701976353,
            0.19450899912652034
          ],
          [
            0.4892033065689935,
            0.18995232113551228
          ],
          [
            0.49816629217730624,
            0.18311730414900027
          ],
          [
            0.507129277785619,
            0.1785606261579922
          ],
          [
            0.5148118368784588,
            0.17400394816698414
          ],
          [
            0.5224943959712982,
            0.1785606261579922
          ],
          [
            0.47639904141426087,
            0.22412740606807266
          ],
          [
            0.48280117399162714,
            0.25146747401412084
          ],
          [
            0.48664245353804686,
            0.27880754196016905
          ],
          [
            0.4917641595999401,
            0.3061476099062174
          ],
          [
            0.46103392322858167,
            0.33120933885676146
          ],
          [
            0.472557761867841,
            0.33120933885676146
          ],
          [
            0.48408160050710036,
            0.3334876778522656
          ],
          [
            0.49304458611541324,
            0.33120933885676146
          ],
          [
            0.49944671869277957,
            0.32209598287474556
          ],
          [
            0.4098168626096514,
            0.23779744004109665
          ],
          [
            0.42262112776438393,
            0.23096242305458464
          ],
          [
            0.43414496640364325,
            0.22640574506357658
          ],
          [
            0.44566880504290257,
            0.23096242305458464
          ],
          [
            0.43414496640364325,
            0.2355191010455927
          ],
          [
            0.42262112776438393,
            0.23779744004109665
          ],
          [
            0.4892033065689935,
            0.22184906707256852
          ],
          [
            0.49816629217730624,
            0.21501405008605654
          ],
          [
            0.507129277785619,
            0.21501405008605654
          ],
          [
            0.5148118368784588,
            0.21501405008605654
          ],
          [
            0.507129277785619,
            0.22184906707256852
          ],
          [
            0.49816629217730624,
            0.22184906707256852
          ],
          [
            0.4392666724655363,
            0.38133279675785
          ],
          [
            0.4584730701976353,
            0.37449777977133797
          ],
          [
            0.4776794679297342,
            0.36766276278482596
          ],
          [
            0.48408160050710036,
            0.36766276278482596
          ],
          [
            0.49048373308446674,
            0.36766276278482596
          ],
          [
            0.496885865661833,
            0.36538442378932184
          ],
          [
            0.5032879982391993,
            0.36766276278482596
          ],
          [
            0.49816629217730624,
            0.37905445776234603
          ],
          [
            0.49304458611541324,
            0.3904461527398661
          ],
          [
            0.48408160050710036,
            0.3972811697263783
          ],
          [
            0.4687164823214214,
            0.3972811697263783
          ],
          [
            0.4533513641357422,
            0.3904461527398661
          ],
          [
            0.44182752549648285,
            0.38133279675785
          ],
          [
            0.4635947762595282,
            0.38133279675785
          ],
          [
            0.48408160050710036,
            0.37905445776234603
          ],
          [
            0.4917641595999401,
            0.37449777977133797
          ],
          [
            0.5007271452082529,
            0.3699411017803299
          ],
          [
            0.4917641595999401,
            0.37449777977133797
          ],
          [
            0.48408160050710036,
            0.37905445776234603
          ],
          [
            0.462314349744055,
            0.38133279675785
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "000112",
  "objects": [
    {
      "box": [
        0.649828314781189,
        0.45533278584480286,
        0.7613413333892822,
        0.7733156681060791
      ],
      "name": "smartphone",
      "possible_names": [
        "smartphone"
      ]
    }
  ],
  "mask_file": "./person_labeling/./000112.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A person is holding a smartphone with tattoos visible on their hand and arm against a plain light background wearing a denim shirt over a white t-shirt and rings on their fingers",
  "overall_past": "Before this scene, the individual likely received a notification on their smartphone—perhaps a message, social media update, or email—that immediately captured their attention, prompting them to pause and focus intently on the screen. The neutral yet engaged expression and the two-handed grip suggest a moment of reaction or decision-making, possibly in response to something meaningful or unexpected. The tattoos, rings, and casual yet put-together outfit indicate a person who values personal style and self-expression, so the content on the screen may have been related to a personal connection, creative project, or a significant update in their life—something that warranted their full attention in that quiet, reflective moment.",
  "overall_past_clean": "A sudden digital alert pierced the silence, triggering an immediate shift in focus as the mind registered the incoming signal, prompting a swift, instinctive response to engage with the source of the notification.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to lower the smartphone, take a moment to process what they’ve read or seen, and then either respond to a message, save the information, or continue browsing—perhaps with a subtle shift in expression, such as a thoughtful frown or a small smile, indicating a reaction to the content. The rings on their fingers might catch the light as they move their hand, and the casual yet intentional posture suggests they are fully immersed in the digital moment, possibly preparing to act on what they’ve just encountered.",
  "overall_future_clean": "The individual swiftly taps the screen, their fingers moving with purpose as they send a reply, then pauses briefly to review the message before arching a brow in quiet satisfaction, fingers lingering just a moment longer before swiping to the next task with focused intent.",
  "future_scene_ok": true
}