{
  "video_path": "./ref_datasets/part2/5124613002.mp4",
  "start_time": 0.0,
  "end_time": 3.04,
  "image_path": "./016018.jpg",
  "represents_multiple_types": false,
  "cross_video_duplicate": false,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/5124613002.mp4",
      "start_time": 0.0,
      "end_time": 3.04,
      "image_path": "./ref_datasets/extracted_frames/face_4825617632652275305_1_5124613002.mp4_0.00_3.04.jpg",
      "type": "face"
    }
  ],
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a black leather jacket with visible stitching along the edges. The jacket appears to have a zipper closure and possibly some buttons on the sleeves.",
        "clothing": [
          {
            "possible_names": [
              "black leather jacket",
              "jacket",
              "leather jacket"
            ],
            "name": "jacket",
            "type": "top",
            "color": [
              "black"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "vape pen",
              "e-cigarette",
              "vaping device"
            ],
            "name": "vape pen",
            "position": "hand"
          },
          {
            "standalone": false,
            "possible_names": [
              "smartphone",
              "mobile phone",
              "cell phone"
            ],
            "name": "smartphone",
            "position": "hand"
          }
        ],
        "description": "The person is an adult female who appears to be in the foreground of the image. She is wearing a black leather jacket and is holding a vape pen in one hand and a smartphone in the other. The lighting is red, casting a warm glow over her face and hair. Her expression is neutral, and she seems to be focused on the smartphone. The background is blurred with bokeh lights, suggesting an outdoor setting at night.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to be focused on an activity, possibly applying makeup, which suggests a neutral emotional state as they concentrate on the task at hand.",
        "meaningful": true,
        "story": "A young adult woman is seen outdoors during the evening, illuminated by red lighting, possibly from a nearby event or street light. She is holding a phone in one hand and appears to be applying makeup with the other, suggesting she might be preparing for an outing or simply maintaining her appearance while out.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is holding a smartphone in one hand while using an electronic vaping device with the other, exhaling vapor into the air. The red lighting casts a dramatic glow on their face, suggesting they might be at a social event or gathering during the evening. Their focused gaze towards the phone indicates they could be engaged in communication or entertainment, possibly seeking distraction or connection with others through digital means. The combination of vaping and phone use suggests a moment of leisure or relaxation, where the individual is enjoying personal time amidst a vibrant atmosphere.",
        "intention": "The individual is seeking personal enjoyment and digital connection in a vibrant social setting through simultaneous use of a smartphone and vaping device",
        "intention_ok": true
      },
      "hoi": [
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "left hand",
            "action": [
              [
                "left hand",
                "holding"
              ]
            ]
          },
          "object": 0
        },
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "right hand",
            "action": [
              [
                "right hand",
                "holding"
              ],
              [
                "right hand",
                "inhaling"
              ]
            ]
          },
          "object": 1
        }
      ],
      "facex_detailing": {
        "landmarks": [
          [
            0.390990655682981,
            0.37793795469576724
          ],
          [
            0.398814037522035,
            0.4269918031162686
          ],
          [
            0.40127852650891455,
            0.48549317771164835
          ],
          [
            0.4010612119388367,
            0.5233351743410505
          ],
          [
            0.4035065907319742,
            0.5492931460577344
          ],
          [
            0.4123895924538374,
            0.5996662450215172
          ],
          [
            0.4188763783978564,
            0.6293475013561349
          ],
          [
            0.42553726245782203,
            0.662113467536906
          ],
          [
            0.4326830038002559,
            0.7043986913388368
          ],
          [
            0.4569005245875035,
            0.7037355877104259
          ],
          [
            0.4779878042372209,
            0.676391271813206
          ],
          [
            0.5073100823909045,
            0.6449362081194681
          ],
          [
            0.5335471317704236,
            0.5924961407348591
          ],
          [
            0.5570347969553301,
            0.5341239033552705
          ],
          [
            0.5628665727696249,
            0.4566564664008126
          ],
          [
            0.5631589429719107,
            0.3886702570334944
          ],
          [
            0.5686077315892493,
            0.32207384443787673
          ],
          [
            0.38568663358954447,
            0.32029411098944444
          ],
          [
            0.37973145110798734,
            0.29960533446735804
          ],
          [
            0.38215292424761826,
            0.3189377579739485
          ],
          [
            0.38517446511292036,
            0.30594707453061665
          ],
          [
            0.38756338262132234,
            0.3093634907846098
          ],
          [
            0.3971222719177604,
            0.29929880105629175
          ],
          [
            0.40664812794753485,
            0.28520091800462627
          ],
          [
            0.41716050175683844,
            0.30280436630602237
          ],
          [
            0.42913971309150967,
            0.30818525540134895
          ],
          [
            0.45146478497024095,
            0.3313654371670314
          ],
          [
            0.3947921178968889,
            0.36847069206691924
          ],
          [
            0.3895736594152238,
            0.41070819796708524
          ],
          [
            0.3794875943368035,
            0.4396950454623611
          ],
          [
            0.37385249924180763,
            0.4773265628587631
          ],
          [
            0.3967407558379429,
            0.5116101747467404
          ],
          [
            0.3962555976451508,
            0.5127861169910934
          ],
          [
            0.40095392069114105,
            0.5145181840689725
          ],
          [
            0.40564751992268216,
            0.5072701645906639
          ],
          [
            0.4102060677350632,
            0.4952634953947924
          ],
          [
            0.39540467578917743,
            0.3599156607080389
          ],
          [
            0.390191141728844,
            0.3629960934636455
          ],
          [
            0.3964295142596322,
            0.3656252416353377
          ],
          [
            0.39563936673636946,
            0.3654212295693695
          ],
          [
            0.3978748868485647,
            0.35862238189530754
          ],
          [
            0.397696437473808,
            0.3632492920709035
          ],
          [
            0.42148547151259014,
            0.38306286249841964
          ],
          [
            0.41893573892968045,
            0.37364218408468536
          ],
          [
            0.42636509064052786,
            0.3741342298568241
          ],
          [
            0.4370433758944273,
            0.3823117435609222
          ],
          [
            0.4290144675278238,
            0.3778540876491991
          ],
          [
            0.4202331878244877,
            0.37886636676611724
          ],
          [
            0.40395077735717805,
            0.5487731446034063
          ],
          [
            0.4032637465479118,
            0.5682626094767657
          ],
          [
            0.3980034710839391,
            0.5514999701863245
          ],
          [
            0.39790230312251623,
            0.5491780253314468
          ],
          [
            0.3979711447177189,
            0.5480540265481939
          ],
          [
            0.4121187062934041,
            0.5456621538394343
          ],
          [
            0.4230275652770485,
            0.5570844075667164
          ],
          [
            0.4127892156929842,
            0.5619598270093323
          ],
          [
            0.4075905695291502,
            0.5944841633398066
          ],
          [
            0.3977309179758387,
            0.5971818737882785
          ],
          [
            0.40283411347440307,
            0.586887122966625
          ],
          [
            0.4060484471065658,
            0.5609841350525144
          ],
          [
            0.4083722533525101,
            0.5557518619708914
          ],
          [
            0.4016676465448524,
            0.5668016996333208
          ],
          [
            0.4020010886181678,
            0.5721402816040807
          ],
          [
            0.40953271162829225,
            0.5476733654895156
          ],
          [
            0.42081936113536356,
            0.5495735273790107
          ],
          [
            0.40837153212300364,
            0.5598070591215104
          ],
          [
            0.4017593716537314,
            0.57473915518907
          ],
          [
            0.40099874677668723,
            0.5653730998594294
          ]
        ],
        "visibility": [
          0.8658865690231323,
          1.0,
          1.2412103345127434e-08,
          1.0493629076790967e-08,
          7.205937436083332e-06,
          2.0127021116422839e-07,
          0.002116295276209712,
          0.38522812724113464,
          0.005332078784704208,
          1.0,
          2.237689589179581e-09,
          1.113933421947877e-06,
          2.8301079257886386e-09,
          8.438326426496445e-11,
          0.9259443879127502,
          0.9963411688804626,
          7.787035447882895e-14,
          0.0007384183700196445,
          7.839634719175592e-08,
          0.033648598939180374,
          6.320839108586387e-17,
          4.738578418539419e-10,
          0.9742234945297241,
          0.9998304843902588,
          6.308940555754816e-06,
          0.9820833206176758,
          0.880968451499939,
          0.009862453676760197,
          0.021010298281908035
        ],
        "headpose": {
          "pitch": -27.587796586030993,
          "yaw": 67.17207595856985,
          "roll": -23.192650109850536
        },
        "attributes": {
          "5 oClock Shadow": 0.012268523685634136,
          "Arched Eyebrows": 0.006455612368881702,
          "Attractive": 0.05294576659798622,
          "Bags Under Eyes": 0.09016267210245132,
          "Bald": 5.003043042961508e-05,
          "Bangs": 0.0013196234358474612,
          "Big Lips": 0.05681736767292023,
          "Big Nose": 0.046004440635442734,
          "Black Hair": 0.11611869931221008,
          "Blond Hair": 0.0036219055764377117,
          "Blurry": 0.016103532165288925,
          "Brown Hair": 0.07771933078765869,
          "Bushy Eyebrows": 0.00834493525326252,
          "Chubby": 0.001272261026315391,
          "Double Chin": 0.0001462924265069887,
          "Eyeglasses": 0.002260334324091673,
          "Goatee": 0.0022796003613620996,
          "Gray Hair": 0.001268212217837572,
          "Heavy Makeup": 0.0022481007035821676,
          "High Cheekbones": 0.010871278122067451,
          "Male": 0.41947126388549805,
          "Mouth Slightly Open": 0.019942771643400192,
          "Mustache": 0.0007017994066700339,
          "Narrow Eyes": 0.30448776483535767,
          "No Beard": 0.9588558673858643,
          "Oval Face": 0.01143964659422636,
          "Pale Skin": 0.0013812541728839278,
          "Pointy Nose": 0.3312559723854065,
          "Receding Hairline": 0.05595812946557999,
          "Rosy Cheeks": 0.00023643049644306302,
          "Sideburns": 0.002981045516207814,
          "Smiling": 0.0013618771918118,
          "Straight Hair": 0.0934053510427475,
          "Wavy Hair": 0.11804280430078506,
          "Wearing Earrings": 0.01532247569411993,
          "Wearing Hat": 0.0014827033737674356,
          "Wearing Lipstick": 0.003883670549839735,
          "Wearing Necklace": 0.04910506308078766,
          "Wearing Necktie": 0.0002714686270337552,
          "Young": 0.9296848773956299
        },
        "age": [
          0.24830776453018188,
          0.8961533904075623,
          0.9655066132545471,
          0.17061802744865417,
          0.0799589604139328,
          0.0003009504289366305,
          8.940839325077832e-05,
          1.6731172536310623e-06
        ],
        "race": [
          0.9966848492622375,
          0.00024672987638041377,
          0.7925052046775818,
          0.18508301675319672,
          0.30135422945022583
        ],
        "gender": [
          0.02921222895383835,
          0.9734192490577698
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 15.91249406337738,
          "disgust": 0.0011688992344716098,
          "fear": 7.761210203170776,
          "happy": 0.4479210823774338,
          "sad": 74.42781329154968,
          "surprise": 0.0011380331670807209,
          "neutral": 1.4482557773590088
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 1076,
          "h": 1633,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 30,
        "gender": {
          "Woman": 81.67287707328796,
          "Man": 18.327121436595917
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 7.354997098445892,
          "indian": 12.330097705125809,
          "black": 29.217466711997986,
          "white": 12.663672864437103,
          "middle eastern": 8.237025141716003,
          "latino hispanic": 30.196738243103027
        },
        "dominant_race": "latino hispanic"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.09984025359153748,
        0.005029189400374889,
        0.8152865767478943,
        0.9855887293815613
      ]
    ],
    "face_boxes": [
      [
        0.38041722774505615,
        0.1708921641111374,
        0.5673527717590332,
        0.6750636100769043
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.6117415153616005,
            0.8136054491834142
          ],
          [
            0.506874784939819,
            0.745878155250802
          ],
          [
            0.39967768273088666,
            0.9697928821300509
          ],
          [
            0.25830179431041084,
            0.8343382942648263
          ],
          [
            0.716608245783382,
            0.8813327431160264
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.24431956358750664,
            0.8288095355764495
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.39967768273088666,
            0.3948019785388933
          ],
          [
            0.4369636313252979,
            0.403095116571458
          ],
          [
            0.5721251949800386,
            0.40585949591564635
          ],
          [
            0.5830002633200752,
            0.41415263394821106
          ]
        ],
        "dw_hand_1": [
          [
            0.2349980764389038,
            0.7956369834461907
          ],
          [
            0.24898030716180802,
            0.7071768444321663
          ],
          [
            0.25830179431041084,
            0.6021304293530125
          ],
          [
            0.24276598239607278,
            0.5357853250924944
          ],
          [
            0.23965882001320518,
            0.49431963492967057
          ],
          [
            0.171301247590118,
            0.5938372913204478
          ],
          [
            0.14333678614430959,
            0.5496072218134357
          ],
          [
            0.1464439485271771,
            0.5219634283715533
          ],
          [
            0.15265827329291232,
            0.5053771523064237
          ],
          [
            0.14799752971861097,
            0.6380673608274601
          ],
          [
            0.12469381184710392,
            0.5993660500088244
          ],
          [
            0.12469381184710392,
            0.57448663591113
          ],
          [
            0.12624739303853777,
            0.5606647391901888
          ],
          [
            0.140229623761442,
            0.6850618096786604
          ],
          [
            0.12469381184710392,
            0.6518892575484011
          ],
          [
            0.12780097422997153,
            0.6297742227948953
          ],
          [
            0.13246171780427302,
            0.6187167054181422
          ],
          [
            0.14333678614430959,
            0.723763120497296
          ],
          [
            0.13712246137857437,
            0.6988837063996016
          ],
          [
            0.140229623761442,
            0.6850618096786604
          ],
          [
            0.1464439485271771,
            0.6878261890228488
          ]
        ],
        "dw_hand_2": [
          [
            0.25208746954467565,
            0.8066945008229434
          ],
          [
            0.24898030716180802,
            0.7209987411531078
          ],
          [
            0.2598553755018446,
            0.6187167054181422
          ],
          [
            0.28160551218191776,
            0.5661934978785651
          ],
          [
            0.30490923005342485,
            0.5357853250924944
          ],
          [
            0.19771212784449266,
            0.6131879467297658
          ],
          [
            0.1821763159301546,
            0.5717222565669419
          ],
          [
            0.14799752971861097,
            0.5579003598460004
          ],
          [
            0.14489036733574334,
            0.5468428424692475
          ],
          [
            0.1573190168672138,
            0.6491248782042129
          ],
          [
            0.1293545554214054,
            0.6131879467297658
          ],
          [
            0.12314023065567016,
            0.6021304293530125
          ],
          [
            0.12314023065567016,
            0.5993660500088244
          ],
          [
            0.14178320495287586,
            0.6878261890228488
          ],
          [
            0.12624739303853777,
            0.6657111542693424
          ],
          [
            0.12314023065567016,
            0.6574180162367776
          ],
          [
            0.12469381184710392,
            0.6574180162367776
          ],
          [
            0.13712246137857437,
            0.734820637874049
          ],
          [
            0.12780097422997153,
            0.715469982464731
          ],
          [
            0.12780097422997153,
            0.7099412237763547
          ],
          [
            0.13246171780427302,
            0.7044124650879782
          ]
        ],
        "dw_face": [
          [
            0.39657052034801904,
            0.38927321985051677
          ],
          [
            0.4012312639223205,
            0.4307389100133407
          ],
          [
            0.4027848451137543,
            0.4749689795203528
          ],
          [
            0.4089991698794895,
            0.5164346696831765
          ],
          [
            0.4152134946452247,
            0.5579003598460004
          ],
          [
            0.4245349817938275,
            0.5966016706646362
          ],
          [
            0.43851721251673165,
            0.6353029814832718
          ],
          [
            0.45716018681393733,
            0.660182395580966
          ],
          [
            0.48046390468544425,
            0.660182395580966
          ],
          [
            0.5022140413655176,
            0.6408317401716481
          ],
          [
            0.5239641780455906,
            0.6159523260739538
          ],
          [
            0.5379464087684949,
            0.5855441532878831
          ],
          [
            0.5534822206828329,
            0.5496072218134357
          ],
          [
            0.561250126640002,
            0.5136702903389886
          ],
          [
            0.5643572890228695,
            0.46667584148778807
          ],
          [
            0.5643572890228695,
            0.42521015132496415
          ],
          [
            0.5643572890228695,
            0.38098008181795207
          ],
          [
            0.3903561955822838,
            0.3588650470644459
          ],
          [
            0.3919097767737177,
            0.3588650470644459
          ],
          [
            0.3919097767737177,
            0.3588650470644459
          ],
          [
            0.3919097767737177,
            0.3588650470644459
          ],
          [
            0.3934633579651514,
            0.36162942640863427
          ],
          [
            0.4058920074966219,
            0.3588650470644459
          ],
          [
            0.41832065702809224,
            0.3533362883760694
          ],
          [
            0.43230288775099646,
            0.3505719090318812
          ],
          [
            0.4478386996653345,
            0.3561006677202577
          ],
          [
            0.4618209303882387,
            0.36439380575282243
          ],
          [
            0.4012312639223205,
            0.4003307372272698
          ],
          [
            0.3950169391565853,
            0.42521015132496415
          ],
          [
            0.38880261439085007,
            0.4500895654226585
          ],
          [
            0.3810347084336811,
            0.4749689795203528
          ],
          [
            0.38569545200798244,
            0.49431963492967057
          ],
          [
            0.3950169391565853,
            0.4998483936180471
          ],
          [
            0.4058920074966219,
            0.5026127729622353
          ],
          [
            0.4136599134537909,
            0.5026127729622353
          ],
          [
            0.42142781941095986,
            0.4998483936180471
          ],
          [
            0.39812410153945293,
            0.3975663578830815
          ],
          [
            0.39812410153945293,
            0.3975663578830815
          ],
          [
            0.39967768273088666,
            0.3975663578830815
          ],
          [
            0.39967768273088666,
            0.3975663578830815
          ],
          [
            0.39967768273088666,
            0.4003307372272698
          ],
          [
            0.39812410153945293,
            0.4003307372272698
          ],
          [
            0.42764214417669505,
            0.4086238752598345
          ],
          [
            0.435410050133864,
            0.403095116571458
          ],
          [
            0.4447315372824669,
            0.4086238752598345
          ],
          [
            0.4540530244310697,
            0.4113882546040229
          ],
          [
            0.4447315372824669,
            0.41691701329239944
          ],
          [
            0.435410050133864,
            0.4196813926365876
          ],
          [
            0.41832065702809224,
            0.5579003598460004
          ],
          [
            0.4121063322623571,
            0.5523716011576238
          ],
          [
            0.40744558868805564,
            0.5440784631250591
          ],
          [
            0.4089991698794895,
            0.5468428424692475
          ],
          [
            0.4121063322623571,
            0.5440784631250591
          ],
          [
            0.42764214417669505,
            0.5523716011576238
          ],
          [
            0.4447315372824669,
            0.5634291185343772
          ],
          [
            0.43851721251673165,
            0.57448663591113
          ],
          [
            0.42919572536812894,
            0.5827797739436947
          ],
          [
            0.4198742382195261,
            0.5855441532878831
          ],
          [
            0.41832065702809224,
            0.57448663591113
          ],
          [
            0.41832065702809224,
            0.5661934978785651
          ],
          [
            0.41832065702809224,
            0.5579003598460004
          ],
          [
            0.41676707583665845,
            0.5579003598460004
          ],
          [
            0.4152134946452247,
            0.5579003598460004
          ],
          [
            0.42919572536812894,
            0.5606647391901888
          ],
          [
            0.44317795609103317,
            0.5634291185343772
          ],
          [
            0.43230288775099646,
            0.5661934978785651
          ],
          [
            0.4198742382195261,
            0.5634291185343772
          ],
          [
            0.41832065702809224,
            0.5606647391901888
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "016018",
  "objects": [
    {
      "box": [
        0.1963277906179428,
        0.44894617795944214,
        0.2591586709022522,
        0.6001841425895691
      ],
      "name": "smartphone",
      "possible_names": [
        "smartphone"
      ]
    },
    {
      "box": [
        0.35220348834991455,
        0.5630338191986084,
        0.42291194200515747,
        0.6457055807113647
      ],
      "name": "vape pen",
      "possible_names": [
        "vape pen"
      ]
    }
  ],
  "mask_file": "./person_labeling/./016018.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A nighttime urban setting bathed in red light with blurred city lights in the background and a person holding an electronic device and a vape pen creating a modern and moody atmosphere",
  "overall_past": "Before this scene, the individual likely arrived at a nighttime social gathering or urban event—perhaps a rooftop party, music venue, or street festival—where the atmosphere was already charged with energy and red lighting was used to create a bold, immersive ambiance. They may have been navigating through the crowd, possibly checking messages or scrolling through social media to connect with friends or catch up on updates, while seeking a moment of personal calm. The act of vaping could have been a deliberate pause, a ritual to center themselves amid the sensory overload of the environment, signaling a transition from the external buzz to a private, introspective moment.",
  "overall_past_clean": "The individual pushed through a dense throng of people, the pulse of music vibrating through the air as red-lit shadows danced across faces, pausing only to glance at a screen glowing faintly in their hand before stepping into a quiet corner, exhaling slowly as if shedding the weight of the crowd.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to lower the phone slightly, taking a final drag from the vape pen before pocketing both devices, their gaze briefly lifting to scan the surrounding red-lit urban landscape—perhaps noticing a familiar face in the crowd or a flickering neon sign that catches their attention. This moment of pause may lead to them stepping forward into the gathering, initiating a conversation or joining a group, suggesting a transition from solitary digital immersion to a fleeting human connection within the vibrant, atmospheric night.",
  "overall_future_clean": "A breath is drawn in, the device stowed away, and with deliberate motion, the figure steps into the pulsing rhythm of the crowd, eyes locking onto a stranger’s face across the haze—words are spoken, a smile forms, and the night shifts from isolation to shared presence.",
  "future_scene_ok": true
}