{
  "video_path": "./ref_datasets/part2/7926444001.mp4",
  "start_time": 0.0,
  "end_time": 5.4,
  "image_path": "./027924.jpg",
  "represents_multiple_types": false,
  "cross_video_duplicate": false,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/7926444001.mp4",
      "start_time": 0.0,
      "end_time": 5.4,
      "image_path": "./ref_datasets/extracted_frames/face_-4612783878568190705_1_7926444001.mp4_0.00_5.40.jpg",
      "type": "face"
    }
  ],
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "male",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a black hat, a white shirt with a checkered pattern, and has a ring on his finger.",
        "clothing": [
          {
            "possible_names": [
              "hat",
              "cap"
            ],
            "name": "hat",
            "type": "headwear",
            "color": [
              "black"
            ]
          },
          {
            "possible_names": [
              "shirt",
              "blouse"
            ],
            "name": "shirt",
            "type": "top",
            "color": [
              "white",
              "black"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "cigarette",
              "smoke"
            ],
            "name": "cigarette",
            "position": "hand"
          }
        ],
        "description": "The person is an adult male with a neutral expression. He is wearing a black hat and a white shirt with a checkered pattern. He has a ring on his finger and is holding a cigarette in his hand. The setting appears to be indoors near a window.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to be in a relaxed state, possibly enjoying a moment of leisure as indicated by the act of smoking.",
        "meaningful": true,
        "story": "The individual seems to be taking a break, perhaps reflecting or simply enjoying some downtime. The setting suggests an indoor environment with natural light streaming in, adding to the calm atmosphere.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is holding a cigarette between their fingers, exhaling smoke while standing near a window, suggesting they might be taking a break or enjoying a moment of relaxation. Their eyes are closed, indicating a sense of calmness or perhaps deep thought. The individual's attire, including a hat and a checkered shirt, along with their beard, gives off a casual yet stylish vibe, possibly reflecting their personal style or the setting they are in. The sunlight streaming through the window adds to the serene atmosphere, enhancing the overall feeling of tranquility and introspection.",
        "intention": "The individual is seeking a moment of calm and introspection using the ritual of smoking as a grounding practice amidst a serene environment",
        "intention_ok": true
      },
      "hoi": [
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "face",
            "action": [
              [
                "face",
                "mouth holding"
              ],
              [
                "face",
                "smoking"
              ]
            ]
          },
          "object": 0
        }
      ],
      "facex_detailing": {
        "landmarks": [
          [
            0.5248291416714589,
            0.2513484968079461
          ],
          [
            0.5170539082515807,
            0.301903564210922
          ],
          [
            0.5041207515945038,
            0.34356853924100356
          ],
          [
            0.4920598644674534,
            0.4000814059424021
          ],
          [
            0.4809153534072851,
            0.4442779520201304
          ],
          [
            0.4821499460243753,
            0.5015272000479319
          ],
          [
            0.4830562307721093,
            0.5460930990794349
          ],
          [
            0.4837494653560931,
            0.5643422872301131
          ],
          [
            0.4918428144905539,
            0.6124499794036624
          ],
          [
            0.5176419195674715,
            0.6334839135881454
          ],
          [
            0.5462286436132023,
            0.644004201510596
          ],
          [
            0.5803261328488588,
            0.6386958288767982
          ],
          [
            0.6170720723768075,
            0.6273955034831215
          ],
          [
            0.6536243764772302,
            0.5897026501004659
          ],
          [
            0.6778741344099953,
            0.5334991315054515
          ],
          [
            0.6947532321370783,
            0.4644138059918842
          ],
          [
            0.7152397838376817,
            0.3934939516915215
          ],
          [
            0.5207969680428505,
            0.24550667111835786
          ],
          [
            0.5224068992992952,
            0.20116693339650593
          ],
          [
            0.5304468339929979,
            0.20071191579576525
          ],
          [
            0.5410426311904476,
            0.19587332568471394
          ],
          [
            0.5447387377775851,
            0.1907039681124309
          ],
          [
            0.5716988539057118,
            0.1798365512537578
          ],
          [
            0.5885144303597155,
            0.17906717875647168
          ],
          [
            0.6021572733209247,
            0.18131274968858752
          ],
          [
            0.6160167215480691,
            0.19155980991938756
          ],
          [
            0.6335356445894356,
            0.2419684797998459
          ],
          [
            0.5434711253713994,
            0.22054763057875254
          ],
          [
            0.5277808227886757,
            0.2466165947535681
          ],
          [
            0.5138886986477744,
            0.26092589885469464
          ],
          [
            0.5012518177429836,
            0.27811206371065167
          ],
          [
            0.5057004321632641,
            0.3535433935740637
          ],
          [
            0.5104037315185581,
            0.35370826002151246
          ],
          [
            0.5170347701669449,
            0.35490309473067994
          ],
          [
            0.5307050869578407,
            0.35091945235691374
          ],
          [
            0.5448995576727957,
            0.35715303383176283
          ],
          [
            0.5226614135894038,
            0.27344752341981915
          ],
          [
            0.523409986247619,
            0.2786792104206388
          ],
          [
            0.5346352356175582,
            0.2725335543117826
          ],
          [
            0.5357341267523311,
            0.2560694656674824
          ],
          [
            0.532037565112114,
            0.2566504832298036
          ],
          [
            0.5266937940603211,
            0.2625215833149259
          ],
          [
            0.578828263584347,
            0.25755837266407317
          ],
          [
            0.5815582511148283,
            0.25222486390007864
          ],
          [
            0.5976845979690552,
            0.25971604377504376
          ],
          [
            0.6042725461934294,
            0.2566750318285019
          ],
          [
            0.5949735158256123,
            0.25963184795682387
          ],
          [
            0.5834846045644511,
            0.24568755418535268
          ],
          [
            0.4954821842323457,
            0.44446642190691016
          ],
          [
            0.49795259500720673,
            0.4289367127040076
          ],
          [
            0.5041499422153547,
            0.400366971795521
          ],
          [
            0.5100042673093932,
            0.39279458484952406
          ],
          [
            0.5125525645556904,
            0.38819939882036236
          ],
          [
            0.536361003738074,
            0.405474383111984
          ],
          [
            0.5518480010153283,
            0.4452872289551629
          ],
          [
            0.533723619509311,
            0.4508088755229163
          ],
          [
            0.5212410533091142,
            0.4749894240545847
          ],
          [
            0.5033556108673414,
            0.47825012169187026
          ],
          [
            0.49678783493914774,
            0.475292896845984
          ],
          [
            0.4974183109810665,
            0.45538242506602455
          ],
          [
            0.49418691183839525,
            0.43471610678566824
          ],
          [
            0.4981063046980472,
            0.4293713071989634
          ],
          [
            0.5094798651745632,
            0.41222948819871924
          ],
          [
            0.5309211647758881,
            0.4132815527537513
          ],
          [
            0.549643765265743,
            0.44055246587783575
          ],
          [
            0.5290096626040481,
            0.45071793586488745
          ],
          [
            0.5054375717859892,
            0.4581250221010238
          ],
          [
            0.4944622499779577,
            0.4420337860546415
          ]
        ],
        "visibility": [
          0.05494513735175133,
          1.1765722774725873e-05,
          0.00011535642988746986,
          3.9792567027921444e-13,
          1.9067210814682767e-05,
          9.962303693100694e-07,
          2.0035296713011737e-18,
          1.4818533553007107e-11,
          0.001852201297879219,
          3.701678110701323e-07,
          0.9951352477073669,
          5.121468138469254e-09,
          8.688898134323608e-08,
          4.236287338699185e-07,
          9.93032218954415e-12,
          1.8921755327028222e-05,
          4.4298399188846815e-06,
          1.8013412272921414e-07,
          0.9999922513961792,
          0.0015872076619416475,
          1.150533762483974e-06,
          9.510687959846109e-05,
          1.0,
          0.2183336615562439,
          0.009811216033995152,
          0.6039307713508606,
          0.9999256134033203,
          0.9995997548103333,
          1.0
        ],
        "headpose": {
          "pitch": 37.00145016808771,
          "yaw": 55.67753694397705,
          "roll": 19.677056121396593
        },
        "attributes": {
          "5 oClock Shadow": 0.021947184577584267,
          "Arched Eyebrows": 0.003933771979063749,
          "Attractive": 0.031987134367227554,
          "Bags Under Eyes": 0.0227813683450222,
          "Bald": 0.0036298902705311775,
          "Bangs": 0.0005407293210737407,
          "Big Lips": 0.03475296124815941,
          "Big Nose": 0.10181634873151779,
          "Black Hair": 0.10509315878152847,
          "Blond Hair": 0.00020340524497441947,
          "Blurry": 0.017303582280874252,
          "Brown Hair": 0.006321124266833067,
          "Bushy Eyebrows": 0.18423885107040405,
          "Chubby": 0.05370169132947922,
          "Double Chin": 0.0022789358627051115,
          "Eyeglasses": 0.011077502742409706,
          "Goatee": 0.5882776379585266,
          "Gray Hair": 0.00109008455183357,
          "Heavy Makeup": 0.000677035131957382,
          "High Cheekbones": 0.005471829790621996,
          "Male": 0.998348593711853,
          "Mouth Slightly Open": 0.14389799535274506,
          "Mustache": 0.10054907947778702,
          "Narrow Eyes": 0.27902379631996155,
          "No Beard": 0.02731592021882534,
          "Oval Face": 0.023978887125849724,
          "Pale Skin": 0.007693884428590536,
          "Pointy Nose": 0.14469875395298004,
          "Receding Hairline": 0.005704081617295742,
          "Rosy Cheeks": 0.00036076470860280097,
          "Sideburns": 0.9285902976989746,
          "Smiling": 0.0056840525940060616,
          "Straight Hair": 0.011852098628878593,
          "Wavy Hair": 0.04038288816809654,
          "Wearing Earrings": 0.004642656538635492,
          "Wearing Hat": 0.5400621294975281,
          "Wearing Lipstick": 0.00042199765448458493,
          "Wearing Necklace": 0.008851139806210995,
          "Wearing Necktie": 0.006859209388494492,
          "Young": 0.7090669274330139
        },
        "age": [
          0.006862949579954147,
          0.012568848207592964,
          0.9309088587760925,
          0.9682746529579163,
          0.7328237295150757,
          0.04721637815237045,
          0.0005555415991693735,
          3.0788321510044625e-06
        ],
        "race": [
          0.950544536113739,
          0.006197940558195114,
          0.28925228118896484,
          0.6256195306777954,
          0.6745314598083496
        ],
        "gender": [
          0.9971428513526917,
          0.005974804982542992
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 4.851119062010412e-07,
          "disgust": 7.464596649131572e-10,
          "fear": 0.027687157853506505,
          "happy": 0.0045495671656681225,
          "sad": 99.96775388717651,
          "surprise": 6.74131499863069e-12,
          "neutral": 5.639992650685599e-06
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 1165,
          "h": 1619,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 37,
        "gender": {
          "Woman": 9.787961840629578,
          "Man": 90.21203517913818
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 16.684383153915405,
          "indian": 11.01372018456459,
          "black": 14.556755125522614,
          "white": 25.652676820755005,
          "middle eastern": 19.051237404346466,
          "latino hispanic": 13.041229546070099
        },
        "dominant_race": "white"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.19171342253684998,
        0.06787513941526413,
        0.9983842968940735,
        0.9884390234947205
      ]
    ],
    "face_boxes": [
      [
        0.49302494525909424,
        0.14733389019966125,
        0.6953970789909363,
        0.6473841667175293
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.7131861163973808,
            0.9804133199075787
          ],
          [
            0.491305469751358,
            0.997578772997941
          ],
          [
            0.2615318356752396,
            1.0194257132947657
          ],
          [
            0.2667938272953033,
            0.922674977694542
          ],
          [
            0.9350667630434036,
            0.9632478668172164
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.5263854138851166,
            0.32344461526734974
          ],
          [
            0.5860213189125061,
            0.3109606493834499
          ],
          [
            0.7456350647211075,
            0.46076823999024796
          ],
          [
            0.7421270703077316,
            0.44516328263537314
          ]
        ],
        "dw_hand_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_hand_2": [
          [
            0.28608779656887057,
            0.9039490288686922
          ],
          [
            0.32642973232269284,
            0.8165612676813934
          ],
          [
            0.3772956513166428,
            0.7416574723779943
          ],
          [
            0.3860656373500824,
            0.6761166514875202
          ],
          [
            0.3878196345567703,
            0.613696822068021
          ],
          [
            0.3404617099761963,
            0.6043338476550961
          ],
          [
            0.34923169600963594,
            0.5512769926485218
          ],
          [
            0.3650176708698273,
            0.5450350097065718
          ],
          [
            0.3772956513166428,
            0.5824869073582714
          ],
          [
            0.30713576304912565,
            0.6043338476550961
          ],
          [
            0.322921737909317,
            0.5762449244163215
          ],
          [
            0.35098569321632384,
            0.6261807879519208
          ],
          [
            0.3650176708698273,
            0.691721608842395
          ],
          [
            0.27380981612205507,
            0.6293017794228958
          ],
          [
            0.29310378539562226,
            0.6261807879519208
          ],
          [
            0.32467573511600495,
            0.68860061737142
          ],
          [
            0.347477698802948,
            0.7447784638489693
          ],
          [
            0.24399186360836028,
            0.6667536770745953
          ],
          [
            0.2615318356752396,
            0.6667536770745953
          ],
          [
            0.28608779656887057,
            0.7073265661972697
          ],
          [
            0.3106437574625015,
            0.7572624297328691
          ]
        ],
        "dw_face": [
          [
            0.5246314166784286,
            0.32344461526734974
          ],
          [
            0.5176154278516769,
            0.36713849586099917
          ],
          [
            0.5088454418182373,
            0.4108323764546486
          ],
          [
            0.5000754557847976,
            0.45764724851927296
          ],
          [
            0.4965674613714218,
            0.5075831120548724
          ],
          [
            0.4983214585781097,
            0.5543979841194967
          ],
          [
            0.5053374474048614,
            0.6012128561841211
          ],
          [
            0.5281394110918045,
            0.613696822068021
          ],
          [
            0.5562033663988113,
            0.6043338476550961
          ],
          [
            0.5842673217058182,
            0.5918498817711962
          ],
          [
            0.6105772798061371,
            0.5824869073582714
          ],
          [
            0.6351332406997681,
            0.5606399670614467
          ],
          [
            0.659689201593399,
            0.5387930267646219
          ],
          [
            0.6789831708669662,
            0.49822013764194745
          ],
          [
            0.6947691457271576,
            0.46076823999024796
          ],
          [
            0.7052931289672851,
            0.41707435939659854
          ],
          [
            0.7123091177940368,
            0.3702594873319741
          ],
          [
            0.5263854138851166,
            0.29847668349955003
          ],
          [
            0.5298934082984924,
            0.29223470055760015
          ],
          [
            0.5316474055051803,
            0.29223470055760015
          ],
          [
            0.5351553999185562,
            0.2891137090866252
          ],
          [
            0.5386633943319321,
            0.2891137090866252
          ],
          [
            0.5614653580188751,
            0.27038776026077543
          ],
          [
            0.5790053300857544,
            0.26102478584785055
          ],
          [
            0.5965453021526337,
            0.2547828029059006
          ],
          [
            0.6158392714262009,
            0.26102478584785055
          ],
          [
            0.6316252462863922,
            0.2766297432027253
          ],
          [
            0.5386633943319321,
            0.31408164085442486
          ],
          [
            0.5263854138851166,
            0.33280758968027463
          ],
          [
            0.5141074334383011,
            0.3484125470351494
          ],
          [
            0.5018294529914856,
            0.3640175043900242
          ],
          [
            0.4965674613714218,
            0.4014694020417237
          ],
          [
            0.5053374474048614,
            0.41707435939659854
          ],
          [
            0.5176154278516769,
            0.4201953508675735
          ],
          [
            0.5298934082984924,
            0.4201953508675735
          ],
          [
            0.5421713887453079,
            0.41707435939659854
          ],
          [
            0.5246314166784286,
            0.33280758968027463
          ],
          [
            0.5246314166784286,
            0.3265656067383247
          ],
          [
            0.5263854138851166,
            0.32344461526734974
          ],
          [
            0.5298934082984924,
            0.32344461526734974
          ],
          [
            0.5281394110918045,
            0.3265656067383247
          ],
          [
            0.5263854138851166,
            0.32968659820929963
          ],
          [
            0.5754973356723785,
            0.3172026323253998
          ],
          [
            0.5842673217058182,
            0.3078396579124749
          ],
          [
            0.5965453021526337,
            0.3078396579124749
          ],
          [
            0.6088232825994492,
            0.31408164085442486
          ],
          [
            0.5982992993593216,
            0.3172026323253998
          ],
          [
            0.5860213189125061,
            0.32032362379637475
          ],
          [
            0.5018294529914856,
            0.5044621205838974
          ],
          [
            0.4983214585781097,
            0.48885716322902256
          ],
          [
            0.5018294529914856,
            0.47013121440317285
          ],
          [
            0.5053374474048614,
            0.46701022293219785
          ],
          [
            0.5123534362316131,
            0.4638892314612229
          ],
          [
            0.5281394110918045,
            0.47637319734512273
          ],
          [
            0.5439253859519958,
            0.49197815469999756
          ],
          [
            0.5316474055051803,
            0.49822013764194745
          ],
          [
            0.5176154278516769,
            0.5075831120548724
          ],
          [
            0.5035834501981735,
            0.5169460864677973
          ],
          [
            0.5000754557847976,
            0.5138250949968223
          ],
          [
            0.5000754557847976,
            0.5107041035258473
          ],
          [
            0.5018294529914856,
            0.5044621205838974
          ],
          [
            0.5053374474048614,
            0.49822013764194745
          ],
          [
            0.5070914446115494,
            0.48885716322902256
          ],
          [
            0.5246314166784286,
            0.4857361717580476
          ],
          [
            0.54041739153862,
            0.49197815469999756
          ],
          [
            0.5246314166784286,
            0.49197815469999756
          ],
          [
            0.5070914446115494,
            0.49822013764194745
          ],
          [
            0.5053374474048614,
            0.5013411291129224
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            0.4053596066236496,
            0.5107041035258473
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.2703018217086792,
            0.9351589435784418
          ]
        ]
      }
    ]
  },
  "new_filename": "027924",
  "objects": [
    {
      "box": [
        0.44710975885391235,
        0.4104522168636322,
        0.506600558757782,
        0.502694308757782
      ],
      "name": "cigarette",
      "possible_names": [
        "cigarette"
      ]
    }
  ],
  "mask_file": "./person_labeling/./027924.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A person is holding a lit cigarette near their mouth with smoke rising against a bright window backdrop and wearing a checkered shirt and a hat with rings on their fingers.",
  "overall_past": "Before this scene, the individual likely finished a period of focused work or deep contemplation, possibly indoors in a quiet space such as an office or study. The act of stepping near the window with a cigarette suggests a deliberate pause—a transition from mental engagement to physical relaxation. The careful positioning of the cigarette, the closed eyes, and the serene expression indicate a moment of intentional stillness, implying that the person had been mentally or emotionally invested in something significant, perhaps a decision, creative process, or personal reflection. The sunlight streaming through the window may symbolize a shift in perspective or a moment of clarity, suggesting that the current scene follows a period of inner struggle or concentration.",
  "overall_past_clean": "The mind had been locked in relentless pursuit—thoughts weaving through complexity, decisions crystallizing under pressure, emotions simmering beneath silence—until the weight of focus finally released, leaving only the quiet echo of resolution and the instinct to step into stillness.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to slowly lower the cigarette, letting the ember glow faintly before extinguishing it against the windowsill or in a nearby ashtray. With a final breath of smoke drifting into the sunlight, they open their eyes, briefly gazing out at the view beyond the window—perhaps a quiet street, a distant skyline, or the shifting clouds—before turning away, the moment of stillness giving way to a quiet continuation of their day, perhaps stepping back into motion with a renewed sense of clarity or purpose.",
  "overall_future_clean": "The figure rises with deliberate calm, the lingering haze of smoke dissolving into the air as they step forward, shoulders settling into a steady rhythm, eyes now fixed on the path ahead, moving with quiet intention toward whatever comes next.",
  "future_scene_ok": true
}