{
  "video_path": "./ref_datasets/part2/5900722004.mp4",
  "start_time": 0.0,
  "end_time": 6.08,
  "image_path": "./003117.jpg",
  "represents_multiple_types": false,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/5900722002.mp4",
      "start_time": 0.0,
      "end_time": 3.04,
      "image_path": "./ref_datasets/extracted_frames/person_-588908277274928873_1_5900722002.mp4_0.00_3.04.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/5900722003.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/person_2201825760614866250_1_5900722003.mp4_0.00_6.08.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/5900722004.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/person_4076002595179046790_1_5900722004.mp4_0.00_6.08.jpg",
      "type": "person"
    }
  ],
  "cross_video_duplicate": true,
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a loose-fitting, olive-green shirt with visible white buttons on the cuffs. The shirt appears to be made of a soft material and is worn in a casual manner.",
        "clothing": [
          {
            "possible_names": [
              "shirt",
              "blouse",
              "top"
            ],
            "name": "shirt",
            "type": "top",
            "color": [
              "olive-green"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "wine glass",
              "glass"
            ],
            "name": "wine glass",
            "position": "standalone"
          }
        ],
        "description": "The person is an adult female who appears to be in a neutral emotional state. She is wearing a loose-fitting, olive-green shirt with white buttons on the cuffs. The shirt is casual and made of a soft material. In front of her is a wine glass placed on the table. The setting includes a plain background with a hint of green curtains.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a calm and neutral expression, possibly indicating a state of relaxation or contemplation.",
        "meaningful": true,
        "story": "The person seems to be in a relaxed setting, perhaps enjoying a quiet moment at home or in a café. The presence of the wine glass suggests she might be taking a break or indulging in a leisurely drink.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person in the green bounding box is leaning on a table with their head resting near a wine glass, suggesting a moment of relaxation or contemplation. Their hand is gently placed on the table, indicating a calm demeanor. The individual appears to be in a quiet setting, possibly enjoying a solitary moment, as there are no other people present. The expression seems serene, hinting at a desire for peace or reflection. The presence of the wine glass suggests they might be taking a break, perhaps after a long day, to unwind and savor a drink. The overall scene conveys a sense of tranquility and introspection.",
        "intention": "The individual is seeking calm and introspection through a deliberate pause in a quiet environment to unwind and reflect",
        "intention_ok": true
      },
      "hoi": [
        {
          "relevant": true,
          "relationship": {
            "standalone": true,
            "position": "standalone",
            "action": [
              [
                "standalone",
                "look at"
              ],
              [
                "standalone",
                "lying behind"
              ]
            ]
          },
          "object": 0
        }
      ],
      "facex_detailing": {
        "landmarks": [
          [
            0.7067185633017549,
            0.3744640797692001
          ],
          [
            0.6845704855264297,
            0.40592482755423853
          ],
          [
            0.6627995109385145,
            0.4351435559767264
          ],
          [
            0.6299793514190242,
            0.4574802237528342
          ],
          [
            0.59091784183069,
            0.47679913996388673
          ],
          [
            0.5697192215427225,
            0.5282740306286584
          ],
          [
            0.5624670693318227,
            0.5647283704507918
          ],
          [
            0.5583722646780578,
            0.6150058689571561
          ],
          [
            0.5535421913290131,
            0.6426741759613077
          ],
          [
            0.5726529394409486,
            0.6859495182516714
          ],
          [
            0.5979658894939348,
            0.7301646784499839
          ],
          [
            0.6257588223920071,
            0.75470889270621
          ],
          [
            0.6611016095017216,
            0.7786230126385967
          ],
          [
            0.7102421465595918,
            0.775540552442036
          ],
          [
            0.7455219805706292,
            0.7748051599219993
          ],
          [
            0.7726504442814206,
            0.769343299462051
          ],
          [
            0.8276099959787513,
            0.759297860236395
          ],
          [
            0.7065709501039237,
            0.37753084084344285
          ],
          [
            0.7188198244465249,
            0.39156379195117447
          ],
          [
            0.7257021744070309,
            0.4259107554715777
          ],
          [
            0.7416361197829247,
            0.46599688353361907
          ],
          [
            0.7411157951490688,
            0.5040891252812885
          ],
          [
            0.7539712626686585,
            0.5871283996672858
          ],
          [
            0.7606900828291796,
            0.6050540595142929
          ],
          [
            0.7856526018918626,
            0.6443472569581692
          ],
          [
            0.7901821479733502,
            0.675009848327233
          ],
          [
            0.7879068291346942,
            0.7105767368639588
          ],
          [
            0.7295732375101319,
            0.5627453268520416
          ],
          [
            0.701269938344402,
            0.5721448748515396
          ],
          [
            0.6904168576999966,
            0.5597204916691654
          ],
          [
            0.6605229752770226,
            0.5723111008525525
          ],
          [
            0.6534671371503334,
            0.5423444640699518
          ],
          [
            0.655015579175337,
            0.5660834491568267
          ],
          [
            0.6506633955120508,
            0.5975947709310623
          ],
          [
            0.6571720549836755,
            0.6126833549252263
          ],
          [
            0.669115590713253,
            0.6162529333558663
          ],
          [
            0.7004038122416074,
            0.41902452287850556
          ],
          [
            0.7149119209830782,
            0.4413444159522889
          ],
          [
            0.7192489992594346,
            0.47324298998666187
          ],
          [
            0.7194702372320795,
            0.5100892972378503
          ],
          [
            0.7001872457497353,
            0.48233987629098235
          ],
          [
            0.7031910078866142,
            0.44334212655112853
          ],
          [
            0.7391139397597206,
            0.6137176065848617
          ],
          [
            0.741992159347449,
            0.6273254102500028
          ],
          [
            0.7448077475252961,
            0.6652577491033644
          ],
          [
            0.7532988211938314,
            0.6916225400551286
          ],
          [
            0.7402027304550367,
            0.6715527820839453
          ],
          [
            0.7433544414650117,
            0.6301898427741238
          ],
          [
            0.614721693797037,
            0.526638801356472
          ],
          [
            0.6262193268963269,
            0.5650480241371841
          ],
          [
            0.6299162584556532,
            0.5831031881627582
          ],
          [
            0.6392285336873361,
            0.6005774955270151
          ],
          [
            0.6414081850754363,
            0.6049228387534934
          ],
          [
            0.6444389131252787,
            0.6444283057142187
          ],
          [
            0.632665494822764,
            0.6866192026113076
          ],
          [
            0.6112756655119094,
            0.6669142292290138
          ],
          [
            0.594879677120064,
            0.6519927838492016
          ],
          [
            0.5978163251836252,
            0.6230018828281019
          ],
          [
            0.6012718013288187,
            0.6020225752913763
          ],
          [
            0.6069079428811425,
            0.5586381757070148
          ],
          [
            0.6230014039403093,
            0.54097221954159
          ],
          [
            0.6258254679186004,
            0.5825564675860935
          ],
          [
            0.6321536320028827,
            0.6124541586038297
          ],
          [
            0.6245052011550537,
            0.6399238201045485
          ],
          [
            0.6341169266961515,
            0.6739685565075546
          ],
          [
            0.612130630412139,
            0.6427088118104076
          ],
          [
            0.6174805388686114,
            0.6100754102071126
          ],
          [
            0.6107039965489613,
            0.5874728677449403
          ]
        ],
        "visibility": [
          0.9999977350234985,
          0.9999997615814209,
          0.7613613605499268,
          1.5300824429687054e-07,
          0.9999998807907104,
          0.9996040463447571,
          4.514092571961115e-11,
          3.3197548532371e-07,
          0.9989705085754395,
          0.9694784283638,
          0.9999995231628418,
          0.08444111049175262,
          0.0009490661323070526,
          0.9991433620452881,
          0.006954973563551903,
          0.9174984097480774,
          0.40051698684692383,
          0.012788863852620125,
          0.0004731625667773187,
          7.789292340021348e-07,
          0.012701774947345257,
          0.0010135816410183907,
          0.8764463067054749,
          2.6995164784104908e-11,
          0.0006800119299441576,
          0.09592889994382858,
          0.6328394412994385,
          0.8041576147079468,
          0.0012863923329859972
        ],
        "headpose": {
          "pitch": 11.621499424658642,
          "yaw": 16.819960670823576,
          "roll": 69.13328281646898
        },
        "attributes": {
          "5 oClock Shadow": 0.0004689637862611562,
          "Arched Eyebrows": 0.11470132321119308,
          "Attractive": 0.09386726468801498,
          "Bags Under Eyes": 0.03684188425540924,
          "Bald": 9.128585588769056e-06,
          "Bangs": 0.037451233714818954,
          "Big Lips": 0.27751708030700684,
          "Big Nose": 0.0658167228102684,
          "Black Hair": 0.000132177141495049,
          "Blond Hair": 0.746708333492279,
          "Blurry": 0.001012112945318222,
          "Brown Hair": 0.016971930861473083,
          "Bushy Eyebrows": 0.00025880514294840395,
          "Chubby": 0.019377896562218666,
          "Double Chin": 0.003865709062665701,
          "Eyeglasses": 0.01702684909105301,
          "Goatee": 3.699873559526168e-05,
          "Gray Hair": 0.03165603056550026,
          "Heavy Makeup": 0.023082805797457695,
          "High Cheekbones": 0.08401761949062347,
          "Male": 0.021643707528710365,
          "Mouth Slightly Open": 0.021742234006524086,
          "Mustache": 1.2323263035796117e-05,
          "Narrow Eyes": 0.07954677939414978,
          "No Beard": 0.9990326166152954,
          "Oval Face": 0.07766252756118774,
          "Pale Skin": 0.002776301931589842,
          "Pointy Nose": 0.3804447650909424,
          "Receding Hairline": 0.00523039698600769,
          "Rosy Cheeks": 0.020710168406367302,
          "Sideburns": 4.431423076312058e-05,
          "Smiling": 0.006413768511265516,
          "Straight Hair": 0.8913657069206238,
          "Wavy Hair": 0.043164681643247604,
          "Wearing Earrings": 0.012072816491127014,
          "Wearing Hat": 0.0003981514018960297,
          "Wearing Lipstick": 0.22941185534000397,
          "Wearing Necklace": 0.0804223120212555,
          "Wearing Necktie": 0.0014557780232280493,
          "Young": 0.8054593801498413
        },
        "age": [
          0.9754462838172913,
          0.06594456732273102,
          0.031087415292859077,
          0.0004897653707303107,
          0.009108061902225018,
          0.0028349468484520912,
          0.16687557101249695,
          0.0057882810942828655
        ],
        "race": [
          0.981316328048706,
          4.474959860090166e-05,
          0.9998056292533875,
          0.02109532058238983,
          0.08250229060649872
        ],
        "gender": [
          0.03321058303117752,
          0.9705843329429626
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 0.810161791741848,
          "disgust": 1.905458901774182e-05,
          "fear": 39.22139108181,
          "happy": 0.030950410291552544,
          "sad": 0.5761059932410717,
          "surprise": 0.017908438167069107,
          "neutral": 59.34346914291382
        },
        "dominant_emotion": "neutral",
        "region": {
          "x": 0,
          "y": 0,
          "w": 1681,
          "h": 1377,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 42,
        "gender": {
          "Woman": 19.528697431087494,
          "Man": 80.47130703926086
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 7.282149791717529,
          "indian": 2.678445912897587,
          "black": 0.5225266329944134,
          "white": 55.675214529037476,
          "middle eastern": 20.6708624958992,
          "latino hispanic": 13.17080408334732
        },
        "dominant_race": "white"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.0010856628650799394,
        0.23467281460762024,
        0.9041200280189514,
        0.9593115448951721
      ]
    ],
    "face_boxes": [
      [
        0.5590459704399109,
        0.36996227502822876,
        0.8328798413276672,
        0.7953968048095703
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.477176926198519,
            0.6190514663870943
          ],
          [
            0.35462261958916985,
            0.38100727240219406
          ],
          [
            0.03231444315198394,
            0.6337003398630883
          ],
          [
            0.25040320924421156,
            0.7655402011470329
          ],
          [
            0.5997312328078681,
            0.8570956603719946
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.5727113856813973,
            0.8570956603719946
          ],
          [
            0.0728442138416899,
            0.8094868215750143
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.6962306868309777,
            0.5055226969481419
          ],
          [
            0.7116705994746751,
            0.7032824888740592
          ],
          [
            0.6653508615435826,
            0.37002061729519875
          ],
          [
            0.7078106213137507,
            0.7948379480990204
          ]
        ],
        "dw_hand_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.5669214184400108,
            0.8131490399440129
          ],
          [
            0.5534114948767755,
            0.8168112583130115
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.5669214184400108,
            0.8168112583130115
          ],
          [
            0.547621527635389,
            0.8314601317890054
          ],
          [
            0.5360415931526159,
            0.835122350158004
          ],
          [
            0.5167417023479939,
            0.8277979134200066
          ],
          [
            0.5707813966009353,
            0.8387845685270027
          ],
          [
            0.5553414839572376,
            0.8461090052649991
          ],
          [
            0.5321816149916913,
            0.8387845685270027
          ],
          [
            0.49937180062383413,
            0.8314601317890054
          ],
          [
            0.5727113856813973,
            0.853433442002996
          ],
          [
            0.5572714730377,
            0.8570956603719946
          ],
          [
            0.5321816149916913,
            0.8570956603719946
          ],
          [
            0.49937180062383413,
            0.8461090052649991
          ],
          [
            0.5649914293595486,
            0.8680823154789902
          ],
          [
            0.5553414839572376,
            0.8644200971099915
          ],
          [
            0.537971582233078,
            0.8717445338479888
          ],
          [
            0.5341116040721535,
            0.8607578787409929
          ]
        ],
        "dw_hand_2": [
          [
            0.26005315464652246,
            0.7875135113610235
          ],
          [
            0.30830288165807723,
            0.7362424541950454
          ],
          [
            0.356552608669632,
            0.6593358684460775
          ],
          [
            0.39515239027887583,
            0.6263759031250913
          ],
          [
            0.4163822701639599,
            0.6080648112800994
          ],
          [
            0.3526926305087077,
            0.5897537194351065
          ],
          [
            0.397082379359338,
            0.6227136847560927
          ],
          [
            0.4163822701639599,
            0.6849713970290668
          ],
          [
            0.42410222648580875,
            0.7289180174570481
          ],
          [
            0.3430426851063967,
            0.6153892480180958
          ],
          [
            0.3932224011984137,
            0.6556736500770789
          ],
          [
            0.41445228108349774,
            0.7252557990880499
          ],
          [
            0.42024224832488427,
            0.7692024195160316
          ],
          [
            0.33725271786501015,
            0.6520114317080806
          ],
          [
            0.38357245579610266,
            0.688633615398065
          ],
          [
            0.4028723466007245,
            0.7508913276710392
          ],
          [
            0.41059230292257337,
            0.7948379480990204
          ],
          [
            0.3314627506236235,
            0.6959580521360619
          ],
          [
            0.3681325431524051,
            0.717931362350053
          ],
          [
            0.3855024448765648,
            0.7618779827780343
          ],
          [
            0.3932224011984137,
            0.7985001664680191
          ]
        ],
        "dw_face": [
          [
            0.6962306868309777,
            0.37002061729519875
          ],
          [
            0.6692108397045069,
            0.38466949077119256
          ],
          [
            0.6421909925780362,
            0.40298058261618497
          ],
          [
            0.6171011345320278,
            0.42129167446117716
          ],
          [
            0.5939412655664814,
            0.4505894214131649
          ],
          [
            0.5746413747618596,
            0.4835493867341511
          ],
          [
            0.5611314511986243,
            0.5311582255311312
          ],
          [
            0.5514815057963133,
            0.578767064328111
          ],
          [
            0.547621527635389,
            0.6300381214940896
          ],
          [
            0.5514815057963133,
            0.6813091786600681
          ],
          [
            0.568851407520473,
            0.7252557990880499
          ],
          [
            0.5920112764860194,
            0.7508913276710392
          ],
          [
            0.6171011345320278,
            0.7801890746230267
          ],
          [
            0.6441209816584985,
            0.7875135113610235
          ],
          [
            0.6730708178654313,
            0.7985001664680191
          ],
          [
            0.6981606759114397,
            0.7948379480990204
          ],
          [
            0.7271105121183727,
            0.7875135113610235
          ],
          [
            0.7213205448769862,
            0.4176294560921787
          ],
          [
            0.7309704902792971,
            0.44692720304416644
          ],
          [
            0.7348304684402215,
            0.4835493867341511
          ],
          [
            0.7348304684402215,
            0.5201715704241356
          ],
          [
            0.7309704902792971,
            0.5531315357451221
          ],
          [
            0.7348304684402215,
            0.6520114317080806
          ],
          [
            0.7406204356816078,
            0.6813091786600681
          ],
          [
            0.7464104029229945,
            0.7106069256120557
          ],
          [
            0.7483403920034568,
            0.7435668909330418
          ],
          [
            0.7444804138425325,
            0.7728646378850302
          ],
          [
            0.7020206540723641,
            0.6153892480180958
          ],
          [
            0.6865807414286667,
            0.6190514663870944
          ],
          [
            0.6711408287849691,
            0.6263759031250913
          ],
          [
            0.6537709270608093,
            0.6300381214940896
          ],
          [
            0.6364010253366496,
            0.5897537194351065
          ],
          [
            0.6344710362561875,
            0.6117270296490972
          ],
          [
            0.6344710362561875,
            0.6337003398630883
          ],
          [
            0.6364010253366496,
            0.6556736500770789
          ],
          [
            0.6402610034975742,
            0.6776469602910695
          ],
          [
            0.6943006977505154,
            0.46523829488915885
          ],
          [
            0.7039506431528264,
            0.49453604184114663
          ],
          [
            0.7058806322332885,
            0.5274960071621327
          ],
          [
            0.6962306868309777,
            0.560455972483119
          ],
          [
            0.6885107305091287,
            0.5311582255311312
          ],
          [
            0.6885107305091287,
            0.49819826021014507
          ],
          [
            0.7020206540723641,
            0.6629980868150758
          ],
          [
            0.7136005885551374,
            0.6813091786600681
          ],
          [
            0.7174605667160617,
            0.7106069256120557
          ],
          [
            0.7136005885551374,
            0.7399046725640441
          ],
          [
            0.7039506431528264,
            0.717931362350053
          ],
          [
            0.700090664991902,
            0.6922958337670637
          ],
          [
            0.6035912109687924,
            0.5641181908521172
          ],
          [
            0.6093811782101791,
            0.5934159378041052
          ],
          [
            0.6132411563711034,
            0.6263759031250913
          ],
          [
            0.6132411563711034,
            0.6410247766010855
          ],
          [
            0.6151711454515655,
            0.6556736500770789
          ],
          [
            0.6151711454515655,
            0.6849713970290668
          ],
          [
            0.6132411563711034,
            0.7069447072430579
          ],
          [
            0.6016612218883302,
            0.6922958337670637
          ],
          [
            0.5920112764860194,
            0.6739847419220717
          ],
          [
            0.588151298325095,
            0.648349213339082
          ],
          [
            0.588151298325095,
            0.6190514663870944
          ],
          [
            0.5939412655664814,
            0.5897537194351065
          ],
          [
            0.6035912109687924,
            0.5714426275901145
          ],
          [
            0.6035912109687924,
            0.6080648112800994
          ],
          [
            0.6055212000492547,
            0.6446869949700833
          ],
          [
            0.6074511891297167,
            0.6739847419220717
          ],
          [
            0.6113111672906412,
            0.6996202705050606
          ],
          [
            0.6055212000492547,
            0.6739847419220717
          ],
          [
            0.6016612218883302,
            0.6446869949700833
          ],
          [
            0.6016612218883302,
            0.6080648112800994
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "003117",
  "objects": [
    {
      "box": [
        0.4661550521850586,
        0.2017558515071869,
        0.6122111082077026,
        0.8530317544937134
      ],
      "name": "wine glass",
      "possible_names": [
        "wine glass"
      ]
    }
  ],
  "mask_file": "./person_labeling/./003117.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A person is leaning on a white table with a glass of water nearby in a room with green curtains and soft lighting creating a calm and minimalist atmosphere",
  "overall_past": "Before the current scene, the individual likely finished a long day—perhaps working, attending meetings, or engaging in mentally demanding tasks—before retreating to this quiet, softly lit room. They may have poured a glass of wine as a deliberate act of self-care, seeking a moment to pause and decompress. The placement of the glass and the relaxed posture suggest they had just sat down, perhaps after walking through the space, removing their shoes or outer layers, and choosing this serene corner to unwind. The green curtains and minimalist setting imply a personal sanctuary, possibly a private living area or a quiet study, where they regularly go to reflect. The calm atmosphere and their still, contemplative stance indicate that this moment is part of a routine or intentional practice of mindfulness and rest.",
  "overall_past_clean": "The individual moved through a demanding day marked by intense focus and sustained effort, navigating a series of responsibilities that drained mental energy, before deliberately stepping into a space of quiet, shedding the weight of the day with each deliberate motion, and settling into stillness as a conscious act of restoration.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to slowly lift their head, take a quiet sip from the glass of water, and sit back for a moment longer, absorbing the stillness of the room. The soft lighting and green curtains suggest a space designed for calm, and the gentle posture implies a deliberate pause. Following this brief moment of reflection, they may reach for a book nearby, or simply close their eyes for a few seconds, allowing the tranquility to settle deeper—perhaps preparing to return to their day with renewed clarity and peace.",
  "overall_future_clean": "A quiet breath is drawn, the body shifts slightly into deeper stillness, then rises with purpose—eyes open, focused, moving forward with a calm certainty, as if the moment of pause has forged a clear path ahead.",
  "future_scene_ok": true
}