{
  "video_path": "./ref_datasets/part2/7463926001.mp4",
  "start_time": 0.0,
  "end_time": 2.966666666666667,
  "image_path": "./007653.jpg",
  "represents_multiple_types": true,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/7463926001.mp4",
      "start_time": 0.0,
      "end_time": 2.966666666666667,
      "image_path": "./ref_datasets/extracted_frames/person_7881236023668210718_1_7463926001.mp4_0.00_2.97.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/7463926001.mp4",
      "start_time": 0.0,
      "end_time": 2.966666666666667,
      "image_path": "./ref_datasets/extracted_frames/face_7881236023668210718_1_7463926001.mp4_0.00_2.97.jpg",
      "type": "face"
    }
  ],
  "cross_video_duplicate": false,
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "male",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a dark green t-shirt with a turquoise pocket featuring a geometric pattern. The shirt appears casual and comfortable, suitable for indoor activities such as moving or organizing.",
        "clothing": [
          {
            "possible_names": [
              "t-shirt",
              "shirt",
              "tee"
            ],
            "name": "t shirt",
            "type": "top",
            "color": [
              "dark green"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "cardboard box",
              "box"
            ],
            "name": "cardboard box",
            "position": "hand"
          },
          {
            "standalone": false,
            "possible_names": [
              "potted plant",
              "plant"
            ],
            "name": "potted plant",
            "position": "hand"
          }
        ],
        "description": "The individual is an adult male who appears to be engaged in moving or setting up a space. He is holding a cardboard box in one hand and a potted plant in the other, suggesting he might be in the process of unpacking or arranging items. His attire consists of a dark green t-shirt with a turquoise pocket that has a geometric design, indicating a casual and practical choice of clothing for the task at hand. His expression is neutral, focused on his activity.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a neutral expression, possibly indicating they are focused on the task at hand rather than expressing strong emotions.",
        "meaningful": true,
        "story": "The person seems to be involved in moving or organizing items, as indicated by the cardboard box and potted plant he is holding. This suggests a scenario of relocation or setting up a new space.",
        "race": "black",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is holding a potted plant in one hand and a cardboard box in the other, suggesting they might be in the process of moving into a new space. Their gaze is directed off to the side, indicating they could be looking for a suitable place to set down the items or perhaps engaging in conversation with someone out of frame. The individual appears focused on the task at hand, possibly motivated by the desire to settle into their new environment comfortably and efficiently. The casual attire and relaxed posture suggest a sense of ease despite the physical effort involved in carrying the items.",
        "intention": "The individual is motivated to efficiently and comfortably establish their new space by carefully transporting essential items while remaining attentive to their surroundings",
        "intention_ok": true
      },
      "hoi": [
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "left hand",
            "action": [
              [
                "left hand",
                "holding"
              ]
            ]
          },
          "object": 0
        },
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "right hand",
            "action": [
              [
                "right hand",
                "holding"
              ]
            ]
          },
          "object": 1
        }
      ],
      "facex_detailing": {
        "landmarks": [
          [
            0.38120346214799655,
            0.26001580783299033
          ],
          [
            0.38343203532553854,
            0.2822886443011975
          ],
          [
            0.3842826994756858,
            0.3041408705332922
          ],
          [
            0.38717106094672565,
            0.3274767812597688
          ],
          [
            0.3925367848504157,
            0.3471005752603844
          ],
          [
            0.4008256867527962,
            0.3621319152690746
          ],
          [
            0.41009317324275063,
            0.37321583051530144
          ],
          [
            0.4204593201123533,
            0.380247744302901
          ],
          [
            0.4302605533883685,
            0.3840394557468475
          ],
          [
            0.44062402830237435,
            0.381918961156613
          ],
          [
            0.44852740260816754,
            0.37055523937972135
          ],
          [
            0.45627292877151854,
            0.3541117579848678
          ],
          [
            0.4613166257029488,
            0.3376704543986649
          ],
          [
            0.4639507503736587,
            0.3150997293058526
          ],
          [
            0.4648199695206824,
            0.29360090487848517
          ],
          [
            0.4654863994036402,
            0.2717445010230654
          ],
          [
            0.4661649139154525,
            0.24869204046864993
          ],
          [
            0.392879480052562,
            0.23610853644275162
          ],
          [
            0.3976592977132116,
            0.21900851903138338
          ],
          [
            0.405299207284337,
            0.2170857862189964
          ],
          [
            0.41291884964420683,
            0.21659253350010624
          ],
          [
            0.41970566642426305,
            0.222220598326789
          ],
          [
            0.4329115658998489,
            0.22165229497132477
          ],
          [
            0.43981625061659585,
            0.2160796909735947
          ],
          [
            0.4469940335268066,
            0.2147339936917421
          ],
          [
            0.4542315186489196,
            0.2170482190197738
          ],
          [
            0.46014440769240966,
            0.23178457065864846
          ],
          [
            0.4270001097094445,
            0.24275679991989538
          ],
          [
            0.42777693686740736,
            0.2546072200492576
          ],
          [
            0.4281526733012427,
            0.26548687150238687
          ],
          [
            0.42890608818048526,
            0.27718969274450234
          ],
          [
            0.4186062941238994,
            0.28989075655659674
          ],
          [
            0.42382069882892426,
            0.2918790958545826
          ],
          [
            0.4284713163971901,
            0.29394694610878275
          ],
          [
            0.4338489672257787,
            0.2908699328306491
          ],
          [
            0.4382476459656443,
            0.28990639908603894
          ],
          [
            0.40104795470833776,
            0.24888220085668816
          ],
          [
            0.4043386460060165,
            0.2404719226574772
          ],
          [
            0.41251200047277264,
            0.24148762957759634
          ],
          [
            0.41653802025885805,
            0.2477559596773178
          ],
          [
            0.41162923680884494,
            0.24885317736832555
          ],
          [
            0.4051414402467864,
            0.24960149545518182
          ],
          [
            0.43789304636773607,
            0.2492653800066186
          ],
          [
            0.4428556924774533,
            0.2389302644780073
          ],
          [
            0.44923148318415596,
            0.23873005266542788
          ],
          [
            0.4535163537377403,
            0.2453059563561091
          ],
          [
            0.449443950965291,
            0.24671672614163193
          ],
          [
            0.4433368607645943,
            0.2501109456259107
          ],
          [
            0.41087866961246444,
            0.321727701469704
          ],
          [
            0.41671130085984864,
            0.30772881028513427
          ],
          [
            0.4245589110468115,
            0.3021155084882464
          ],
          [
            0.429198007214637,
            0.30384592404441235
          ],
          [
            0.4342546178471475,
            0.3021866641978107
          ],
          [
            0.44147600815409704,
            0.3082047871180943
          ],
          [
            0.4481753082502456,
            0.3241359390278973
          ],
          [
            0.4422005091394697,
            0.33463881911424104
          ],
          [
            0.4358020631330354,
            0.34128402528308693
          ],
          [
            0.429775811980168,
            0.34358797931166557
          ],
          [
            0.42338512050254,
            0.3411302803685425
          ],
          [
            0.41653336123341606,
            0.33541215058987733
          ],
          [
            0.41276754846885094,
            0.32156872143821114
          ],
          [
            0.4226241403392383,
            0.3139846284553488
          ],
          [
            0.4293927580827759,
            0.31478388423011416
          ],
          [
            0.43544311090594245,
            0.31517679022733497
          ],
          [
            0.445413091920671,
            0.322271818584866
          ],
          [
            0.43564505307447343,
            0.32650005502044843
          ],
          [
            0.43015893797079724,
            0.3272620786434759
          ],
          [
            0.42243904996485937,
            0.326215934753418
          ]
        ],
        "visibility": [
          0.9999998807907104,
          7.087138431671747e-09,
          0.15571428835391998,
          1.0351872137270846e-11,
          0.9999997615814209,
          0.9999955892562866,
          2.8436368211259833e-06,
          1.4822992009180802e-12,
          0.9887754917144775,
          4.409717382913847e-11,
          1.1093643479398452e-05,
          9.47060572326075e-13,
          0.00029882611124776304,
          0.0029279442969709635,
          3.193023970227138e-12,
          4.884106452607284e-09,
          2.773156495550211e-07,
          2.058911895141957e-11,
          6.285620166853823e-15,
          4.586614074653106e-11,
          6.847403757691923e-16,
          3.868090818650808e-21,
          4.503770156816245e-08,
          1.574335523057968e-10,
          2.3800454032497627e-21,
          4.818045287006041e-23,
          7.726606680857895e-12,
          5.903924051031684e-12,
          4.733831815428857e-08
        ],
        "headpose": {
          "pitch": 2.0433853461151874,
          "yaw": -3.960252110026467,
          "roll": -0.5924876410388121
        },
        "attributes": {
          "5 oClock Shadow": 0.08310195803642273,
          "Arched Eyebrows": 0.08060813695192337,
          "Attractive": 0.020565425977110863,
          "Bags Under Eyes": 0.07092085480690002,
          "Bald": 0.0005964851006865501,
          "Bangs": 0.00015626773529220372,
          "Big Lips": 0.8183721899986267,
          "Big Nose": 0.7560074925422668,
          "Black Hair": 0.9097373485565186,
          "Blond Hair": 1.2277760106371716e-05,
          "Blurry": 0.007983662188053131,
          "Brown Hair": 0.0011568078771233559,
          "Bushy Eyebrows": 0.6387026906013489,
          "Chubby": 0.3199508488178253,
          "Double Chin": 0.14055664837360382,
          "Eyeglasses": 0.00011799400817835703,
          "Goatee": 0.6891992688179016,
          "Gray Hair": 8.94909753696993e-05,
          "Heavy Makeup": 0.002712904941290617,
          "High Cheekbones": 0.6907831430435181,
          "Male": 0.9989476799964905,
          "Mouth Slightly Open": 0.9997106194496155,
          "Mustache": 0.24346233904361725,
          "Narrow Eyes": 0.08722291141748428,
          "No Beard": 0.04054858535528183,
          "Oval Face": 0.2958296835422516,
          "Pale Skin": 4.17043011111673e-05,
          "Pointy Nose": 0.0018820121185854077,
          "Receding Hairline": 0.19879470765590668,
          "Rosy Cheeks": 0.00017188249330502003,
          "Sideburns": 0.23302745819091797,
          "Smiling": 0.8737093806266785,
          "Straight Hair": 0.003844199702143669,
          "Wavy Hair": 0.08948741108179092,
          "Wearing Earrings": 0.012419654987752438,
          "Wearing Hat": 0.007504754234105349,
          "Wearing Lipstick": 0.004883558489382267,
          "Wearing Necklace": 0.010771404951810837,
          "Wearing Necktie": 0.008483088575303555,
          "Young": 0.8954126238822937
        },
        "age": [
          0.21152150630950928,
          0.9302456378936768,
          0.9695396423339844,
          0.5487164258956909,
          0.05086078122258186,
          0.0007958906935527921,
          0.0001006517923087813,
          1.4375167666003108e-05
        ],
        "race": [
          0.01549182552844286,
          0.9890249371528625,
          0.14984548091888428,
          0.27287644147872925,
          0.6132046580314636
        ],
        "gender": [
          0.9977673292160034,
          0.003866844577714801
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 1.4549340249676674,
          "disgust": 0.00014824275292041957,
          "fear": 2.854682909884106,
          "happy": 0.11660653173398593,
          "sad": 1.38353893804086,
          "surprise": 1.5550874182477692,
          "neutral": 92.63500063002103
        },
        "dominant_emotion": "neutral",
        "region": {
          "x": 0,
          "y": 0,
          "w": 253,
          "h": 331,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 28,
        "gender": {
          "Woman": 1.0164858773350716,
          "Man": 98.98350834846497
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 0.06463642348535359,
          "indian": 1.2571999803185463,
          "black": 97.8429913520813,
          "white": 0.03885916667059064,
          "middle eastern": 0.154690386261791,
          "latino hispanic": 0.6416234187781811
        },
        "dominant_race": "black"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.31570711731910706,
        0.10238440334796906,
        0.6803760528564453,
        0.9861791133880615
      ]
    ],
    "face_boxes": [
      [
        0.38114452362060547,
        0.16540302336215973,
        0.46950387954711914,
        0.3706391751766205
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.4380534631237388,
            0.47036722424182686
          ],
          [
            0.3559974515040716,
            0.4855461841446933
          ],
          [
            0.3381238648146391,
            0.7240726969040231
          ],
          [
            0.3397487363318602,
            0.9047746005095764
          ],
          [
            0.520109474743406,
            0.4551882643389604
          ],
          [
            0.643599710052212,
            0.6344445527156689
          ],
          [
            0.5331084468811751,
            0.8671886045596211
          ],
          [
            0.36980885940045116,
            0.9568167487479756
          ],
          [
            0.26500464653968814,
            1.0970414259458847
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.48354986560593044,
            0.9640448248921977
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.40799334005514787,
            0.2484652866142076
          ],
          [
            0.44699025646845497,
            0.24701967138536313
          ],
          [
            0.379558088503778,
            0.2773775911910961
          ],
          [
            0.46973845770955086,
            0.27304074550456287
          ]
        ],
        "dw_hand_1": [
          [
            0.5298587038467328,
            0.8787535263903766
          ],
          [
            0.5038607595711947,
            0.8628517588730878
          ],
          [
            0.47786281529565655,
            0.8455043761269547
          ],
          [
            0.45430217829595004,
            0.8512868370423325
          ],
          [
            0.4323664128134648,
            0.8541780675000213
          ],
          [
            0.46405140739927686,
            0.9221219832557094
          ],
          [
            0.44049077039957046,
            0.9409149812306867
          ],
          [
            0.42586692674458027,
            0.938023750772998
          ],
          [
            0.415305261882643,
            0.930795674628776
          ],
          [
            0.46973845770955086,
            0.9582623639768199
          ],
          [
            0.44292807767540215,
            0.9770553619517974
          ],
          [
            0.42911666977902246,
            0.9683816705787309
          ],
          [
            0.41936744067569576,
            0.9539255182902866
          ],
          [
            0.4794876868128777,
            0.978500977180642
          ],
          [
            0.45511461405456066,
            0.9915115142402418
          ],
          [
            0.44292807767540215,
            0.9813922076383307
          ],
          [
            0.4356161558479071,
            0.9698272858075754
          ],
          [
            0.48923691591620444,
            0.9886202837825527
          ],
          [
            0.4738006365026038,
            0.9972939751556193
          ],
          [
            0.46567627891649793,
            0.9900658990113973
          ],
          [
            0.45998922860622404,
            0.9799465924094862
          ]
        ],
        "dw_hand_2": [
          [
            0.3381238648146391,
            0.9018833700518873
          ],
          [
            0.3446233508835236,
            0.9120026766537984
          ],
          [
            0.3535601442282399,
            0.9235675984845537
          ],
          [
            0.3535601442282399,
            0.9351325203153092
          ],
          [
            0.3397487363318602,
            0.9264588289422426
          ],
          [
            0.336498993297418,
            0.9365781355441535
          ],
          [
            0.3381238648146391,
            0.9510342878325978
          ],
          [
            0.3397487363318602,
            0.9597079792056644
          ],
          [
            0.3438109151249131,
            0.9568167487479756
          ],
          [
            0.3332492502629757,
            0.9524799030614424
          ],
          [
            0.3340616860215863,
            0.9640448248921977
          ],
          [
            0.336498993297418,
            0.9683816705787309
          ],
          [
            0.3421860436076919,
            0.9640448248921977
          ],
          [
            0.330811942987144,
            0.9654904401210421
          ],
          [
            0.3324368145043651,
            0.9698272858075754
          ],
          [
            0.3356865575388074,
            0.9741641314941086
          ],
          [
            0.3397487363318602,
            0.9770553619517974
          ],
          [
            0.3259373284354806,
            0.9741641314941086
          ],
          [
            0.3316243787457546,
            0.9741641314941086
          ],
          [
            0.3340616860215863,
            0.975609746722953
          ],
          [
            0.3373114290560285,
            0.975609746722953
          ]
        ],
        "dw_face": [
          [
            0.38199539577960967,
            0.25713897798727414
          ],
          [
            0.3828078315382203,
            0.2788232064199405
          ],
          [
            0.38443270305544136,
            0.297616204394918
          ],
          [
            0.3868700103312731,
            0.31640920236989556
          ],
          [
            0.39093218912432587,
            0.3352022003448731
          ],
          [
            0.3974316751932105,
            0.3496583526333173
          ],
          [
            0.4063684685379267,
            0.362668889692917
          ],
          [
            0.41611769764125345,
            0.37134258106598356
          ],
          [
            0.4266793625031909,
            0.3756794267525168
          ],
          [
            0.4380534631237388,
            0.37278819629482823
          ],
          [
            0.44699025646845497,
            0.3612232744640727
          ],
          [
            0.45430217829595004,
            0.3482127374044729
          ],
          [
            0.45998922860622404,
            0.33086535465833977
          ],
          [
            0.46405140739927686,
            0.3135179719122067
          ],
          [
            0.46648871467510866,
            0.29472497393722924
          ],
          [
            0.46730115043371917,
            0.27448636073340726
          ],
          [
            0.4681135861923298,
            0.2542477475295854
          ],
          [
            0.3917446248829365,
            0.23979159524114108
          ],
          [
            0.398244110951821,
            0.232563519096919
          ],
          [
            0.40555603277931607,
            0.22967228863923003
          ],
          [
            0.4120555188482007,
            0.22967228863923003
          ],
          [
            0.41936744067569576,
            0.232563519096919
          ],
          [
            0.43642859160651754,
            0.23111790386807451
          ],
          [
            0.44292807767540215,
            0.22967228863923003
          ],
          [
            0.44942756374428666,
            0.22967228863923003
          ],
          [
            0.4559270498131713,
            0.23111790386807451
          ],
          [
            0.46161410012344517,
            0.23834598001229657
          ],
          [
            0.42830423402041196,
            0.2484652866142076
          ],
          [
            0.42911666977902246,
            0.26003020844496294
          ],
          [
            0.42911666977902246,
            0.27014951504687396
          ],
          [
            0.4299291055376332,
            0.2802688216487849
          ],
          [
            0.42017987643430627,
            0.29327935870838473
          ],
          [
            0.42505449098596965,
            0.29327935870838473
          ],
          [
            0.42911666977902246,
            0.29472497393722924
          ],
          [
            0.43399128433068596,
            0.29327935870838473
          ],
          [
            0.4380534631237388,
            0.29183374347954033
          ],
          [
            0.39986898246904207,
            0.2528021323007409
          ],
          [
            0.40474359702070556,
            0.24557405615651884
          ],
          [
            0.41124308308959007,
            0.24557405615651884
          ],
          [
            0.41693013339986407,
            0.2528021323007409
          ],
          [
            0.41124308308959007,
            0.2542477475295854
          ],
          [
            0.40555603277931607,
            0.2556933627584297
          ],
          [
            0.4380534631237388,
            0.2513565170718964
          ],
          [
            0.44292807767540215,
            0.24557405615651884
          ],
          [
            0.44942756374428666,
            0.24557405615651884
          ],
          [
            0.45430217829595004,
            0.2513565170718964
          ],
          [
            0.44942756374428666,
            0.2542477475295854
          ],
          [
            0.44374051343401266,
            0.2542477475295854
          ],
          [
            0.40799334005514787,
            0.31785481759873996
          ],
          [
            0.41611769764125345,
            0.30918112622567345
          ],
          [
            0.42586692674458027,
            0.30773551099682905
          ],
          [
            0.4299291055376332,
            0.30773551099682905
          ],
          [
            0.4331788485720754,
            0.30773551099682905
          ],
          [
            0.44211564191679154,
            0.30918112622567345
          ],
          [
            0.44861512798567615,
            0.31785481759873996
          ],
          [
            0.44374051343401266,
            0.32941973942949543
          ],
          [
            0.4380534631237388,
            0.3366478155737175
          ],
          [
            0.4299291055376332,
            0.34098466126025073
          ],
          [
            0.4209923121929169,
            0.33809343080256193
          ],
          [
            0.41368039036542176,
            0.32941973942949543
          ],
          [
            0.409618211572369,
            0.31785481759873996
          ],
          [
            0.41936744067569576,
            0.3135179719122067
          ],
          [
            0.4299291055376332,
            0.3120723566833623
          ],
          [
            0.4388658988823494,
            0.3135179719122067
          ],
          [
            0.44699025646845497,
            0.31785481759873996
          ],
          [
            0.43967833464095984,
            0.3279741242006509
          ],
          [
            0.42911666977902246,
            0.33086535465833977
          ],
          [
            0.4185550049170852,
            0.3279741242006509
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "007653",
  "objects": [
    {
      "box": [
        0.367145299911499,
        0.6317564249038696,
        0.6189879775047302,
        0.9716509580612183
      ],
      "name": "cardboard box",
      "possible_names": [
        "cardboard box"
      ]
    },
    {
      "box": [
        0.1264125257730484,
        0.2357586920261383,
        0.40604162216186523,
        0.8778790235519409
      ],
      "name": "potted plant",
      "possible_names": [
        "potted plant"
      ]
    }
  ],
  "mask_file": "./person_labeling/./007653.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A person is holding a potted plant and a cardboard box in a bright room with large arched windows and light wooden flooring suggesting a modern and minimalistic living space with an emphasis on natural light and simplicity",
  "overall_past": "Before this scene, the individual likely arrived at the new living space, possibly after transporting belongings from a previous home or storage. They may have just entered through the front door, carrying the potted plant—perhaps a cherished item from their old home—and the cardboard box, which could contain essential or sentimental belongings. The act of holding both items while scanning the room suggests they were assessing the space for the best spot to place them, indicating a moment of transition and intentionality as they begin to establish a sense of home in the new environment.",
  "overall_past_clean": "The individual had just stepped through the threshold, setting down a heavy load of belongings, their hands still gripping the remnants of a life uprooted, as they paused to absorb the silence and emptiness of the unfamiliar space, the weight of transition pressing into the stillness.",
  "past_scene_ok": false,
  "overall_future": "After the current scene, the individual is likely to place the potted plant on a sunny windowsill to ensure it receives ample natural light, then carefully set the cardboard box down nearby—possibly near a wall or in a corner—before beginning to unpack its contents. This sequence reflects a natural progression in settling into a new space: prioritizing the care of a living element like the plant while organizing belongings in a thoughtful, orderly manner, consistent with the room’s minimalist and light-filled aesthetic.",
  "overall_future_clean": "The individual moves with purpose, positioning the plant where sunlight streams in most generously, then aligns the box precisely against the wall, its edges flush and its presence deliberate, before reaching inside to extract each item with focused precision, arranging them in quiet symmetry.",
  "future_scene_ok": true
}