{
  "video_path": "./ref_datasets/part2/5495030005.mp4",
  "start_time": 0.0,
  "end_time": 3.04,
  "image_path": "./016516.jpg",
  "represents_multiple_types": false,
  "cross_video_duplicate": false,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/5495030005.mp4",
      "start_time": 0.0,
      "end_time": 3.04,
      "image_path": "./ref_datasets/extracted_frames/face_6063844596149792635_1_5495030005.mp4_0.00_3.04.jpg",
      "type": "face"
    }
  ],
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a light beige short-sleeved shirt over a green apron-like garment. The shirt appears loose-fitting, and the apron covers the front of her torso.",
        "clothing": [
          {
            "possible_names": [
              "shirt",
              "t-shirt",
              "tee"
            ],
            "name": "shirt",
            "type": "top",
            "color": [
              "light beige"
            ]
          },
          {
            "possible_names": [
              "apron",
              "garment"
            ],
            "name": "apron",
            "type": "accessory",
            "color": [
              "green"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "pumpkin",
              "squash"
            ],
            "name": "pumpkin",
            "position": "hand"
          }
        ],
        "description": "The person is an adult female with red hair tied back in a braid. She is holding a pumpkin with both hands. She is dressed in a light beige short-sleeved shirt over a green apron. Her expression is neutral, and she appears to be looking slightly off-camera.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a calm and neutral expression, neither displaying strong emotions nor engaging directly with the camera.",
        "meaningful": true,
        "story": "The person seems to be engaged in an activity involving a large vegetable, possibly preparing for cooking or showcasing it. The setting suggests a casual, home-like environment.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is holding a large, textured object close to their chest with both hands, suggesting a sense of care or admiration for it. Their gaze is directed slightly upwards and away from the camera, indicating they might be lost in thought or observing something out of frame. The individual's calm and composed expression implies a serene moment, possibly reflecting on the object's significance or simply enjoying its presence. The way they are dressed in casual attire suggests a relaxed setting, perhaps at home or in a comfortable environment where they feel free to engage intimately with the object.",
        "intention": "The individual is deeply engaged with the object showing reverence and emotional connection likely seeking comfort or meaning through tactile and visual focus",
        "intention_ok": true
      },
      "hoi": [
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "both hands",
            "action": [
              [
                "both hands",
                "holding"
              ]
            ]
          },
          "object": 0
        }
      ],
      "facex_detailing": {
        "landmarks": [
          [
            0.47483591982927276,
            0.3225380383165819
          ],
          [
            0.4629932860218028,
            0.3366315942257643
          ],
          [
            0.4520922229088173,
            0.3567925482057035
          ],
          [
            0.4453544615437745,
            0.3782004779204726
          ],
          [
            0.4438961430832192,
            0.400770829724414
          ],
          [
            0.4495558569040248,
            0.42265449171619757
          ],
          [
            0.4659760562831132,
            0.44062984827905893
          ],
          [
            0.47912899583735796,
            0.4556227237252253
          ],
          [
            0.50886734181611,
            0.4661283293472869
          ],
          [
            0.5486033748697352,
            0.4695136830476778
          ],
          [
            0.5939987344085854,
            0.4693797486168998
          ],
          [
            0.6511907190242142,
            0.4707557673432997
          ],
          [
            0.7037360576094773,
            0.4646111641611372
          ],
          [
            0.747183523354707,
            0.4467300872451493
          ],
          [
            0.7727533974975505,
            0.4224100107593196
          ],
          [
            0.7925966329675502,
            0.3943425685699497
          ],
          [
            0.8095562392441684,
            0.36291558355359094
          ],
          [
            0.47477501551940965,
            0.2803312768228352
          ],
          [
            0.48764475382194317,
            0.26423037664166515
          ],
          [
            0.5045972701733704,
            0.2662385854470943
          ],
          [
            0.5304909400208287,
            0.26864792639389634
          ],
          [
            0.5509018915670889,
            0.27908218525616185
          ],
          [
            0.5978902949857964,
            0.28125465541545835
          ],
          [
            0.6377791066649099,
            0.2749442153809858
          ],
          [
            0.6750722815750768,
            0.27765516474443885
          ],
          [
            0.7130988343052133,
            0.29040223825722933
          ],
          [
            0.7388782064750712,
            0.3074134352750012
          ],
          [
            0.5549058131439977,
            0.30097668804228306
          ],
          [
            0.5429764666885296,
            0.31423125974833965
          ],
          [
            0.5298981313352231,
            0.3260005061248583
          ],
          [
            0.5173354070022623,
            0.33863861998543143
          ],
          [
            0.5083829197303328,
            0.3657502863290054
          ],
          [
            0.5151429360505766,
            0.37028499173798735
          ],
          [
            0.5245647561613215,
            0.3738614528306893
          ],
          [
            0.5426415056147903,
            0.37279635900631547
          ],
          [
            0.5607501344706015,
            0.3736962131889803
          ],
          [
            0.488797599234909,
            0.30392778431996703
          ],
          [
            0.5029404085464578,
            0.2971405256539583
          ],
          [
            0.5262309391031821,
            0.2991644098157329
          ],
          [
            0.5427830851897991,
            0.3116551434754261
          ],
          [
            0.5196488108584489,
            0.3094874282500574
          ],
          [
            0.5006391383983471,
            0.30789821102683035
          ],
          [
            0.6164604762874584,
            0.3188852935231158
          ],
          [
            0.6409367168391192,
            0.3103199057014925
          ],
          [
            0.6604270222325804,
            0.3117889300254839
          ],
          [
            0.6814050499093596,
            0.32297010027936524
          ],
          [
            0.6612535289986423,
            0.3227834520595414
          ],
          [
            0.6383824744552531,
            0.319194432481059
          ],
          [
            0.4872155859987572,
            0.3997114804972495
          ],
          [
            0.4977831700176159,
            0.3915254408493638
          ],
          [
            0.5127993368597887,
            0.38613564361418995
          ],
          [
            0.5247315293897397,
            0.3896529751696757
          ],
          [
            0.5401059058608201,
            0.38892039683248314
          ],
          [
            0.5648203072724519,
            0.39906615178499905
          ],
          [
            0.6013837587896479,
            0.41257953750235693
          ],
          [
            0.5603965812889987,
            0.4105475199009691
          ],
          [
            0.5313035195466703,
            0.40910035917269333
          ],
          [
            0.5175198461012867,
            0.40842222369142944
          ],
          [
            0.5063004857648618,
            0.406681644863316
          ],
          [
            0.49526892424260505,
            0.40376188792288303
          ],
          [
            0.4941915503254643,
            0.4003035949010934
          ],
          [
            0.5087234719089729,
            0.39634152914264376
          ],
          [
            0.5212861288792242,
            0.39755148919565336
          ],
          [
            0.5332783921055062,
            0.3995209646278194
          ],
          [
            0.5892892221294384,
            0.4100825829165322
          ],
          [
            0.5323329901569104,
            0.4010467523975032
          ],
          [
            0.5225696747895903,
            0.39860628824681044
          ],
          [
            0.5090530102845854,
            0.39646072100315777
          ]
        ],
        "visibility": [
          1.0,
          0.0008438407676294446,
          4.990042270947015e-06,
          1.711371116434185e-14,
          0.9999961853027344,
          0.9793013334274292,
          6.584336754208303e-14,
          9.533896978413519e-20,
          0.9957385063171387,
          2.4992933188929282e-15,
          2.945586459190963e-07,
          5.940060943121495e-11,
          9.589157592970743e-12,
          0.0038196942768990993,
          3.4476235885247397e-13,
          3.748368726519402e-09,
          3.0134905681933333e-09,
          3.891602209753209e-13,
          3.245777258076288e-11,
          3.902542012961495e-14,
          9.550597346395101e-14,
          6.114282935206286e-14,
          0.0015952641842886806,
          1.5099981811803054e-13,
          1.8164908223649509e-19,
          8.789405346547384e-20,
          3.2408377739247263e-13,
          1.7717145806006585e-10,
          5.772518418230624e-16
        ],
        "headpose": {
          "pitch": 10.944556814697739,
          "yaw": 20.494803934870955,
          "roll": 11.454784752302386
        },
        "attributes": {
          "5 oClock Shadow": 0.0005303452489897609,
          "Arched Eyebrows": 0.07626329362392426,
          "Attractive": 0.33787962794303894,
          "Bags Under Eyes": 0.13575883209705353,
          "Bald": 5.428300937637687e-07,
          "Bangs": 0.0006639329949393868,
          "Big Lips": 0.12928473949432373,
          "Big Nose": 0.030343087390065193,
          "Black Hair": 0.006593621335923672,
          "Blond Hair": 0.013051926158368587,
          "Blurry": 1.3322285667527467e-05,
          "Brown Hair": 0.7515427470207214,
          "Bushy Eyebrows": 0.04146420583128929,
          "Chubby": 0.030356910079717636,
          "Double Chin": 0.005866623017936945,
          "Eyeglasses": 0.0017097496893256903,
          "Goatee": 2.823857357725501e-05,
          "Gray Hair": 0.00032067959546111524,
          "Heavy Makeup": 0.19598762691020966,
          "High Cheekbones": 0.4385163486003876,
          "Male": 0.002907524351030588,
          "Mouth Slightly Open": 0.796058714389801,
          "Mustache": 2.035222678387072e-06,
          "Narrow Eyes": 0.06115990877151489,
          "No Beard": 0.9993403553962708,
          "Oval Face": 0.4198998510837555,
          "Pale Skin": 0.001817250275053084,
          "Pointy Nose": 0.08871569484472275,
          "Receding Hairline": 0.009749150834977627,
          "Rosy Cheeks": 0.01856263168156147,
          "Sideburns": 1.2057249477948062e-05,
          "Smiling": 0.1286023110151291,
          "Straight Hair": 0.2582874894142151,
          "Wavy Hair": 0.24372276663780212,
          "Wearing Earrings": 0.3045384883880615,
          "Wearing Hat": 7.618772360729054e-05,
          "Wearing Lipstick": 0.5139274597167969,
          "Wearing Necklace": 0.010844973847270012,
          "Wearing Necktie": 0.0008903717971406877,
          "Young": 0.9861961603164673
        },
        "age": [
          0.04761410504579544,
          0.9515330791473389,
          0.928636372089386,
          0.7481778860092163,
          0.17322112619876862,
          0.0017600985011085868,
          0.00010305376054020599,
          6.288525469244632e-07
        ],
        "race": [
          0.9705232381820679,
          0.0006717632641084492,
          0.8559099435806274,
          0.18022964894771576,
          0.7766608595848083
        ],
        "gender": [
          0.017381267622113228,
          0.9855028390884399
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 2.0856376737356186,
          "disgust": 1.5228430738645216e-07,
          "fear": 9.462989121675491,
          "happy": 26.28415822982788,
          "sad": 56.58308267593384,
          "surprise": 0.0010658629435056355,
          "neutral": 5.58306910097599
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 1067,
          "h": 1367,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 33,
        "gender": {
          "Woman": 99.98169541358948,
          "Man": 0.018306192941963673
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 32.89632201194763,
          "indian": 5.427892506122589,
          "black": 0.9594052098691463,
          "white": 22.40477353334427,
          "middle eastern": 6.084255874156952,
          "latino hispanic": 32.227352261543274
        },
        "dominant_race": "asian"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.021116556599736214,
        0.19653338193893433,
        0.995343029499054,
        0.9986507296562195
      ]
    ],
    "face_boxes": [
      [
        0.4454740285873413,
        0.23938657343387604,
        0.7751727104187012,
        0.462035208940506
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.6600795652927062,
            0.6023375095427035
          ],
          [
            0.4209962795328899,
            0.5919993030528226
          ],
          [
            0.14880915420632967,
            0.900853221938014
          ],
          [
            0.15371342673473612,
            0.6346444048235814
          ],
          [
            0.8991628510525225,
            0.6126757160325844
          ],
          [
            0.5362466839504423,
            0.9318678414076567
          ],
          [
            0.28367664873750814,
            0.6475671629359324
          ],
          [
            0.33271937402157314,
            0.9990661835918825
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.6931834048594498,
            1.005527562648058
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.5092731850442067,
            0.32062138269344975
          ],
          [
            0.6539492246321981,
            0.3270827617496252
          ],
          [
            0.452874050967532,
            0.35292827797432746
          ],
          [
            0.8010774004843927,
            0.3826506216327349
          ]
        ],
        "dw_hand_1": [
          [
            0.2763202399448984,
            0.6462748871246975
          ],
          [
            0.31555442017215024,
            0.6113834402213495
          ],
          [
            0.36459714545621524,
            0.5777842691292366
          ],
          [
            0.3523364641351989,
            0.5454773738483586
          ],
          [
            0.33271937402157314,
            0.5157550301899513
          ],
          [
            0.22482537839663017,
            0.5416005464146533
          ],
          [
            0.20520828828300425,
            0.5067090995113055
          ],
          [
            0.19294760696198807,
            0.476986755852898
          ],
          [
            0.18068692564097177,
            0.45243351543943083
          ],
          [
            0.17823478937676848,
            0.548061925470829
          ],
          [
            0.14880915420632967,
            0.5105859269450108
          ],
          [
            0.1340963366211101,
            0.476986755852898
          ],
          [
            0.12428779156429717,
            0.4485566880057255
          ],
          [
            0.1439048816779232,
            0.55840013196071
          ],
          [
            0.11447924650748416,
            0.5235086850573619
          ],
          [
            0.09486215639385824,
            0.4924940655877193
          ],
          [
            0.08014933880863877,
            0.46277172192931176
          ],
          [
            0.11938351903589062,
            0.571322890073061
          ],
          [
            0.09486215639385824,
            0.5467696496595941
          ],
          [
            0.0776972025444356,
            0.5260932366798321
          ],
          [
            0.06053224869501285,
            0.5028322720776002
          ]
        ],
        "dw_hand_2": [
          [
            0.17578265311256533,
            0.6333521290123463
          ],
          [
            0.19539974322619136,
            0.6036297853539389
          ],
          [
            0.20520828828300425,
            0.5751997175067664
          ],
          [
            0.28367664873750814,
            0.5519387529045343
          ],
          [
            0.32291082896476,
            0.5157550301899513
          ],
          [
            0.15861769926314256,
            0.5416005464146533
          ],
          [
            0.15371342673473612,
            0.5092936511337757
          ],
          [
            0.1561655629989393,
            0.48474041072030866
          ],
          [
            0.14880915420632967,
            0.45889489449560644
          ],
          [
            0.12919206409270373,
            0.5428928222258887
          ],
          [
            0.11693138277168745,
            0.5092936511337757
          ],
          [
            0.11202711024328088,
            0.48086358328660334
          ],
          [
            0.11938351903589062,
            0.45114123962819574
          ],
          [
            0.09731429265806142,
            0.5493542012820639
          ],
          [
            0.07279293001602904,
            0.5183395818124215
          ],
          [
            0.06788865748762248,
            0.49120178977648415
          ],
          [
            0.07524506628023221,
            0.4679408251742522
          ],
          [
            0.06298438495921613,
            0.5622769593944154
          ],
          [
            0.043367294845590106,
            0.5416005464146533
          ],
          [
            0.03355874978877709,
            0.5235086850573619
          ],
          [
            0.023750204731964073,
            0.5028322720776002
          ]
        ],
        "dw_face": [
          [
            0.46513473228854835,
            0.31932910688221455
          ],
          [
            0.45042191470332865,
            0.34388234729568173
          ],
          [
            0.44306550591071914,
            0.3658510360866785
          ],
          [
            0.44061336964651576,
            0.3891120006889105
          ],
          [
            0.44551764217492207,
            0.4110806894799074
          ],
          [
            0.4577783234959386,
            0.4343416540821394
          ],
          [
            0.4798475498737678,
            0.45243351543943083
          ],
          [
            0.5166295938368163,
            0.46277172192931176
          ],
          [
            0.5632201828566781,
            0.465356273551782
          ],
          [
            0.6073586356123365,
            0.46406399774054685
          ],
          [
            0.6490449521037914,
            0.4601871703068415
          ],
          [
            0.6907312685952467,
            0.45114123962819574
          ],
          [
            0.7275133125582954,
            0.4382184815158447
          ],
          [
            0.752034675200328,
            0.41883434434731803
          ],
          [
            0.7691996290497504,
            0.39815793136755623
          ],
          [
            0.7839124466349701,
            0.37618924257655945
          ],
          [
            0.793720991691783,
            0.3542205537855625
          ],
          [
            0.47494327734536124,
            0.2986526939024527
          ],
          [
            0.49210823119478386,
            0.29348359065751245
          ],
          [
            0.5092731850442067,
            0.29348359065751245
          ],
          [
            0.5264381388936291,
            0.29606814227998257
          ],
          [
            0.5436030927430521,
            0.2999449697136879
          ],
          [
            0.6098107718765396,
            0.3012372455249231
          ],
          [
            0.6367842707827752,
            0.2999449697136879
          ],
          [
            0.6662099059532142,
            0.2999449697136879
          ],
          [
            0.6980876773878565,
            0.3038217971473932
          ],
          [
            0.722609040029889,
            0.31286772782603905
          ],
          [
            0.5656723191208812,
            0.3244982101271551
          ],
          [
            0.5558637740640681,
            0.3348364166170359
          ],
          [
            0.5460552290072554,
            0.34388234729568173
          ],
          [
            0.5362466839504423,
            0.3542205537855625
          ],
          [
            0.5117253213084098,
            0.37231241514285407
          ],
          [
            0.5239860026294262,
            0.37489696676532425
          ],
          [
            0.5411509564788488,
            0.37489696676532425
          ],
          [
            0.5607680465924747,
            0.37618924257655945
          ],
          [
            0.5803851367061007,
            0.3774815183877945
          ],
          [
            0.48229968613797075,
            0.3219136585046847
          ],
          [
            0.4994646399873936,
            0.31545227944850923
          ],
          [
            0.5239860026294262,
            0.31803683107097935
          ],
          [
            0.5386988202146454,
            0.3270827617496252
          ],
          [
            0.5190817301010197,
            0.32966731337209537
          ],
          [
            0.4994646399873936,
            0.3283750375608604
          ],
          [
            0.6171671806691493,
            0.3309595891833305
          ],
          [
            0.6392364070469786,
            0.3232059343159199
          ],
          [
            0.6662099059532142,
            0.3244982101271551
          ],
          [
            0.6882791323310433,
            0.3335441408058007
          ],
          [
            0.6662099059532142,
            0.337420968239506
          ],
          [
            0.6392364070469786,
            0.33612869242827104
          ],
          [
            0.4847518224021741,
            0.4046193104237318
          ],
          [
            0.501916776251597,
            0.39686565555632114
          ],
          [
            0.5215338663652228,
            0.39169655231138073
          ],
          [
            0.5337945476862389,
            0.3929888281226158
          ],
          [
            0.5460552290072554,
            0.3929888281226158
          ],
          [
            0.5803851367061007,
            0.40074248299002646
          ],
          [
            0.612262908140743,
            0.4110806894799074
          ],
          [
            0.5852894092345072,
            0.4149575169136127
          ],
          [
            0.5583159103282715,
            0.4162497927248478
          ],
          [
            0.5288902751578326,
            0.4162497927248478
          ],
          [
            0.5117253213084098,
            0.4136652411023775
          ],
          [
            0.49701250372319045,
            0.4097884136686722
          ],
          [
            0.49210823119478386,
            0.4046193104237318
          ],
          [
            0.5117253213084098,
            0.40203475880126155
          ],
          [
            0.5337945476862389,
            0.40203475880126155
          ],
          [
            0.5681244553850846,
            0.4046193104237318
          ],
          [
            0.6049064993481331,
            0.4097884136686722
          ],
          [
            0.5681244553850846,
            0.40720386204620207
          ],
          [
            0.531342411422036,
            0.4046193104237318
          ],
          [
            0.5117253213084098,
            0.4046193104237318
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "016516",
  "objects": [
    {
      "box": [
        0.03180895745754242,
        0.29553884267807007,
        0.39482933282852173,
        0.5882766842842102
      ],
      "name": "pumpkin",
      "possible_names": [
        "pumpkin"
      ]
    }
  ],
  "mask_file": "./person_labeling/./016516.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A person is holding a large orange gourd against a plain light background wearing a green apron over a beige shirt with soft natural lighting highlighting the texture of the gourd and fabric.",
  "overall_past": "Before this scene, the individual likely discovered or recently acquired the large orange gourd, perhaps from a garden, market, or seasonal harvest. They may have carefully selected it for its unique shape, texture, or symbolic meaning—possibly representing abundance, tradition, or a personal connection to nature. After bringing it home, they paused to examine it closely, perhaps cleaning it or simply holding it in quiet appreciation, leading to the current moment of stillness and contemplation. The soft lighting and intimate posture suggest a deliberate, mindful act, indicating that this was not a fleeting interaction but a meaningful pause in their day.",
  "overall_past_clean": "The individual moved with purpose toward the object, their hands reaching out not in haste but with intention, having made a deliberate choice to bring it into their space, their fingers tracing its contours as if confirming its presence, their breath steady and focused, as though the act of acquiring it had already begun to shift their inner rhythm.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to gently lower the gourd, perhaps placing it on a nearby surface with deliberate care, as if acknowledging its presence before continuing with a quiet, intentional act—such as preparing it for cooking or displaying it as part of a seasonal decoration. The soft lighting and serene expression suggest a moment of mindful connection, indicating that the action following will be thoughtful and deliberate, rooted in appreciation rather than urgency.",
  "overall_future_clean": "The hands move with quiet precision, setting the vessel down with deliberate care before turning to gather tools, each motion a quiet affirmation of purpose, as the space settles into a rhythm of mindful intention.",
  "future_scene_ok": true
}