{
  "video_path": "./ref_datasets/part2/6647100000.mp4",
  "start_time": 0.0,
  "end_time": 6.005999999999999,
  "image_path": "./005450.jpg",
  "represents_multiple_types": true,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/6647100000.mp4",
      "start_time": 0.0,
      "end_time": 6.005999999999999,
      "image_path": "./ref_datasets/extracted_frames/person_-4957250815499105439_1_6647100000.mp4_0.00_6.01.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/6647100001.mp4",
      "start_time": 0.0,
      "end_time": 4.004,
      "image_path": "./ref_datasets/extracted_frames/face_4850831338188666176_1_6647100001.mp4_0.00_4.00.jpg",
      "type": "face"
    }
  ],
  "cross_video_duplicate": true,
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a light pink sweater over a dark red long-sleeve shirt, paired with gray jeans. The sweater appears to be loose-fitting, and the sleeves of the red shirt are visible underneath. The person also wears a silver watch on their left wrist.",
        "clothing": {
          "vague": false,
          "clothing": [
            {
              "possible_names": [
                "earrings",
                "ear studs"
              ],
              "name": "earrings",
              "type": "accessory",
              "color": [
                "silver"
              ],
              "belonging_confident": true,
              "existence_confident": true
            }
          ]
        },
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "acoustic guitar",
              "classical guitar"
            ],
            "name": "acoustic guitar",
            "position": "body"
          }
        ],
        "description": "A female adult is seated and playing an acoustic guitar. She is dressed in a light pink sweater over a dark red long-sleeve shirt and gray jeans. Her expression is neutral as she focuses on playing the guitar. A silver watch is visible on her left wrist.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to be focused and calm while playing the guitar, suggesting a neutral emotional state.",
        "meaningful": true,
        "story": "A young adult woman is engaged in playing an acoustic guitar, possibly practicing or performing music. Her concentration suggests she is deeply involved in her activity, enjoying a moment of personal expression through music.",
        "race": "asian",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is playing an acoustic guitar, focusing intently on the strings as they strum and press down with their fingers. They appear to be deeply engaged in the music, possibly practicing or performing a piece they enjoy. Their expression suggests concentration and enjoyment, indicating a passion for playing the instrument. The casual attire and relaxed posture suggest a comfortable setting, perhaps at home or during a casual gathering where they feel at ease expressing themselves through music.",
        "intention": "The individual is expressing personal passion and finding emotional fulfillment through immersive musical practice in a relaxed and comfortable environment",
        "intention_ok": true
      },
      "hoi": [
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "both hands",
            "action": [
              [
                "both hands",
                "playing"
              ],
              [
                "both hands",
                "holding"
              ]
            ]
          },
          "object": 0
        }
      ],
      "facex_detailing": {
        "landmarks": [
          [
            0.3470418446278446,
            0.24915102592536384
          ],
          [
            0.3758239602443402,
            0.265830548178582
          ],
          [
            0.4057556553177102,
            0.27772906564530875
          ],
          [
            0.43430095367015353,
            0.2914947305406843
          ],
          [
            0.4606919210581552,
            0.2987759287868227
          ],
          [
            0.49940761300937203,
            0.3105702100055558
          ],
          [
            0.533228878590165,
            0.30945199273881463
          ],
          [
            0.5764641348016326,
            0.30964625399737133
          ],
          [
            0.6075674109358006,
            0.30283784085796
          ],
          [
            0.636649600601701,
            0.2860792852583386
          ],
          [
            0.6643294619504737,
            0.2648892023733684
          ],
          [
            0.6910015976618207,
            0.23892789646273568
          ],
          [
            0.7047680621109311,
            0.21120103398958842
          ],
          [
            0.6983044604775767,
            0.1818839278959093
          ],
          [
            0.6805041367414768,
            0.1535397891487394
          ],
          [
            0.6461956530336349,
            0.12702934092708998
          ],
          [
            0.6095551036653064,
            0.1002101622876667
          ],
          [
            0.33241452611785716,
            0.20516408802497957
          ],
          [
            0.33427395732314497,
            0.19627268275334722
          ],
          [
            0.3477910383747368,
            0.18848139746558096
          ],
          [
            0.371527142657174,
            0.18656446969225293
          ],
          [
            0.39217796984803743,
            0.18421742128474372
          ],
          [
            0.43824383241158943,
            0.16961212449130555
          ],
          [
            0.4494823560512886,
            0.14490276092574708
          ],
          [
            0.4727327640567507,
            0.12750970843647208
          ],
          [
            0.49885828600674076,
            0.11132501101210004
          ],
          [
            0.5440378404798962,
            0.10771194744322982
          ],
          [
            0.43991896322479956,
            0.197476526314304
          ],
          [
            0.450628874415443,
            0.2113703486820062
          ],
          [
            0.466059164505787,
            0.22454698547011331
          ],
          [
            0.47859950478745517,
            0.24079309574195318
          ],
          [
            0.4918268690664301,
            0.2571857683715366
          ],
          [
            0.5041994753811094,
            0.2562748547111239
          ],
          [
            0.5123059619986822,
            0.2512361610219592
          ],
          [
            0.5132651623594697,
            0.2434013192142759
          ],
          [
            0.5187742248414055,
            0.23532529650699524
          ],
          [
            0.37663956752845223,
            0.22432048746517724
          ],
          [
            0.38884628348880346,
            0.21732786141690755
          ],
          [
            0.4056192975510996,
            0.2118987790885426
          ],
          [
            0.4280133126904725,
            0.21473425931873774
          ],
          [
            0.4091944799221382,
            0.21770695078940616
          ],
          [
            0.39638646795320764,
            0.22222708811362585
          ],
          [
            0.48921845282511733,
            0.1817370579356239
          ],
          [
            0.4928036359252122,
            0.16936274085726055
          ],
          [
            0.5071320543844233,
            0.16186883545347625
          ],
          [
            0.5300276017378247,
            0.15223596450828372
          ],
          [
            0.5223867664576838,
            0.16391434108927136
          ],
          [
            0.5127983109345512,
            0.17417842270362946
          ],
          [
            0.5050342318872926,
            0.27439371077787306
          ],
          [
            0.5092197891896364,
            0.2695470841158005
          ],
          [
            0.5164179487203163,
            0.26328681870585396
          ],
          [
            0.531730647629531,
            0.25852699748107366
          ],
          [
            0.5433254059345003,
            0.2525639376470021
          ],
          [
            0.5645394394006679,
            0.2459882976043792
          ],
          [
            0.587344475807967,
            0.23755621470156169
          ],
          [
            0.5746068167938757,
            0.25358185597828453
          ],
          [
            0.5597066001286582,
            0.2681277444674855
          ],
          [
            0.5482313287951959,
            0.27462695553189237
          ],
          [
            0.5413003887448993,
            0.27634120399043677
          ],
          [
            0.5289438705595713,
            0.2814211779407092
          ],
          [
            0.5143489631080123,
            0.2752504043635868
          ],
          [
            0.5299452479081178,
            0.268098050568785
          ],
          [
            0.5443157042145098,
            0.267565549555279
          ],
          [
            0.5443205045644568,
            0.2609898274853116
          ],
          [
            0.5791490261832242,
            0.24104457107328234
          ],
          [
            0.5407994826634724,
            0.25893836461362385
          ],
          [
            0.5387563424135643,
            0.26281356194189615
          ],
          [
            0.5301635072975562,
            0.26608220807143623
          ]
        ],
        "visibility": [
          1.0,
          0.00033370795426890254,
          3.5625248528958764e-07,
          2.2122166945526267e-11,
          0.9987727999687195,
          0.9999836683273315,
          0.341109961271286,
          0.01234874315559864,
          0.9930837154388428,
          0.30272403359413147,
          4.615687935078392e-15,
          2.1194129757413568e-14,
          0.9998144507408142,
          5.1122498595512766e-11,
          0.9519619941711426,
          4.971230133272997e-13,
          4.4690882106124263e-08,
          3.2644774705659074e-07,
          3.8586579135906074e-14,
          5.232231092833217e-09,
          7.022455282013499e-28,
          9.103859752775908e-22,
          6.138187874649148e-11,
          0.6351332664489746,
          1.3313125775404888e-11,
          2.523706883663518e-13,
          8.841430192141342e-12,
          6.945342196328086e-13,
          0.0007679108530282974
        ],
        "headpose": {
          "pitch": -18.02202615342163,
          "yaw": 7.125774144081515,
          "roll": -37.01952967882073
        },
        "attributes": {
          "5 oClock Shadow": 0.00010223373828921467,
          "Arched Eyebrows": 0.08523905277252197,
          "Attractive": 0.29776763916015625,
          "Bags Under Eyes": 0.056035690009593964,
          "Bald": 3.75192257706658e-07,
          "Bangs": 0.0006879157153889537,
          "Big Lips": 0.18750496208667755,
          "Big Nose": 0.09500470757484436,
          "Black Hair": 0.11554719507694244,
          "Blond Hair": 0.0010492777219042182,
          "Blurry": 0.0001083406968973577,
          "Brown Hair": 0.5188616514205933,
          "Bushy Eyebrows": 0.004394695162773132,
          "Chubby": 0.030922863632440567,
          "Double Chin": 0.005125819705426693,
          "Eyeglasses": 0.002427096478641033,
          "Goatee": 1.3390660569712054e-05,
          "Gray Hair": 2.3487569706048816e-05,
          "Heavy Makeup": 0.19737817347049713,
          "High Cheekbones": 0.3904406726360321,
          "Male": 0.0012958976440131664,
          "Mouth Slightly Open": 0.037968624383211136,
          "Mustache": 3.0475575840682723e-06,
          "Narrow Eyes": 0.6421070098876953,
          "No Beard": 0.9998003840446472,
          "Oval Face": 0.2738417983055115,
          "Pale Skin": 0.0012468131026253104,
          "Pointy Nose": 0.0455019548535347,
          "Receding Hairline": 0.01816294714808464,
          "Rosy Cheeks": 0.010544009506702423,
          "Sideburns": 2.7303578917781124e-06,
          "Smiling": 0.07791050523519516,
          "Straight Hair": 0.29760947823524475,
          "Wavy Hair": 0.41925135254859924,
          "Wearing Earrings": 0.017203541472554207,
          "Wearing Hat": 0.0001417216844856739,
          "Wearing Lipstick": 0.7667413949966431,
          "Wearing Necklace": 0.03081386163830757,
          "Wearing Necktie": 0.00025587441632524133,
          "Young": 0.9899328947067261
        },
        "age": [
          0.02645244635641575,
          0.5372288823127747,
          0.9223994612693787,
          0.8401455283164978,
          0.6013657450675964,
          0.03105909749865532,
          0.00041674988460727036,
          5.897908067709068e-06
        ],
        "race": [
          0.7776790857315063,
          0.007554302457720041,
          0.997611403465271,
          0.03505450859665871,
          0.2749731242656708
        ],
        "gender": [
          0.00087808130774647,
          0.9993020296096802
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 3.791838850847991e-07,
          "disgust": 2.4142268077764466e-12,
          "fear": 0.0001245678198095932,
          "happy": 0.857177199533844,
          "sad": 0.013173619051206148,
          "surprise": 1.328595170165614e-07,
          "neutral": 99.12952174300214
        },
        "dominant_emotion": "neutral",
        "region": {
          "x": 0,
          "y": 0,
          "w": 1102,
          "h": 1155,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 27,
        "gender": {
          "Woman": 99.86069798469543,
          "Man": 0.13930053682997823
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 99.51744076713567,
          "indian": 0.029077635832101753,
          "black": 0.0008801695527679766,
          "white": 0.32781641555973384,
          "middle eastern": 0.006188980119623921,
          "latino hispanic": 0.11860400679582397
        },
        "dominant_race": "asian"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.014312581159174442,
        0.013253211975097656,
        0.9990454912185669,
        0.9989622235298157
      ]
    ],
    "face_boxes": [
      [
        0.3369361162185669,
        0.09608161449432373,
        0.6773291230201721,
        0.2967830002307892
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.6372921660504925,
            0.3615638976320624
          ],
          [
            0.40948953341652916,
            0.35838315031429124
          ],
          [
            0.1802719775985038,
            0.4426729542352259
          ],
          [
            0.1321645893403996,
            0.5508183630394438
          ],
          [
            0.8650947986844559,
            0.3647446449498336
          ],
          [
            0.9499901897281691,
            0.690771245021373
          ],
          [
            0.7943486394813618,
            0.690771245021373
          ],
          [
            0.2962956786915785,
            0.690771245021373
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.2906359859553308,
            0.7798321699189642
          ],
          [
            0.5057043099327374,
            0.7702899279656508
          ],
          [
            0.04443935192856288,
            0.9070620626298092
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.41797907252090044,
            0.20570727906127764
          ],
          [
            0.5255132345096039,
            0.16753831124802435
          ],
          [
            0.37836122336716776,
            0.22638213662679005
          ],
          [
            0.6556861674432971,
            0.12618859611699976
          ]
        ],
        "dw_hand_1": [
          [
            0.777369561272619,
            0.6987231133158007
          ],
          [
            0.7632203294320002,
            0.6637348928203187
          ],
          [
            0.7575606366957528,
            0.6239755513481796
          ],
          [
            0.7207726339101437,
            0.5858065835349262
          ],
          [
            0.6868144774926584,
            0.5587702313338718
          ],
          [
            0.6896443238607823,
            0.6223851776892939
          ],
          [
            0.6500264747070494,
            0.5746739679227271
          ],
          [
            0.6556861674432971,
            0.5587702313338718
          ],
          [
            0.6698353992839159,
            0.5508183630394438
          ],
          [
            0.644366781970802,
            0.6287466723248363
          ],
          [
            0.6104086255533168,
            0.5778547152404986
          ],
          [
            0.6245578573939354,
            0.5651317259694137
          ],
          [
            0.6415369356026783,
            0.5619509786516428
          ],
          [
            0.6104086255533168,
            0.6351081669603786
          ],
          [
            0.5849400082402028,
            0.5873969571938119
          ],
          [
            0.6019190864489457,
            0.5762643415816128
          ],
          [
            0.6160683182895644,
            0.5730835942638418
          ],
          [
            0.5877698546083266,
            0.644650408913692
          ],
          [
            0.5736206227677076,
            0.6096621884182095
          ],
          [
            0.5821101618720792,
            0.5953488254882395
          ],
          [
            0.596259393712698,
            0.5858065835349262
          ]
        ],
        "dw_hand_2": [
          [
            0.12084520386790466,
            0.5603606049927571
          ],
          [
            0.1632928993897612,
            0.5714932206049561
          ],
          [
            0.2029107485434941,
            0.5746739679227271
          ],
          [
            0.23969875132910298,
            0.5953488254882395
          ],
          [
            0.2821464468509595,
            0.6128429357359805
          ],
          [
            0.15480336028538988,
            0.6048910674415529
          ],
          [
            0.18593167033475128,
            0.6207948040304087
          ],
          [
            0.22837936585660804,
            0.6287466723248363
          ],
          [
            0.2651673686422169,
            0.6319274196426072
          ],
          [
            0.13782428207664726,
            0.6239755513481796
          ],
          [
            0.17461228486225636,
            0.644650408913692
          ],
          [
            0.23120921222473168,
            0.6510119035492339
          ],
          [
            0.2708270613784646,
            0.6510119035492339
          ],
          [
            0.13499443570852343,
            0.6382889142781496
          ],
          [
            0.16895259212600888,
            0.6589637718436621
          ],
          [
            0.2255495194884842,
            0.6637348928203187
          ],
          [
            0.26233752227409307,
            0.6637348928203187
          ],
          [
            0.1406541284447709,
            0.6478311562314629
          ],
          [
            0.1717824384941325,
            0.665325266479204
          ],
          [
            0.21423013401598906,
            0.6716867611147463
          ],
          [
            0.2481882904334743,
            0.6748675084325173
          ]
        ],
        "dw_face": [
          [
            0.36987168426279626,
            0.215249521014591
          ],
          [
            0.39251045520778655,
            0.23433400492121767
          ],
          [
            0.4151492261527766,
            0.2518281151689589
          ],
          [
            0.446277536202138,
            0.2661414780989289
          ],
          [
            0.4774058462514996,
            0.27886446737001347
          ],
          [
            0.5170236954052323,
            0.2868163356644411
          ],
          [
            0.5538116981908414,
            0.2931778302999835
          ],
          [
            0.5934295473445741,
            0.2915874566410978
          ],
          [
            0.6273877037620595,
            0.27886446737001347
          ],
          [
            0.6528563210751734,
            0.26137035712227225
          ],
          [
            0.6670055529157922,
            0.24069549955676006
          ],
          [
            0.681154784756411,
            0.21843026833236218
          ],
          [
            0.681154784756411,
            0.1961650371079644
          ],
          [
            0.6754950920201633,
            0.1738998058835665
          ],
          [
            0.6613458601795446,
            0.1532249483180543
          ],
          [
            0.644366781970802,
            0.13414046441142763
          ],
          [
            0.6245578573939354,
            0.11346560684591532
          ],
          [
            0.3585522987903013,
            0.20093615808462095
          ],
          [
            0.3670418378946726,
            0.1929842897901932
          ],
          [
            0.3840209161034152,
            0.18821316881353653
          ],
          [
            0.3981701479440342,
            0.18503242149576546
          ],
          [
            0.41797907252090044,
            0.18185167417799436
          ],
          [
            0.4632566144108806,
            0.16117681661248207
          ],
          [
            0.48023569261962346,
            0.1516345746591687
          ],
          [
            0.49721477082836585,
            0.14050195904696977
          ],
          [
            0.5198535417733562,
            0.13095971709365642
          ],
          [
            0.5453221590864701,
            0.12777896977588535
          ],
          [
            0.46608646077900445,
            0.1929842897901932
          ],
          [
            0.4774058462514996,
            0.20570727906127764
          ],
          [
            0.48872523172399457,
            0.21843026833236218
          ],
          [
            0.5000446171964898,
            0.2311532576034467
          ],
          [
            0.49438492446024224,
            0.24546662053341675
          ],
          [
            0.5085341563008612,
            0.24387624687453102
          ],
          [
            0.5198535417733562,
            0.24069549955676006
          ],
          [
            0.534002773613975,
            0.23433400492121767
          ],
          [
            0.5481520054545937,
            0.22797251028567553
          ],
          [
            0.4009999943121578,
            0.21843026833236218
          ],
          [
            0.4151492261527766,
            0.2136591473557055
          ],
          [
            0.4292984579933956,
            0.20888802637904882
          ],
          [
            0.4434476898340144,
            0.20252653174350665
          ],
          [
            0.43212830436151944,
            0.20888802637904882
          ],
          [
            0.41797907252090044,
            0.215249521014591
          ],
          [
            0.5028744635646135,
            0.17867092686022318
          ],
          [
            0.5198535417733562,
            0.1738998058835665
          ],
          [
            0.5368326199820987,
            0.16753831124802435
          ],
          [
            0.5538116981908414,
            0.15958644295359647
          ],
          [
            0.5396624663502226,
            0.16753831124802435
          ],
          [
            0.5226833881414797,
            0.1738998058835665
          ],
          [
            0.5113640026689849,
            0.26932222541670015
          ],
          [
            0.5198535417733562,
            0.2629607307811577
          ],
          [
            0.5311729272458513,
            0.2565992361456156
          ],
          [
            0.5396624663502226,
            0.2550088624867301
          ],
          [
            0.5481520054545937,
            0.25023774151007344
          ],
          [
            0.570790776399584,
            0.24387624687453102
          ],
          [
            0.5934295473445741,
            0.23910512589787436
          ],
          [
            0.5877698546083266,
            0.25023774151007344
          ],
          [
            0.5764504691358316,
            0.26137035712227225
          ],
          [
            0.5594713909270889,
            0.26932222541670015
          ],
          [
            0.5453221590864701,
            0.2725029727344711
          ],
          [
            0.5283430808777274,
            0.2725029727344711
          ],
          [
            0.5170236954052323,
            0.26932222541670015
          ],
          [
            0.5311729272458513,
            0.2645511044400434
          ],
          [
            0.5481520054545937,
            0.25977998346338677
          ],
          [
            0.5679609300314602,
            0.25023774151007344
          ],
          [
            0.5905997009764504,
            0.24069549955676006
          ],
          [
            0.570790776399584,
            0.2518281151689589
          ],
          [
            0.5481520054545937,
            0.26137035712227225
          ],
          [
            0.5311729272458513,
            0.2645511044400434
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "005450",
  "objects": [
    {
      "box": [
        0.032643675804138184,
        0.47605565190315247,
        0.9974890947341919,
        0.8342620134353638
      ],
      "name": "acoustic guitar",
      "possible_names": [
        "acoustic guitar"
      ]
    }
  ],
  "mask_file": "./person_labeling/./005450.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A person is playing an acoustic guitar while wearing a pink sweater and gray pants seated on a white surface with a soft textured object nearby in a softly lit indoor environment with neutral colors and minimalistic decor suggesting a calm and focused atmosphere for music practice or performance",
  "overall_past": "Before the current scene, the individual likely set up their space with intention—choosing a quiet, uncluttered corner of a room, placing the guitar on a soft, supportive surface, and adjusting the lighting to create a warm, inviting ambiance. They may have taken a few moments to tune the guitar, perhaps testing each string with gentle plucks to ensure clarity and harmony. This preparation suggests a routine or ritual, indicating that music is a meaningful and regular part of their life. The pink sweater and gray pants, chosen for comfort and personal style, imply a sense of self-expression even in private moments. The presence of the soft textured object nearby—perhaps a cushion or blanket—hints at a deliberate effort to enhance comfort, reinforcing that this is a space where they feel safe to focus and create. Thus, the scene likely follows a brief moment of stillness and mindfulness, where the individual paused to center themselves before beginning to play, fully immersed in the act of making music.",
  "overall_past_clean": "A deliberate pause was held as the individual took a deep breath, centering their focus inward, then reached for the instrument with purpose, their hands moving with quiet confidence to align the strings, setting the stage for a moment of intentional creation.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to pause briefly, gently lowering the guitar onto the soft textured object nearby, taking a slow breath as they reflect on the piece just played. Their expression may soften into a quiet smile, indicating satisfaction or emotional connection to the music. They might then reach for a nearby cup of tea or water, sipping slowly before deciding whether to continue practicing, improvise a new melody, or simply sit in the peaceful stillness, letting the lingering notes echo in the calm, minimalist space.",
  "overall_future_clean": "A deep, quiet breath is drawn, the instrument settles into place with deliberate care, and the silence that follows hums with unspoken resonance, before a hand lifts toward the cup, fingers curling around its warmth as the mind drifts into the next moment—whether to shape a new phrase or simply remain, suspended in stillness.",
  "future_scene_ok": true
}