{
  "video_path": "./ref_datasets/part2/6646795000.mp4",
  "start_time": 0.0,
  "end_time": 2.48,
  "image_path": "./021314.jpg",
  "represents_multiple_types": false,
  "cross_video_duplicate": false,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/6646795000.mp4",
      "start_time": 0.0,
      "end_time": 2.48,
      "image_path": "./ref_datasets/extracted_frames/person_-8411317716657486472_1_6646795000.mp4_0.00_2.48.jpg",
      "type": "person"
    }
  ],
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a white knitted sweater with a loose texture. She also has a black pair of over-ear headphones around her neck and a silver ring on her right hand.",
        "clothing": {
          "vague": false,
          "clothing": [
            {
              "possible_names": [
                "sweater",
                "knitwear",
                "pullover"
              ],
              "name": "sweater",
              "type": "top",
              "color": [
                "white"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "earphones",
                "headphones"
              ],
              "name": "headphones",
              "type": "accessory",
              "color": [
                "black"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "ring"
              ],
              "name": "ring",
              "type": "accessory",
              "color": [
                "silver"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "nose ring"
              ],
              "name": "nose ring",
              "type": "accessory",
              "color": [
                "silver"
              ],
              "belonging_confident": true,
              "existence_confident": true
            }
          ]
        },
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "ring"
            ],
            "name": "ring",
            "position": "hand"
          }
        ],
        "description": "A female adult appears in the foreground with a neutral expression. She is dressed in a white knitted sweater and has black over-ear headphones resting around her neck. A silver ring adorns her right hand. Her hair is styled in an afro, and she has a nose piercing. The background is plain and light-colored.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a calm and composed expression, with their eyes slightly closed and a relaxed posture.",
        "meaningful": true,
        "story": "The person seems to be in a moment of reflection or relaxation, possibly listening to music or taking a break. The headphones suggest an interest in audio or music-related activities.",
        "race": "black",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is holding a pair of headphones around their neck, suggesting they might be taking a break from listening to music or preparing to put them on. Their gaze is directed downwards, indicating a moment of contemplation or perhaps feeling shy or reserved. The casual pose and relaxed demeanor suggest a comfortable setting, possibly at home or in a familiar environment where they feel at ease. The white sweater adds to the cozy atmosphere, hinting at a preference for comfort and warmth. The overall scene conveys a sense of quiet introspection or casual leisure.",
        "intention": "The individual is momentarily pausing to reflect or prepare for a moment of personal connection with music in a comfortable and familiar space",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.3212299811875537,
            0.25006697960000823
          ],
          [
            0.3189125570690348,
            0.2897437114564199
          ],
          [
            0.3164613131256331,
            0.3352484202258802
          ],
          [
            0.3174335774921236,
            0.3712984127342385
          ],
          [
            0.3232252302269141,
            0.41317610097309904
          ],
          [
            0.33271865954711327,
            0.4539019717741265
          ],
          [
            0.341031724888654,
            0.493161850505405
          ],
          [
            0.34900564991292504,
            0.5360592472490179
          ],
          [
            0.36307206327716507,
            0.5600601458675647
          ],
          [
            0.3894550969912892,
            0.5652346545426303
          ],
          [
            0.41913779551784197,
            0.5414493292097062
          ],
          [
            0.4523495266834895,
            0.5177710406994693
          ],
          [
            0.4848049974157697,
            0.4955478250034271
          ],
          [
            0.5089121238816352,
            0.4512244578391787
          ],
          [
            0.5225739478355362,
            0.39294689130530785
          ],
          [
            0.5313561198257265,
            0.3293173196139159
          ],
          [
            0.5399023242649578,
            0.2622506896339396
          ],
          [
            0.31538988844979376,
            0.17127694713060188
          ],
          [
            0.32220803401654674,
            0.13849347569639722
          ],
          [
            0.33429220593756154,
            0.1355986662327297
          ],
          [
            0.3462647690659478,
            0.13837714813373708
          ],
          [
            0.3574225238746121,
            0.15202095711988117
          ],
          [
            0.38400810992433915,
            0.14425794050176305
          ],
          [
            0.4083071984705471,
            0.1285659978471736
          ],
          [
            0.4308672267766226,
            0.1285777489344279
          ],
          [
            0.45506282462960196,
            0.14767491767015406
          ],
          [
            0.4734832032805397,
            0.17757125358102183
          ],
          [
            0.3652459927258037,
            0.22242769598960876
          ],
          [
            0.35906585522350815,
            0.24630103145957624
          ],
          [
            0.3508481241053059,
            0.26785222086956895
          ],
          [
            0.34462163505100063,
            0.29383374591353073
          ],
          [
            0.3399607825846899,
            0.34582121201923915
          ],
          [
            0.34626774003817923,
            0.3497209796199092
          ],
          [
            0.3541762269323781,
            0.35201779581882336
          ],
          [
            0.3676162584906533,
            0.35076276095455916
          ],
          [
            0.38166884751546953,
            0.3562196472019115
          ],
          [
            0.3267443687610683,
            0.25158564653346144
          ],
          [
            0.33180814974364786,
            0.24586529224007217
          ],
          [
            0.3405532448774293,
            0.24361458997877822
          ],
          [
            0.35135431857336136,
            0.24196864107929206
          ],
          [
            0.34159444457008725,
            0.24395245424023382
          ],
          [
            0.3333192837912412,
            0.2473590510862845
          ],
          [
            0.4083534403925851,
            0.2404654391858944
          ],
          [
            0.41933810043902625,
            0.23650259296730083
          ],
          [
            0.4309249140676998,
            0.23700804202644912
          ],
          [
            0.44671689222256344,
            0.24292836397413226
          ],
          [
            0.4325862028059505,
            0.2402395090098103
          ],
          [
            0.4188610456174328,
            0.2418280029423022
          ],
          [
            0.3332488081639722,
            0.426270022341814
          ],
          [
            0.33460131312410035,
            0.4089016576292654
          ],
          [
            0.34268419937718486,
            0.3913006846551542
          ],
          [
            0.35094863286330585,
            0.398148580959865
          ],
          [
            0.36071974393867307,
            0.39294136138189406
          ],
          [
            0.3821686505561784,
            0.4120764428976352
          ],
          [
            0.4064843918950785,
            0.4404754583167021
          ],
          [
            0.38245756938343956,
            0.4564702931535307
          ],
          [
            0.3635951078718617,
            0.46692690969144224
          ],
          [
            0.35187153085356665,
            0.4723832101418228
          ],
          [
            0.3439528483720053,
            0.4662059107785502
          ],
          [
            0.3369283298651377,
            0.4496682061720147
          ],
          [
            0.3364897606450887,
            0.42744798975646814
          ],
          [
            0.3441469372737975,
            0.429964198637261
          ],
          [
            0.3511879002764111,
            0.4304139969840882
          ],
          [
            0.36333047208331876,
            0.42866185480955415
          ],
          [
            0.39892695113306953,
            0.4392002017409713
          ],
          [
            0.36339803703484086,
            0.4263659055901583
          ],
          [
            0.3522697288365591,
            0.4238178762178572
          ],
          [
            0.34522557560177075,
            0.4226856009670036
          ]
        ],
        "visibility": [
          0.999975323677063,
          3.9718880628925035e-08,
          3.475007906672545e-05,
          7.0920391548367e-15,
          0.042168863117694855,
          3.272310641477816e-05,
          6.049132379628685e-16,
          6.509071961717557e-20,
          0.9901170134544373,
          1.2907683090906475e-15,
          5.160703153705981e-08,
          2.391430387049809e-10,
          1.6313355180597178e-11,
          0.015284320339560509,
          6.850640931269081e-13,
          1.3506631830750848e-06,
          6.018421117914841e-06,
          4.6339434511821764e-09,
          1.774323621361873e-08,
          1.2561010862555122e-06,
          6.448784561907672e-11,
          8.72977850008283e-08,
          0.9438424110412598,
          4.167203915272921e-09,
          1.161260486642196e-14,
          3.782391744646188e-15,
          2.0029139805033402e-11,
          4.3587456275417935e-06,
          3.124011271893323e-08
        ],
        "headpose": {
          "pitch": 5.816567752841703,
          "yaw": 30.22138775639368,
          "roll": 3.1191570024217095
        },
        "attributes": {
          "5 oClock Shadow": 0.004169246647506952,
          "Arched Eyebrows": 0.01999877393245697,
          "Attractive": 0.35755109786987305,
          "Bags Under Eyes": 0.08097167313098907,
          "Bald": 4.8172187234740704e-05,
          "Bangs": 0.0034314722288399935,
          "Big Lips": 0.7723268270492554,
          "Big Nose": 0.17448589205741882,
          "Black Hair": 0.5218778252601624,
          "Blond Hair": 0.001783710322342813,
          "Blurry": 0.005158035084605217,
          "Brown Hair": 0.06446438282728195,
          "Bushy Eyebrows": 0.03470577672123909,
          "Chubby": 0.035570625215768814,
          "Double Chin": 0.006054338999092579,
          "Eyeglasses": 0.001352593069896102,
          "Goatee": 0.0008337243343703449,
          "Gray Hair": 0.0014131489442661405,
          "Heavy Makeup": 0.17303870618343353,
          "High Cheekbones": 0.19623005390167236,
          "Male": 0.4210696220397949,
          "Mouth Slightly Open": 0.3588029742240906,
          "Mustache": 0.0004565247509162873,
          "Narrow Eyes": 0.669278085231781,
          "No Beard": 0.9965938925743103,
          "Oval Face": 0.19064250588417053,
          "Pale Skin": 0.004480199888348579,
          "Pointy Nose": 0.07727757096290588,
          "Receding Hairline": 0.07461772114038467,
          "Rosy Cheeks": 0.0018605977529659867,
          "Sideburns": 5.7589943025959656e-05,
          "Smiling": 0.052957650274038315,
          "Straight Hair": 0.06525614857673645,
          "Wavy Hair": 0.28215864300727844,
          "Wearing Earrings": 0.13400046527385712,
          "Wearing Hat": 0.00043892604298889637,
          "Wearing Lipstick": 0.427334725856781,
          "Wearing Necklace": 0.01880136877298355,
          "Wearing Necktie": 0.018463077023625374,
          "Young": 0.9831374883651733
        },
        "age": [
          0.8259088397026062,
          0.991679847240448,
          0.8768935799598694,
          0.07857485860586166,
          0.0040433467365801334,
          0.0002571880759205669,
          4.886859096586704e-05,
          1.5849816918489523e-05
        ],
        "race": [
          0.0829881951212883,
          0.8250052332878113,
          0.5254860520362854,
          0.1670067012310028,
          0.8078272342681885
        ],
        "gender": [
          0.18273355066776276,
          0.7976139783859253
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 0.0013802770808979403,
          "disgust": 4.0390302213921814e-08,
          "fear": 1.8139319494366646,
          "happy": 0.027897857944481075,
          "sad": 97.32775092124939,
          "surprise": 0.0006261538146645762,
          "neutral": 0.8284171111881733
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 617,
          "h": 742,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 33,
        "gender": {
          "Woman": 17.344930768013,
          "Man": 82.65507221221924
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 18.09416115283966,
          "indian": 11.15194708108902,
          "black": 7.723958045244217,
          "white": 18.73452663421631,
          "middle eastern": 17.582842707633972,
          "latino hispanic": 26.712566614151
        },
        "dominant_race": "latino hispanic"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.1474379599094391,
        0.005501699633896351,
        0.7022241950035095,
        0.985602855682373
      ]
    ],
    "face_boxes": [
      [
        0.30505913496017456,
        0.03736676648259163,
        0.5195820927619934,
        0.558101236820221
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.2846982796457079,
            0.8985380717962331
          ],
          [
            0.5170301049417919,
            0.7649774823843042
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.26444371026092106,
            0.9070181092192129
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.33354753522078207,
            0.24981520893829257
          ],
          [
            0.42886315585507284,
            0.2519352182940373
          ],
          [
            0.30852718480428054,
            0.29433540540893544
          ],
          [
            0.5384761195845074,
            0.32825555510085386
          ]
        ],
        "dw_hand_1": [
          [
            0.2751667175822788,
            0.8879380250175087
          ],
          [
            0.3144844110939238,
            0.8158577069221818
          ],
          [
            0.3573764403793547,
            0.7543774356055798
          ],
          [
            0.3978855791489284,
            0.7119772484906816
          ],
          [
            0.41933159379164386,
            0.6886571455774876
          ],
          [
            0.36690800244278376,
            0.6759370894430182
          ],
          [
            0.40860858647028614,
            0.6398969303953549
          ],
          [
            0.4181401485337151,
            0.6462569584625897
          ],
          [
            0.42409737482335835,
            0.6674570520200388
          ],
          [
            0.36095077615314064,
            0.6801771081545082
          ],
          [
            0.4062256959544288,
            0.6526169865298243
          ],
          [
            0.40860858647028614,
            0.6674570520200388
          ],
          [
            0.4026513601806429,
            0.6886571455774876
          ],
          [
            0.3442705425421398,
            0.6950171736447224
          ],
          [
            0.39907702440685694,
            0.6738170800872734
          ],
          [
            0.39907702440685694,
            0.6928971642889775
          ],
          [
            0.3823967907958561,
            0.7162172672021715
          ],
          [
            0.32878175418906747,
            0.7119772484906816
          ],
          [
            0.3871625718275707,
            0.7119772484906816
          ],
          [
            0.3871625718275707,
            0.7416573794711104
          ],
          [
            0.36929089295864104,
            0.7607374636728145
          ]
        ],
        "dw_hand_2": [
          [
            0.28350683438777924,
            0.8964180624404884
          ],
          [
            0.31925019212563827,
            0.7882975852974982
          ],
          [
            0.343079097284211,
            0.7119772484906816
          ],
          [
            0.3883540170854992,
            0.6928971642889775
          ],
          [
            0.41933159379164386,
            0.6801771081545082
          ],
          [
            0.36929089295864104,
            0.6632170333085486
          ],
          [
            0.40860858647028614,
            0.6483769678183346
          ],
          [
            0.42290592956542966,
            0.658977014597059
          ],
          [
            0.43243749162885875,
            0.6674570520200388
          ],
          [
            0.3728652287324269,
            0.684417126865998
          ],
          [
            0.4074171412123574,
            0.6738170800872734
          ],
          [
            0.4074171412123574,
            0.684417126865998
          ],
          [
            0.38954546234342785,
            0.6865371362217428
          ],
          [
            0.37048233821656973,
            0.7183372765579163
          ],
          [
            0.3978855791489284,
            0.7162172672021715
          ],
          [
            0.3907369076013565,
            0.7310573326923857
          ],
          [
            0.3835882360537846,
            0.7352973514038756
          ],
          [
            0.37167378347449836,
            0.7670974917400492
          ],
          [
            0.3871625718275707,
            0.769217501095794
          ],
          [
            0.38477968131171336,
            0.7798175478745186
          ],
          [
            0.3776310097641415,
            0.7861775759417532
          ]
        ],
        "dw_face": [
          [
            0.31210152057806656,
            0.24345518087105758
          ],
          [
            0.3049528490304947,
            0.29433540540893544
          ],
          [
            0.3025699585146374,
            0.34521562994681326
          ],
          [
            0.30733573954635196,
            0.393975845128946
          ],
          [
            0.3156758563518524,
            0.4427360603110787
          ],
          [
            0.3275903089311388,
            0.4893762661374667
          ],
          [
            0.3406962067683537,
            0.5317764532523648
          ],
          [
            0.36452511192692644,
            0.5593365748770487
          ],
          [
            0.3931197981172138,
            0.5593365748770487
          ],
          [
            0.421714484307501,
            0.5466165187425791
          ],
          [
            0.4479262799819311,
            0.5232964158293851
          ],
          [
            0.4705637398825752,
            0.49361628484895653
          ],
          [
            0.49200975452529067,
            0.46181614451278286
          ],
          [
            0.5051156523625056,
            0.41729594804214
          ],
          [
            0.5158386596838633,
            0.36853573286000707
          ],
          [
            0.5217958859735066,
            0.31977551767787415
          ],
          [
            0.526561667005221,
            0.2731353118514864
          ],
          [
            0.31329296583599514,
            0.1883349376216903
          ],
          [
            0.3228245278994243,
            0.17561488148722074
          ],
          [
            0.33235608996285326,
            0.17349487213147602
          ],
          [
            0.34188765202628246,
            0.17349487213147602
          ],
          [
            0.3526106593476402,
            0.17773489084296568
          ],
          [
            0.3955026886330711,
            0.17137486277573089
          ],
          [
            0.4157572580178578,
            0.16289482535275138
          ],
          [
            0.4360118274026447,
            0.16077481599700646
          ],
          [
            0.4562663967874315,
            0.16713484406424103
          ],
          [
            0.47532952091428965,
            0.1883349376216903
          ],
          [
            0.36571655718485524,
            0.24769519958254746
          ],
          [
            0.3585678856372833,
            0.2688952931399967
          ],
          [
            0.35141921408971144,
            0.29009538669744556
          ],
          [
            0.3454619878000683,
            0.3112954802548947
          ],
          [
            0.33354753522078207,
            0.3536956673697928
          ],
          [
            0.34188765202628246,
            0.3600556954370276
          ],
          [
            0.3538021046055687,
            0.3600556954370276
          ],
          [
            0.3680994477007124,
            0.3600556954370276
          ],
          [
            0.38120534553792745,
            0.3600556954370276
          ],
          [
            0.31925019212563827,
            0.2582952463612721
          ],
          [
            0.32878175418906747,
            0.25617523700552713
          ],
          [
            0.3395047615104252,
            0.2540552276497822
          ],
          [
            0.3502277688317829,
            0.2540552276497822
          ],
          [
            0.3395047615104252,
            0.260415255717017
          ],
          [
            0.32878175418906747,
            0.26253526507276176
          ],
          [
            0.4062256959544288,
            0.25617523700552713
          ],
          [
            0.4205230390495724,
            0.2540552276497822
          ],
          [
            0.43720327266057335,
            0.25617523700552713
          ],
          [
            0.45269206101364556,
            0.2582952463612721
          ],
          [
            0.43720327266057335,
            0.26465527442850684
          ],
          [
            0.4205230390495724,
            0.26253526507276176
          ],
          [
            0.3275903089311388,
            0.43637603224384414
          ],
          [
            0.33235608996285326,
            0.41941595739788473
          ],
          [
            0.34188765202628246,
            0.40669590126341537
          ],
          [
            0.3502277688317829,
            0.40669590126341537
          ],
          [
            0.3585678856372833,
            0.4045758919076704
          ],
          [
            0.38001390027999876,
            0.41729594804214
          ],
          [
            0.4026513601806429,
            0.43637603224384414
          ],
          [
            0.3871625718275707,
            0.4533361070898033
          ],
          [
            0.37048233821656973,
            0.46817617258001765
          ],
          [
            0.35141921408971144,
            0.47241619129150747
          ],
          [
            0.3406962067683537,
            0.4660561632242727
          ],
          [
            0.33235608996285326,
            0.4533361070898033
          ],
          [
            0.33116464470492474,
            0.4384960415995889
          ],
          [
            0.3395047615104252,
            0.434256022888099
          ],
          [
            0.3502277688317829,
            0.43001600417660935
          ],
          [
            0.37405667399035564,
            0.43213601353235426
          ],
          [
            0.3978855791489284,
            0.43637603224384414
          ],
          [
            0.37524811924828416,
            0.43637603224384414
          ],
          [
            0.35141921408971144,
            0.4384960415995889
          ],
          [
            0.3406962067683537,
            0.4384960415995889
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "021314",
  "objects": [],
  "mask_file": "./person_labeling/./021314.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A person wearing a white textured sweater holds black headphones around their neck against a plain light gray background with soft lighting and minimalistic style emphasizing simplicity and modernity",
  "overall_past": "Before this scene, the individual was likely listening to music through the black headphones, perhaps engrossed in a playlist, podcast, or audiobook. The soft lighting and minimalistic setting suggest a calm, intentional environment—possibly a quiet morning or evening at home. The act of placing the headphones around the neck indicates a pause in listening, signaling a transition from active engagement with audio to a moment of reflection or stillness. This brief break may have been prompted by a thought, a shift in mood, or simply a desire to be present in the moment without external input, highlighting a personal ritual of mindfulness or emotional reset.",
  "overall_past_clean": "The individual was fully immersed in a stream of auditory content, their focus entirely absorbed in the rhythm and flow of sound, as if time had slowed to match the cadence of the music, thoughts, and emotions unfolding within.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to put the headphones on and begin listening to music, perhaps as a way to immerse themselves in a personal moment of focus or emotional connection. The downward gaze and relaxed posture suggest a transition from stillness to engagement—possibly selecting a playlist, adjusting the volume, or simply allowing the music to guide their thoughts. This small, deliberate action would mark the shift from quiet contemplation to a more inward, sensory experience, reinforcing the scene’s theme of modern, minimalist self-care.",
  "overall_future_clean": "The rhythm takes hold, pulling attention inward as the mind settles into a focused stillness, the body responding to the pulse with subtle shifts in breath and posture, fully absorbed in the unfolding sensory journey.",
  "future_scene_ok": true
}