{
  "video_path": "./ref_datasets/part2/7710586000.mp4",
  "start_time": 0.0,
  "end_time": 6.08,
  "image_path": "./027003.jpg",
  "represents_multiple_types": false,
  "cross_video_duplicate": false,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/7710586000.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/face_5256881235505922583_1_7710586000.mp4_0.00_6.08.jpg",
      "type": "face"
    }
  ],
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a black top with a visible necklace around her neck.",
        "clothing": {
          "vague": false,
          "clothing": [
            {
              "possible_names": [
                "shirt",
                "blouse",
                "top"
              ],
              "name": "shirt",
              "type": "top",
              "color": [
                "black"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "glasses"
              ],
              "name": "glasses",
              "type": "accessory",
              "color": [
                "black"
              ],
              "belonging_confident": true,
              "existence_confident": true
            }
          ]
        },
        "objects": [],
        "description": "A female adult with curly brown hair and glasses is in the foreground. She appears to have a neutral expression. She is wearing a black top and a silver necklace. There are no other objects directly associated with her.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a neutral expression, neither displaying strong positive nor negative emotions. The eyes seem focused, possibly indicating concentration or thoughtfulness.",
        "meaningful": false,
        "story": "unknown",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person with curly hair and glasses appears to be focused on something off-camera, possibly a screen or an object of interest, as indicated by the reflection in their glasses. Their expression is serious and concentrated, suggesting they might be engaged in a task that requires attention and thought. The slight downward tilt of their head and the intensity in their gaze imply a deep level of engagement, perhaps indicating they are analyzing or studying the subject before them. The overall demeanor suggests a moment of quiet concentration, possibly for work, study, or personal interest.",
        "intention": "They are deeply engaged in analyzing or studying something important requiring focused attention",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.31619045747876434,
            0.35126073019845144
          ],
          [
            0.31794882928911,
            0.43961027690342497
          ],
          [
            0.32672112717825386,
            0.5259816646575928
          ],
          [
            0.336692037917341,
            0.6114954948425293
          ],
          [
            0.3525186620037338,
            0.6962552751813617
          ],
          [
            0.3803799802345955,
            0.7613443647112165
          ],
          [
            0.41939978743071804,
            0.8209475789751325
          ],
          [
            0.45748408843896216,
            0.8653300149100167
          ],
          [
            0.5025968985199663,
            0.8841502325875419
          ],
          [
            0.5484377562617218,
            0.8907226834978376
          ],
          [
            0.5970237509879683,
            0.8542898041861398
          ],
          [
            0.6430912674072065,
            0.8159606797354562
          ],
          [
            0.6809511898151999,
            0.7517715181623187
          ],
          [
            0.7030581346313869,
            0.675671032496861
          ],
          [
            0.7185276986232825,
            0.5908748762948173
          ],
          [
            0.7323733916107034,
            0.507375887462071
          ],
          [
            0.7461294015603406,
            0.4095278467450823
          ],
          [
            0.3506569029414095,
            0.2564758573259626
          ],
          [
            0.38154307613149285,
            0.21699036870683944
          ],
          [
            0.42143133624423557,
            0.21738903863089426
          ],
          [
            0.46495645254617557,
            0.23257919720241002
          ],
          [
            0.5002575012788708,
            0.2689205067498343
          ],
          [
            0.5569857848043154,
            0.2726912498474121
          ],
          [
            0.5958596195559949,
            0.24475884437561035
          ],
          [
            0.6391384495156152,
            0.2446726390293666
          ],
          [
            0.680251624119202,
            0.26349096638815744
          ],
          [
            0.7052917742902147,
            0.30421291078839985
          ],
          [
            0.5255597463276769,
            0.3450087479182652
          ],
          [
            0.5214562723329956,
            0.4132214273725237
          ],
          [
            0.5202840846281366,
            0.4762938703809465
          ],
          [
            0.5180638024217582,
            0.5459886619022915
          ],
          [
            0.4822658678583268,
            0.5709998267037528
          ],
          [
            0.49783716129604727,
            0.5919534819466727
          ],
          [
            0.5140203704608471,
            0.6108785356794085
          ],
          [
            0.5343328374936911,
            0.5953482900347028
          ],
          [
            0.5506990988589158,
            0.5838682310921806
          ],
          [
            0.4040371780616364,
            0.33725336619785856
          ],
          [
            0.4271990956123253,
            0.322030816759382
          ],
          [
            0.4469700633032646,
            0.32853167397635324
          ],
          [
            0.4731655096069777,
            0.35746639115469797
          ],
          [
            0.44362351794760413,
            0.35436974252973286
          ],
          [
            0.42449638706498916,
            0.35167029925755094
          ],
          [
            0.5763969943093668,
            0.36750350679670063
          ],
          [
            0.6052739064408732,
            0.34636919839041574
          ],
          [
            0.6206398029212974,
            0.3487109456743513
          ],
          [
            0.64623784998964,
            0.36955128397260395
          ],
          [
            0.6226377205956461,
            0.37746078627450125
          ],
          [
            0.6064859954972885,
            0.37037413460867746
          ],
          [
            0.4409746002222944,
            0.6632271494184222
          ],
          [
            0.468059713661205,
            0.6655291148594448
          ],
          [
            0.4906983154859128,
            0.6626917975289481
          ],
          [
            0.5100347194571181,
            0.6731901850019183
          ],
          [
            0.5304538941044095,
            0.6638514654976981
          ],
          [
            0.5548119211702474,
            0.6777283804757255
          ],
          [
            0.5849747208579044,
            0.6915909222194127
          ],
          [
            0.5503848092131582,
            0.728196280343192
          ],
          [
            0.5233397111296654,
            0.736161640712193
          ],
          [
            0.5055470524488815,
            0.734710557120187
          ],
          [
            0.4914621603592033,
            0.7277614048549107
          ],
          [
            0.4649286166033042,
            0.7070006643022809
          ],
          [
            0.4541570757449206,
            0.6680024691990444
          ],
          [
            0.4992495931385617,
            0.6862207821437291
          ],
          [
            0.5101353848669012,
            0.6974027497427804
          ],
          [
            0.5198052304081752,
            0.697166987827846
          ],
          [
            0.5702039625362627,
            0.6942483357020787
          ],
          [
            0.5200185696344956,
            0.6985064234052386
          ],
          [
            0.5078803694840255,
            0.6978099686758858
          ],
          [
            0.4959395480192532,
            0.6851966721670968
          ]
        ],
        "visibility": [
          0.01775926724076271,
          0.5239406228065491,
          0.024159347638487816,
          0.6549588441848755,
          2.9579840088445053e-07,
          0.004658436868339777,
          5.776275429525413e-06,
          0.7077686786651611,
          9.122240953729488e-06,
          0.9943563342094421,
          8.778844318158008e-10,
          0.36310213804244995,
          1.220052672579186e-05,
          4.5516493352160126e-11,
          0.9999593496322632,
          0.04701003432273865,
          1.623065912781385e-07,
          0.9995844960212708,
          1.627448277866355e-14,
          1.4769223355415306e-07,
          2.262612672853612e-16,
          7.070272163628019e-21,
          3.621314877198627e-14,
          3.4759649585741625e-12,
          4.32405753536339e-17,
          1.8766673514535514e-15,
          2.1875755791559054e-17,
          8.010614913566043e-17,
          1.3102994167110693e-12
        ],
        "headpose": {
          "pitch": -6.422580555819315,
          "yaw": 1.2563748780097643,
          "roll": 3.0465418462607188
        },
        "attributes": {
          "5 oClock Shadow": 0.002438576426357031,
          "Arched Eyebrows": 0.07167723029851913,
          "Attractive": 0.4747900664806366,
          "Bags Under Eyes": 0.12659825384616852,
          "Bald": 2.6361650640183143e-09,
          "Bangs": 0.6643940806388855,
          "Big Lips": 0.21411387622356415,
          "Big Nose": 0.3190235495567322,
          "Black Hair": 0.002339113038033247,
          "Blond Hair": 0.013648437336087227,
          "Blurry": 1.6849851817823946e-05,
          "Brown Hair": 0.8635275363922119,
          "Bushy Eyebrows": 0.0280916765332222,
          "Chubby": 0.023206802085042,
          "Double Chin": 0.011676738038659096,
          "Eyeglasses": 0.06972654908895493,
          "Goatee": 5.952053106739186e-05,
          "Gray Hair": 0.0007226833840832114,
          "Heavy Makeup": 0.1539851725101471,
          "High Cheekbones": 0.1339140087366104,
          "Male": 0.3693852126598358,
          "Mouth Slightly Open": 0.08990593254566193,
          "Mustache": 2.112879701599013e-05,
          "Narrow Eyes": 0.11057242751121521,
          "No Beard": 0.9990695118904114,
          "Oval Face": 0.5225799679756165,
          "Pale Skin": 0.020840151235461235,
          "Pointy Nose": 0.11041902750730515,
          "Receding Hairline": 2.5106262910412624e-05,
          "Rosy Cheeks": 0.03835078701376915,
          "Sideburns": 1.0972307791234925e-05,
          "Smiling": 0.025361448526382446,
          "Straight Hair": 0.0006097467266954482,
          "Wavy Hair": 0.984886109828949,
          "Wearing Earrings": 0.019609058275818825,
          "Wearing Hat": 0.00021804218704346567,
          "Wearing Lipstick": 0.626633882522583,
          "Wearing Necklace": 0.0586603544652462,
          "Wearing Necktie": 0.0017694017151370645,
          "Young": 0.9617448449134827
        },
        "age": [
          0.03824584186077118,
          0.9661391973495483,
          0.9059141278266907,
          0.4729844331741333,
          0.13329105079174042,
          0.004790793173015118,
          0.00020016933558508754,
          2.9257139431138057e-06
        ],
        "race": [
          0.989309549331665,
          0.0014807054540142417,
          0.486432820558548,
          0.11292006820440292,
          0.7643994092941284
        ],
        "gender": [
          0.03677539527416229,
          0.9730567336082458
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 7.305634766817093,
          "disgust": 0.016202240658458322,
          "fear": 60.70640683174133,
          "happy": 23.700284957885742,
          "sad": 1.57318115234375,
          "surprise": 2.018211781978607,
          "neutral": 4.680077359080315
        },
        "dominant_emotion": "fear",
        "region": {
          "x": 0,
          "y": 0,
          "w": 2284,
          "h": 2159,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 35,
        "gender": {
          "Woman": 98.01986813545227,
          "Man": 1.9801368936896324
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 2.4686126260194188e-05,
          "indian": 0.00022780638112591896,
          "black": 1.1412217407401345e-07,
          "white": 98.51416936601218,
          "middle eastern": 1.3351476615755355,
          "latino hispanic": 0.1504286980511962
        },
        "dominant_race": "white"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.16180144250392914,
        0.0031146423425525427,
        0.9985355138778687,
        0.9856101870536804
      ]
    ],
    "face_boxes": [
      [
        0.34054476022720337,
        0.03587570786476135,
        0.7124701738357544,
        0.8843489289283752
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.6100080524616771,
            0.9503823499274409
          ],
          [
            0.2833696233961317,
            0.9972585296922409
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.9366464815272225,
            0.9035061701626408
          ],
          [
            1.1013381264342201,
            0.9451738855091301
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.7042482714917924,
            0.6222490915738401
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.4370818253093296,
            0.33751970337283227
          ],
          [
            0.6109230060444938,
            0.3583535610460767
          ],
          [
            0.3346070240338643,
            0.38613203794373613
          ],
          [
            0.7243772503137589,
            0.42085513406581015
          ]
        ],
        "dw_hand_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_hand_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_face": [
          [
            0.3474163741932975,
            0.30626891686296553
          ],
          [
            0.3474163741932975,
            0.39654896678035845
          ],
          [
            0.351076188524564,
            0.48682901669775114
          ],
          [
            0.3602257243527306,
            0.5771090666151438
          ],
          [
            0.3730350745121639,
            0.6604444973081219
          ],
          [
            0.3986537748310301,
            0.740307618388892
          ],
          [
            0.4297621966467964,
            0.8097538106330405
          ],
          [
            0.46819024712509577,
            0.865310764428359
          ],
          [
            0.5139379262659286,
            0.8861446221016036
          ],
          [
            0.5633454197380279,
            0.8687830740405665
          ],
          [
            0.6054332845475937,
            0.8271153586940777
          ],
          [
            0.6402015206946267,
            0.7646137856743442
          ],
          [
            0.6694800353447594,
            0.6951675934301962
          ],
          [
            0.6877791070010926,
            0.6153044723494251
          ],
          [
            0.6987585499948925,
            0.5284967320442402
          ],
          [
            0.7060781786574257,
            0.4382166821268473
          ],
          [
            0.7079080858230591,
            0.3444643225972471
          ],
          [
            0.37486498167779714,
            0.2646012015164765
          ],
          [
            0.40048368199666334,
            0.24723965345543936
          ],
          [
            0.427932289481163,
            0.25071196306764687
          ],
          [
            0.45721080413129594,
            0.2646012015164765
          ],
          [
            0.4846594116157955,
            0.2819627495775136
          ],
          [
            0.5633454197380279,
            0.2923796784141359
          ],
          [
            0.5907940272225274,
            0.2784904399653061
          ],
          [
            0.6219024490382935,
            0.2715458207408915
          ],
          [
            0.6511809636884266,
            0.2715458207408915
          ],
          [
            0.6767996640072929,
            0.2923796784141359
          ],
          [
            0.5212575549284618,
            0.3583535610460767
          ],
          [
            0.5175977405971951,
            0.42085513406581015
          ],
          [
            0.5157678334315617,
            0.48682901669775114
          ],
          [
            0.5139379262659286,
            0.5493305897174846
          ],
          [
            0.475509875787629,
            0.5909983050639737
          ],
          [
            0.49563885460959545,
            0.6014152339005959
          ],
          [
            0.5157678334315617,
            0.6083598531250105
          ],
          [
            0.5358968122535281,
            0.6014152339005959
          ],
          [
            0.5560257910754944,
            0.5979429242883885
          ],
          [
            0.4023135891622967,
            0.33751970337283227
          ],
          [
            0.427932289481163,
            0.31668584569958785
          ],
          [
            0.45721080413129594,
            0.32710277453620995
          ],
          [
            0.47733978295326235,
            0.3618258706582842
          ],
          [
            0.4498911754687626,
            0.368770489882699
          ],
          [
            0.4242724751498964,
            0.3618258706582842
          ],
          [
            0.5688351412349277,
            0.3757151091071138
          ],
          [
            0.5926239343881607,
            0.3444643225972471
          ],
          [
            0.6219024490382935,
            0.3444643225972471
          ],
          [
            0.6475211493571601,
            0.3652981802704917
          ],
          [
            0.6237323562039269,
            0.38613203794373613
          ],
          [
            0.5962837487194275,
            0.38613203794373613
          ],
          [
            0.45355098980002934,
            0.6882229742057812
          ],
          [
            0.47733978295326235,
            0.6743337357569515
          ],
          [
            0.5011285761064953,
            0.6673891165325365
          ],
          [
            0.5157678334315617,
            0.670861426144744
          ],
          [
            0.5304070907566284,
            0.670861426144744
          ],
          [
            0.5560257910754944,
            0.6812783549813661
          ],
          [
            0.581644491394361,
            0.6951675934301962
          ],
          [
            0.5633454197380279,
            0.7264183799400629
          ],
          [
            0.5395566265847946,
            0.7437799280010996
          ],
          [
            0.5157678334315617,
            0.7507245472255146
          ],
          [
            0.4919790402783287,
            0.740307618388892
          ],
          [
            0.4718500614563625,
            0.7194737607156478
          ],
          [
            0.46087061846256255,
            0.6916952838179886
          ],
          [
            0.48831922594706223,
            0.6951675934301962
          ],
          [
            0.5157678334315617,
            0.7021122126546108
          ],
          [
            0.5450463480816947,
            0.6986399030424032
          ],
          [
            0.5743248627318276,
            0.6986399030424032
          ],
          [
            0.5450463480816947,
            0.7021122126546108
          ],
          [
            0.5157678334315617,
            0.7021122126546108
          ],
          [
            0.48831922594706223,
            0.6951675934301962
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "027003",
  "objects": [],
  "mask_file": "./person_labeling/./027003.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A close-up shot features curly hair and glasses with reflections of a room including a window and wall art in soft natural light creating an intimate and casual atmosphere",
  "overall_past": "Before this scene, the person likely paused their activity—perhaps after a period of distraction or routine—to deliberately focus on a specific task or object of interest. The soft natural light and intimate atmosphere suggest it’s a quiet moment in their day, possibly early afternoon or late morning, when the room is bathed in gentle sunlight. Given their intense concentration and the reflection of a window and wall art in their glasses, they may have just turned toward a screen or document after a brief break—perhaps stepping away from a cluttered workspace, a conversation, or a digital notification. The slight downward tilt of their head and the serious expression indicate they’ve just shifted into deep focus, perhaps realizing the importance of what they’re seeing—such as a breakthrough in a project, a meaningful piece of art, or a critical detail in a problem they’ve been working on. Thus, the most plausible prior event is: they had been momentarily distracted or engaged in a routine task, then noticed something significant that prompted them to refocus with quiet intensity.",
  "overall_past_clean": "They had been pulled away from their work by a fleeting distraction, their attention scattered across routine tasks and digital interruptions, until a sudden realization cut through the noise, snapping them back into focus with purposeful urgency.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the person is likely to slowly lift their head, blink once or twice to refocus, and then reach for a notebook or pen to jot down a key insight or idea that emerged during their concentration. This plausible next action follows naturally from the intense focus and thoughtful expression, suggesting a moment of realization or deep cognitive processing—common in study, creative work, or problem-solving. The soft natural light and intimate atmosphere reinforce a private, introspective moment, making the transition to recording thoughts a quiet, organic continuation of their internal process.",
  "overall_future_clean": "They snap back to awareness, head rising with deliberate calm, eyes adjusting as if emerging from deep thought, then swiftly grasp a writing tool to capture the fleeting clarity now crystallizing in their mind.",
  "future_scene_ok": true
}