{
  "video_path": "./ref_datasets/part2/6688235002.mp4",
  "start_time": 0.0,
  "end_time": 3.04,
  "image_path": "./005650.jpg",
  "represents_multiple_types": false,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/6688235001.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/face_6255479783848476065_1_6688235001.mp4_0.00_6.08.jpg",
      "type": "face"
    },
    {
      "video_path": "./ref_datasets/part2/6688235002.mp4",
      "start_time": 0.0,
      "end_time": 3.04,
      "image_path": "./ref_datasets/extracted_frames/face_-3053584595652215794_1_6688235002.mp4_0.00_3.04.jpg",
      "type": "face"
    },
    {
      "video_path": "./ref_datasets/part2/6688235003.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/face_-2543577892448730385_1_6688235003.mp4_0.00_6.08.jpg",
      "type": "face"
    }
  ],
  "cross_video_duplicate": true,
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a ribbed brown sweater with a round neckline. The texture appears soft and the fit is slightly loose.",
        "clothing": [
          {
            "possible_names": [
              "sweater",
              "knit top",
              "ribbed sweater"
            ],
            "name": "sweater",
            "type": "top",
            "color": [
              "brown"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "pencil",
              "writing tool"
            ],
            "name": "pencil",
            "position": "hand"
          },
          {
            "standalone": false,
            "possible_names": [
              "headphones",
              "earphones"
            ],
            "name": "headphones",
            "position": "head"
          }
        ],
        "description": "The person is an adult female with short gray hair, wearing a ribbed brown sweater. She appears to be in a neutral emotional state. She is holding a pencil in her hand and wearing headphones on her head. The background includes some blurred greenery, suggesting an indoor setting with plants.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a calm and focused expression, possibly engaged in deep thought or concentration.",
        "meaningful": true,
        "story": "The person seems to be in a thoughtful or contemplative state, perhaps working on a task that requires focus. The presence of headphones suggests she might be listening to music or an audiobook, aiding her concentration. The pencil held to her lips could indicate she is brainstorming or writing something down.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is wearing headphones and holding a pencil close to their mouth, suggesting they might be engaged in a task that requires concentration such as writing or drawing while listening to something for inspiration or guidance. Their focused expression indicates deep thought or consideration, possibly indicating they are solving a problem or contemplating ideas. The presence of plants in the background adds a serene atmosphere, which could be contributing to a calm and creative environment conducive to their activity.",
        "intention": "The individual is likely seeking creative inspiration and mental clarity by combining auditory input with focused manual activity in a tranquil setting to enhance problem solving or idea generation",
        "intention_ok": true
      },
      "hoi": [
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "right hand",
            "action": [
              [
                "right hand",
                "holding"
              ],
              [
                "right hand",
                "biting"
              ]
            ]
          },
          "object": 0
        }
      ],
      "facex_detailing": {
        "landmarks": [
          [
            0.5591875496364775,
            0.21020962510790145
          ],
          [
            0.561444597301029,
            0.29220240456717356
          ],
          [
            0.5661694157691228,
            0.3730992334229606
          ],
          [
            0.5757097948165166,
            0.44343214375632156
          ],
          [
            0.5966777228173755,
            0.5020216022218977
          ],
          [
            0.6282044558298021,
            0.5478876318250383
          ],
          [
            0.6637500615346998,
            0.5777318818228586
          ],
          [
            0.6974848213649931,
            0.6040071078709194
          ],
          [
            0.7271640607288905,
            0.6100315536771501
          ],
          [
            0.7513002758934384,
            0.6044443334851946
          ],
          [
            0.7683733803885323,
            0.5682523931775774
          ],
          [
            0.7848464829581124,
            0.5238021101270403
          ],
          [
            0.798543895993914,
            0.4726979051317488
          ],
          [
            0.8086503641945976,
            0.4196709394454956
          ],
          [
            0.8153235185713996,
            0.36770801884787424
          ],
          [
            0.8176641555059523,
            0.3118798051561628
          ],
          [
            0.8204387210664295,
            0.2586372154099601
          ],
          [
            0.6292088508605957,
            0.1648334051881518
          ],
          [
            0.6544628574734642,
            0.13706910610198975
          ],
          [
            0.6846232323419481,
            0.12699812650680542
          ],
          [
            0.7144444295338221,
            0.14023289935929437
          ],
          [
            0.741295489810762,
            0.1672678419521877
          ],
          [
            0.7665653819129581,
            0.17757193105561395
          ],
          [
            0.7869056769779751,
            0.16298091837338038
          ],
          [
            0.8042826538994199,
            0.1563449672290257
          ],
          [
            0.8207580793471564,
            0.16298869677952357
          ],
          [
            0.8264335450671968,
            0.18713414669036865
          ],
          [
            0.7558386552901495,
            0.21727343967982704
          ],
          [
            0.7579638390314011,
            0.2494935137884957
          ],
          [
            0.7625106107620966,
            0.2831845368657793
          ],
          [
            0.7646666663033622,
            0.31932868276323595
          ],
          [
            0.7300639742896671,
            0.36761536768504555
          ],
          [
            0.7425521918705531,
            0.3716274670192174
          ],
          [
            0.7535274914332799,
            0.37890871933528353
          ],
          [
            0.7636387052990141,
            0.37359066520418444
          ],
          [
            0.7725172701336088,
            0.368347099849156
          ],
          [
            0.6625534420921688,
            0.21136358806065147
          ],
          [
            0.6807881605057489,
            0.198112530367715
          ],
          [
            0.6958698715482439,
            0.19784263627869744
          ],
          [
            0.7089146931966146,
            0.22366994619369507
          ],
          [
            0.6927491097223192,
            0.22383790356772285
          ],
          [
            0.6787544182368687,
            0.2226207426616124
          ],
          [
            0.7673472177414667,
            0.23727022750037058
          ],
          [
            0.7819254511878604,
            0.2157049604824611
          ],
          [
            0.7955556506202335,
            0.21645112548555648
          ],
          [
            0.8051588285536994,
            0.23457212959017074
          ],
          [
            0.7962517897288005,
            0.24460499627249582
          ],
          [
            0.7824545179094587,
            0.24187867130552015
          ],
          [
            0.6959263574509393,
            0.4557692834309169
          ],
          [
            0.7205413103103637,
            0.43505368913922987
          ],
          [
            0.7403115635826474,
            0.42036013943808426
          ],
          [
            0.7493829772585914,
            0.43272491863795687
          ],
          [
            0.7584582374209449,
            0.4239022135734558
          ],
          [
            0.7702259381612142,
            0.4438850539071219
          ],
          [
            0.7753164132436117,
            0.4688653605324881
          ],
          [
            0.7665605862935384,
            0.4928785392216274
          ],
          [
            0.7558655307406471,
            0.5015230178833008
          ],
          [
            0.7461103416624524,
            0.502793414252145
          ],
          [
            0.7371790749686105,
            0.49754660470145096
          ],
          [
            0.7172514904113042,
            0.4842357976096018
          ],
          [
            0.7046669483184814,
            0.4568085500172206
          ],
          [
            0.7434037390209379,
            0.451918295451573
          ],
          [
            0.7483823412940616,
            0.457203677722386
          ],
          [
            0.7592695463271367,
            0.45671173504420687
          ],
          [
            0.7684797831944057,
            0.46752854755946566
          ],
          [
            0.7580763112931025,
            0.45950812952859055
          ],
          [
            0.7478270485287621,
            0.45952243464333664
          ],
          [
            0.7411181018466041,
            0.45373438085828505
          ]
        ],
        "visibility": [
          8.932477157941321e-07,
          6.250632606993878e-13,
          0.0005405278643593192,
          6.867048569321119e-16,
          2.100111305480823e-05,
          0.00028826462221331894,
          1.9941158811286486e-15,
          1.2330661837880075e-21,
          0.21614374220371246,
          2.346272826652164e-17,
          7.522013567573538e-11,
          7.371450672088997e-10,
          7.750000804662704e-06,
          0.0001625272270757705,
          2.73869909226971e-14,
          2.8006312614609237e-14,
          3.8221456634346396e-05,
          6.964564016644081e-13,
          9.312473752201567e-13,
          0.8582193851470947,
          4.0437943792104303e-13,
          5.0716558730457e-10,
          8.161102596204728e-05,
          1.1643141078820918e-05,
          7.033910953690992e-11,
          1.4738993359131314e-10,
          1.8434923276799964e-06,
          0.0023911555763334036,
          1.8062422668663203e-07
        ],
        "headpose": {
          "pitch": 0.02279020682621692,
          "yaw": -20.435888430637714,
          "roll": 1.6496861987230709
        },
        "attributes": {
          "5 oClock Shadow": 0.01990535855293274,
          "Arched Eyebrows": 0.08373632282018661,
          "Attractive": 0.23187462985515594,
          "Bags Under Eyes": 0.608404815196991,
          "Bald": 1.6649117242195643e-05,
          "Bangs": 0.0037758690305054188,
          "Big Lips": 0.3203575909137726,
          "Big Nose": 0.207931786775589,
          "Black Hair": 0.010097471997141838,
          "Blond Hair": 0.028283456340432167,
          "Blurry": 0.00013281301653478295,
          "Brown Hair": 0.11657167971134186,
          "Bushy Eyebrows": 0.48468780517578125,
          "Chubby": 0.023678509518504143,
          "Double Chin": 0.006963581778109074,
          "Eyeglasses": 0.005509252659976482,
          "Goatee": 0.0005039627430960536,
          "Gray Hair": 0.022632190957665443,
          "Heavy Makeup": 0.050343647599220276,
          "High Cheekbones": 0.13689596951007843,
          "Male": 0.6705286502838135,
          "Mouth Slightly Open": 0.8213097453117371,
          "Mustache": 0.0003110170364379883,
          "Narrow Eyes": 0.20678770542144775,
          "No Beard": 0.9902448654174805,
          "Oval Face": 0.14112715423107147,
          "Pale Skin": 0.021693645045161247,
          "Pointy Nose": 0.0955720916390419,
          "Receding Hairline": 0.014687187038362026,
          "Rosy Cheeks": 0.0026335420552641153,
          "Sideburns": 0.00011943674326175824,
          "Smiling": 0.007661646697670221,
          "Straight Hair": 0.38008883595466614,
          "Wavy Hair": 0.10947424173355103,
          "Wearing Earrings": 0.02958560176193714,
          "Wearing Hat": 0.0003454957331996411,
          "Wearing Lipstick": 0.1028827652335167,
          "Wearing Necklace": 0.012133467011153698,
          "Wearing Necktie": 0.014502904377877712,
          "Young": 0.8542312383651733
        },
        "age": [
          0.0006560119800269604,
          0.21398036181926727,
          0.9713889360427856,
          0.9578868746757507,
          0.7553375959396362,
          0.010631253942847252,
          0.0005926150479353964,
          3.7069137306389166e-06
        ],
        "race": [
          0.9962676167488098,
          0.0005531955976039171,
          0.848414957523346,
          0.08568666875362396,
          0.3164352774620056
        ],
        "gender": [
          0.023857612162828445,
          0.9737902283668518
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 86.26068830490112,
          "disgust": 2.6128018151827526e-09,
          "fear": 0.16305014723911881,
          "happy": 13.505816459655762,
          "sad": 0.01178868260467425,
          "surprise": 0.0003237091505070566,
          "neutral": 0.05833629402332008
        },
        "dominant_emotion": "angry",
        "region": {
          "x": 0,
          "y": 0,
          "w": 1407,
          "h": 1619,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 38,
        "gender": {
          "Woman": 99.9846339225769,
          "Man": 0.015363693819381297
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 0.00107823852886213,
          "indian": 0.0005341583346307743,
          "black": 1.999754317694169e-05,
          "white": 98.39656352996826,
          "middle eastern": 0.41554756462574005,
          "latino hispanic": 1.1862565763294697
        },
        "dominant_race": "white"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.25237351655960083,
        0.0007592910551466048,
        0.9146561622619629,
        0.9868342280387878
      ]
    ],
    "face_boxes": [
      [
        0.5799228549003601,
        0.021012991666793823,
        0.8243439793586731,
        0.6044498085975647
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.5995950876043902,
            0.8606113588776974
          ],
          [
            0.3572404685152901,
            0.8528877294384101
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.6697694101466073,
            1.004785775077725
          ],
          [
            0.8419497066934902,
            0.8683349883169847
          ],
          [
            0.8810158243974049,
            1.022807577102728
          ],
          [
            0.8231400944656796,
            0.9867639730527211
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.6827914493812455,
            0.21955011541685976
          ],
          [
            0.7884146565066444,
            0.22984828800257592
          ],
          [
            0.559805523276329,
            0.2813391509311572
          ],
          [
            0.8231400944656796,
            0.2993609529561607
          ]
        ],
        "dw_hand_1": [
          [
            -1.0,
            -1.0
          ],
          [
            0.7276451400783326,
            0.9429967395634271
          ],
          [
            0.7102824210988151,
            0.9249749375384236
          ],
          [
            0.7146231008436944,
            0.896654962927704
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.7218575670851601,
            0.9121022218062786
          ],
          [
            0.7507954320510227,
            0.8734840746098423
          ],
          [
            0.763817471285661,
            0.8837822471955585
          ],
          [
            0.7724988307754199,
            0.901804049220562
          ],
          [
            0.7450078590578503,
            0.9352731101241403
          ],
          [
            0.762370578037368,
            0.8992295060741332
          ],
          [
            0.7681581510305404,
            0.9275494806848529
          ],
          [
            0.7681581510305404,
            0.9352731101241403
          ],
          [
            0.763817471285661,
            0.9532949121491433
          ],
          [
            0.7710519375271268,
            0.9481458258562853
          ],
          [
            0.773945724023713,
            0.9764658004670049
          ],
          [
            0.7710519375271268,
            0.9841894299062927
          ],
          [
            0.7724988307754199,
            0.9713167141741468
          ],
          [
            0.7797332970168854,
            0.9764658004670049
          ],
          [
            0.7768395105202992,
            0.9893385161991504
          ],
          [
            0.7768395105202992,
            0.9919130593455796
          ]
        ],
        "dw_hand_2": [
          [
            0.687132129126125,
            1.0022112319312957
          ],
          [
            0.7001541683607632,
            0.9867639730527211
          ],
          [
            0.7030479548573494,
            0.9558694552955725
          ],
          [
            0.7450078590578503,
            0.9224003943919948
          ],
          [
            0.7782864037685925,
            0.8940804197812747
          ],
          [
            0.6856852358778317,
            0.9301240238312818
          ],
          [
            0.7233044603334533,
            0.8580368157312681
          ],
          [
            0.7681581510305404,
            0.8451640999991231
          ],
          [
            0.7956491227481102,
            0.8554622725848389
          ],
          [
            0.7073886346022289,
            0.961018541588431
          ],
          [
            0.7652643645339542,
            0.9172513080991364
          ],
          [
            0.7927553362515236,
            0.9301240238312818
          ],
          [
            0.8014366957412826,
            0.9455712827098564
          ],
          [
            0.7276451400783326,
            0.9944876024920084
          ],
          [
            0.7797332970168854,
            0.9661676278812887
          ],
          [
            0.7913084430032307,
            0.9764658004670049
          ],
          [
            0.7884146565066444,
            0.9867639730527211
          ],
          [
            0.7479016455544365,
            1.0099348613705827
          ],
          [
            0.7855208700100582,
            0.9919130593455796
          ],
          [
            0.7898615497549374,
            0.9996366887848666
          ],
          [
            0.7840739767617649,
            1.0073603182241542
          ]
        ],
        "dw_face": [
          [
            0.5728275625109672,
            0.22469920170971783
          ],
          [
            0.5742744557592604,
            0.28648823722401545
          ],
          [
            0.5786151355041398,
            0.3482772727383131
          ],
          [
            0.5844027084973124,
            0.40749176510618174
          ],
          [
            0.5959778544836575,
            0.46413171432762107
          ],
          [
            0.6162343599597614,
            0.5181971204026314
          ],
          [
            0.6408315451807446,
            0.5568152675990674
          ],
          [
            0.6712163033949005,
            0.5902843285026455
          ],
          [
            0.7044948481056427,
            0.6083061305276487
          ],
          [
            0.7392202860646778,
            0.6108806736740777
          ],
          [
            0.7696050442788337,
            0.5851352422097871
          ],
          [
            0.7898615497549374,
            0.5362189224276349
          ],
          [
            0.8043304822378688,
            0.4821535163526244
          ],
          [
            0.8159056282242139,
            0.42293902398475597
          ],
          [
            0.8216932012173865,
            0.36114998847045854
          ],
          [
            0.8245869877139728,
            0.2993609529561607
          ],
          [
            0.8216932012173865,
            0.23242283114900517
          ],
          [
            0.635043972187572,
            0.17835742507399466
          ],
          [
            0.655300477663676,
            0.16033562304899115
          ],
          [
            0.6784507696363662,
            0.15518653675613306
          ],
          [
            0.7016010616090561,
            0.1629101661954204
          ],
          [
            0.7233044603334533,
            0.17320833878113656
          ],
          [
            0.7667112577822472,
            0.1809319682204237
          ],
          [
            0.7811801902651787,
            0.1757828819275658
          ],
          [
            0.7956491227481102,
            0.17320833878113656
          ],
          [
            0.8101180552310413,
            0.17320833878113656
          ],
          [
            0.8216932012173865,
            0.19123014080614006
          ],
          [
            0.7479016455544365,
            0.22984828800257592
          ],
          [
            0.7507954320510227,
            0.2633173489061539
          ],
          [
            0.7551361117959022,
            0.29678640980973164
          ],
          [
            0.7580298982924885,
            0.33025547071330963
          ],
          [
            0.7204106738368671,
            0.37402270420260353
          ],
          [
            0.7348796063197983,
            0.37659724734903277
          ],
          [
            0.7493485388027298,
            0.37917179049546185
          ],
          [
            0.7609236847890748,
            0.37917179049546185
          ],
          [
            0.7710519375271268,
            0.37402270420260353
          ],
          [
            0.656747370911969,
            0.22469920170971783
          ],
          [
            0.6741100898914867,
            0.20667739968471432
          ],
          [
            0.6943665953675907,
            0.20925194283114357
          ],
          [
            0.7102824210988151,
            0.23499737429543402
          ],
          [
            0.6914728088710044,
            0.24014646058829228
          ],
          [
            0.6726631966431935,
            0.23757191744186326
          ],
          [
            0.7652643645339542,
            0.24014646058829228
          ],
          [
            0.7768395105202992,
            0.21955011541685976
          ],
          [
            0.7942022294998169,
            0.21955011541685976
          ],
          [
            0.8072242687344551,
            0.24014646058829228
          ],
          [
            0.7942022294998169,
            0.25044463317400845
          ],
          [
            0.7782864037685925,
            0.25044463317400845
          ],
          [
            0.6900259156227112,
            0.46155717118119205
          ],
          [
            0.7146231008436944,
            0.4461099123026176
          ],
          [
            0.7377733928163845,
            0.4358117397169012
          ],
          [
            0.7479016455544365,
            0.4383862828633304
          ],
          [
            0.7565830050441955,
            0.4383862828633304
          ],
          [
            0.7681581510305404,
            0.45125899859547564
          ],
          [
            0.7753926172720061,
            0.46928080062047917
          ],
          [
            0.7681581510305404,
            0.4898771457919117
          ],
          [
            0.7565830050441955,
            0.5027498615240569
          ],
          [
            0.7435609658095573,
            0.5053244046704861
          ],
          [
            0.7233044603334533,
            0.5001753183776279
          ],
          [
            0.7059417413539356,
            0.4821535163526244
          ],
          [
            0.6958134886158837,
            0.46155717118119205
          ],
          [
            0.7204106738368671,
            0.4589826280347628
          ],
          [
            0.7464547523061436,
            0.4589826280347628
          ],
          [
            0.7594767915407817,
            0.46413171432762107
          ],
          [
            0.7710519375271268,
            0.4718553437669082
          ],
          [
            0.7594767915407817,
            0.47442988691333726
          ],
          [
            0.7450078590578503,
            0.47442988691333726
          ],
          [
            0.7204106738368671,
            0.46928080062047917
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "005650",
  "objects": [
    {
      "box": [
        0.7382535934448242,
        0.4478054940700531,
        0.7663705348968506,
        0.8244118690490723
      ],
      "name": "pencil",
      "possible_names": [
        "pencil"
      ]
    }
  ],
  "mask_file": "./person_labeling/./005650.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A person wearing headphones holds a pencil in a room with green plants and blurred background suggesting a calm indoor environment with natural elements and neutral colors",
  "overall_past": "Before the current scene, the individual likely entered the room seeking a peaceful space to focus, possibly after feeling distracted or mentally overwhelmed. They may have turned on music or an audio guide through the headphones to create a mental boundary against external noise, helping to center their thoughts. The act of picking up the pencil suggests they were preparing to jot down ideas, sketch a concept, or work through a creative or analytical challenge. The deliberate choice of a green, plant-filled environment indicates a prior intention to cultivate a calming, nature-inspired atmosphere conducive to deep thinking—perhaps they had been brainstorming earlier but needed a reset, leading them to this quiet corner where they could reconnect with their thoughts and begin the task at hand.",
  "overall_past_clean": "After feeling mentally scattered and overwhelmed by external demands, the individual deliberately retreated into a secluded space, activating a soothing auditory environment to shield the mind from distraction, then paused to center the breath and reestablish focus before beginning the task.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to begin sketching or writing down their ideas, translating the thoughts sparked by the audio into a tangible form. The calm, plant-filled environment and focused demeanor suggest a moment of creative flow, and with the pencil poised near the mouth—possibly as a gesture of contemplation—the next logical step is the act of creation: putting pen to paper to capture insights or solutions that have emerged during the reflective listening session.",
  "overall_future_clean": "The mind, alight with clarity, seizes the moment to commit the emerging thoughts to paper, the hand moving with purpose as ideas take shape in deliberate strokes.",
  "future_scene_ok": true
}