{
  "video_path": "./ref_datasets/part2/6609090000.mp4",
  "start_time": 0.0,
  "end_time": 6.08,
  "image_path": "./005124.jpg",
  "represents_multiple_types": true,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/6609090000.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/person_-4873761820356300805_1_6609090000.mp4_0.00_6.08.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/6609090000.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/face_-4873761820356300805_1_6609090000.mp4_0.00_6.08.jpg",
      "type": "face"
    }
  ],
  "cross_video_duplicate": false,
  "types": [
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a gray tank top under a brown ribbed cardigan. The tank top has thin straps and a scoop neckline. The cardigan is open, revealing the tank top underneath.",
        "clothing": [
          {
            "possible_names": [
              "gray tank top",
              "gray undershirt"
            ],
            "name": "tank top",
            "type": "top",
            "color": [
              "gray"
            ]
          },
          {
            "possible_names": [
              "brown cardigan",
              "brown sweater"
            ],
            "name": "cardigan",
            "type": "top",
            "color": [
              "brown"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "glass of water",
              "drink glass"
            ],
            "name": "glass of water",
            "position": "hand"
          }
        ],
        "description": "A female adult is sitting on a couch, holding a glass of water in her hand. She is wearing a gray tank top under a brown ribbed cardigan. Her expression appears neutral, and she seems to be looking down at the glass. The setting appears to be indoors with a light-colored background.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a calm and composed expression, suggesting a neutral emotional state.",
        "meaningful": true,
        "story": "The person is sitting on a couch, holding a glass of water, possibly taking a moment to relax or hydrate while engaging in an activity such as reading or using a laptop.",
        "race": "asian",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is seated on a gray couch, holding a glass of water in one hand while reaching out with the other towards a laptop, suggesting they might be working or browsing online. They appear focused and engaged, possibly concentrating on something important or interesting on the screen. Their attire, consisting of a casual tank top and cardigan, indicates a relaxed setting at home or a comfortable environment. The overall posture and interaction with the objects around them convey a sense of calm and intent, as if they are deeply involved in their current activity.",
        "intention": "The individual is likely engaged in a focused task requiring attention and access to digital information seeking clarity or progress on an important matter",
        "intention_ok": true
      },
      "hoi": [
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "right hand",
            "action": [
              [
                "right hand",
                "holding"
              ]
            ]
          },
          "object": 0
        }
      ],
      "facex_detailing": {
        "landmarks": [
          [
            0.43453033154919035,
            0.06382304322782648
          ],
          [
            0.42826641117710446,
            0.11672806102762777
          ],
          [
            0.4208805579647777,
            0.16808346749613523
          ],
          [
            0.41987752747677626,
            0.21834480806633277
          ],
          [
            0.4274187809743342,
            0.25881373453392553
          ],
          [
            0.44569285752340443,
            0.29299124044085306
          ],
          [
            0.4658812978260574,
            0.3260758359596212
          ],
          [
            0.4896417743748143,
            0.35521473985500435
          ],
          [
            0.508101436903789,
            0.3645583393712523
          ],
          [
            0.5208732093906119,
            0.3586252858399083
          ],
          [
            0.5313970302187261,
            0.3374596619732166
          ],
          [
            0.5450441357635316,
            0.3189128285362607
          ],
          [
            0.5595530238889512,
            0.29582495575859435
          ],
          [
            0.5710197526784171,
            0.2676538205020642
          ],
          [
            0.5794733059548196,
            0.23992455232711069
          ],
          [
            0.5808813826668829,
            0.21080586985936242
          ],
          [
            0.5857760681992485,
            0.18154968168369676
          ],
          [
            0.4985394376019637,
            0.04084460087238796
          ],
          [
            0.5179064110808429,
            0.03835855328216754
          ],
          [
            0.5361342493267287,
            0.04466363052842478
          ],
          [
            0.5499312280899002,
            0.06367328911231308
          ],
          [
            0.5640350526287442,
            0.08837998105735376
          ],
          [
            0.5809403226134323,
            0.10676388034114132
          ],
          [
            0.5864785014873459,
            0.09951498962583996
          ],
          [
            0.5917189556927909,
            0.09811811507063568
          ],
          [
            0.5944571398553394,
            0.09890000545789325
          ],
          [
            0.5959502697345757,
            0.09642768316168003
          ],
          [
            0.5638560258206867,
            0.13679248372082986
          ],
          [
            0.5638723543002492,
            0.15762452625093007
          ],
          [
            0.5671965271589302,
            0.18201610335597285
          ],
          [
            0.5702792607602619,
            0.20529553082884935
          ],
          [
            0.544525405587185,
            0.2245919870321082
          ],
          [
            0.5475744790619328,
            0.22945204828151317
          ],
          [
            0.552859952336266,
            0.2330613997878221
          ],
          [
            0.5577454395947002,
            0.23355384932623968
          ],
          [
            0.560358582791828,
            0.23219928810836143
          ],
          [
            0.5119663710395496,
            0.10487038196710052
          ],
          [
            0.525416639695565,
            0.10664919595869761
          ],
          [
            0.5312893517670177,
            0.11409657443011248
          ],
          [
            0.5356705081604776,
            0.1268791021493377
          ],
          [
            0.5283596552198842,
            0.12472235689718256
          ],
          [
            0.519610406759949,
            0.11676895886501938
          ],
          [
            0.5666795100839366,
            0.14910032787020244
          ],
          [
            0.5748141178417773,
            0.14504351950196362
          ],
          [
            0.5772123208358174,
            0.1436850151056966
          ],
          [
            0.5814877588124503,
            0.15451877495599173
          ],
          [
            0.5744489957534131,
            0.15719768080131086
          ],
          [
            0.5721145324763798,
            0.1535917669376999
          ],
          [
            0.5133378089893432,
            0.25875075923071966
          ],
          [
            0.5333982566992442,
            0.2545662525469664
          ],
          [
            0.5457765406086331,
            0.2489524375824701
          ],
          [
            0.5505300264628161,
            0.2584331961535903
          ],
          [
            0.552618790879136,
            0.2543423435675404
          ],
          [
            0.5534621151785056,
            0.2671229502511403
          ],
          [
            0.5461143765421141,
            0.27326194457906894
          ],
          [
            0.5461232352824439,
            0.28622385080529267
          ],
          [
            0.5438837951137906,
            0.29698670566397367
          ],
          [
            0.539598433495987,
            0.30120960417247955
          ],
          [
            0.5355795440219697,
            0.295792659249886
          ],
          [
            0.5243433508312418,
            0.28140222471227094
          ],
          [
            0.5179013489435117,
            0.25904971859442494
          ],
          [
            0.5481199089260329,
            0.26912345608706195
          ],
          [
            0.5439233044783275,
            0.2773255560133192
          ],
          [
            0.545692336275464,
            0.2777398641778048
          ],
          [
            0.5444741360133603,
            0.2755002255162234
          ],
          [
            0.5447642674758321,
            0.268337449194893
          ],
          [
            0.5418995453133469,
            0.27120741864360826
          ],
          [
            0.5447814447893983,
            0.267690103520792
          ]
        ],
        "visibility": [
          0.9285240173339844,
          0.03302134573459625,
          0.17088642716407776,
          2.620682837406463e-10,
          0.00010740167635958642,
          6.405694875866175e-05,
          8.723960274884326e-14,
          1.1524065227129518e-17,
          0.9999204874038696,
          0.00020181572472210974,
          1.1475242445158074e-07,
          1.979898467396879e-09,
          0.10995373874902725,
          8.829803846310824e-05,
          4.23236861024634e-06,
          2.0010267220982314e-08,
          8.748089021537453e-05,
          2.212879962826264e-06,
          9.726853870961616e-12,
          0.961605966091156,
          7.882339529349802e-15,
          5.866734795745288e-07,
          2.139470378637043e-09,
          7.218619430204853e-06,
          6.459947594211757e-12,
          5.592655938357893e-08,
          1.6041148853673803e-08,
          0.00013019049947615713,
          0.171897754073143
        ],
        "headpose": {
          "pitch": -9.920892458125833,
          "yaw": -37.49605148664501,
          "roll": 20.29697775084529
        },
        "attributes": {
          "5 oClock Shadow": 0.00026895065093412995,
          "Arched Eyebrows": 0.061713844537734985,
          "Attractive": 0.5087900757789612,
          "Bags Under Eyes": 0.03180859982967377,
          "Bald": 4.409345422118349e-07,
          "Bangs": 0.0013695412781089544,
          "Big Lips": 0.5087321996688843,
          "Big Nose": 0.01823865808546543,
          "Black Hair": 0.22268277406692505,
          "Blond Hair": 0.0015394650399684906,
          "Blurry": 0.0006658006459474564,
          "Brown Hair": 0.34925955533981323,
          "Bushy Eyebrows": 0.015517701394855976,
          "Chubby": 0.0032891018781811,
          "Double Chin": 0.00041202185093425214,
          "Eyeglasses": 0.0023132271599024534,
          "Goatee": 2.692058296815958e-05,
          "Gray Hair": 2.9534608984249644e-05,
          "Heavy Makeup": 0.2373029738664627,
          "High Cheekbones": 0.12351259589195251,
          "Male": 0.002896195277571678,
          "Mouth Slightly Open": 0.07580606639385223,
          "Mustache": 8.706690096005332e-06,
          "Narrow Eyes": 0.612948477268219,
          "No Beard": 0.9994992017745972,
          "Oval Face": 0.13895803689956665,
          "Pale Skin": 0.031945835798978806,
          "Pointy Nose": 0.2542201280593872,
          "Receding Hairline": 0.010076012462377548,
          "Rosy Cheeks": 0.0034492232371121645,
          "Sideburns": 2.6404990421724506e-05,
          "Smiling": 0.004331284202635288,
          "Straight Hair": 0.07520854473114014,
          "Wavy Hair": 0.7290759682655334,
          "Wearing Earrings": 0.013913397677242756,
          "Wearing Hat": 0.00044601954868994653,
          "Wearing Lipstick": 0.5787225961685181,
          "Wearing Necklace": 0.03318248689174652,
          "Wearing Necktie": 0.00033990427618846297,
          "Young": 0.9946150183677673
        },
        "age": [
          0.05670730397105217,
          0.9575269222259521,
          0.9957193732261658,
          0.7712004780769348,
          0.030033890157938004,
          4.791708124685101e-05,
          3.0336125291796634e-06,
          1.470637922551532e-08
        ],
        "race": [
          0.8095667958259583,
          0.00540554104372859,
          0.9729011058807373,
          0.1428714543581009,
          0.7261676788330078
        ],
        "gender": [
          0.0003981012850999832,
          0.9997933506965637
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 6.729155455076352e-07,
          "disgust": 4.2145875954772635e-12,
          "fear": 0.06295641651377082,
          "happy": 3.9973602206089254e-08,
          "sad": 99.93556141853333,
          "surprise": 1.1208446060254887e-13,
          "neutral": 0.0014833241948508658
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 434,
          "h": 457,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 38,
        "gender": {
          "Woman": 99.96115565299988,
          "Man": 0.038844565278850496
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 94.62623596191406,
          "indian": 0.04795092099811882,
          "black": 0.020433396275620908,
          "white": 3.1572870910167694,
          "middle eastern": 0.15674906317144632,
          "latino hispanic": 1.9913479685783386
        },
        "dominant_race": "asian"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.14716246724128723,
        0.00401323800906539,
        0.9013217687606812,
        0.9878271818161011
      ],
      [
        0.14943161606788635,
        0.004815376363694668,
        0.646343469619751,
        0.9862625002861023
      ]
    ],
    "face_boxes": [
      [
        0.43757036328315735,
        0.008763876743614674,
        0.5883849859237671,
        0.3412144184112549
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.4088746635284689,
            0.4579952474449312
          ],
          [
            0.27893617875046195,
            0.4289125721885453
          ],
          [
            0.2920117495457332,
            0.9175015164958293
          ],
          [
            0.4767041870289379,
            0.934951121649661
          ],
          [
            0.5388131483064758,
            0.48707792270131706
          ],
          [
            0.5829431997405159,
            0.8651527010343346
          ],
          [
            0.7610978518260849,
            0.856427898457419
          ],
          [
            0.2854739641480976,
            1.0134743448419032
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.4652630625830757,
            0.9960247396880715
          ],
          [
            0.6989888905485473,
            0.9233180515471066
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.5191997921135691,
            0.10609487684266097
          ],
          [
            0.5698676289452447,
            0.14390235467596263
          ],
          [
            0.4227674574984444,
            0.1090031443682996
          ],
          [
            0.5764054143428803,
            0.18170983250926448
          ]
        ],
        "dw_hand_1": [
          [
            0.7758078689707649,
            0.8535196309317805
          ],
          [
            0.8019590105613075,
            0.8128038855728398
          ],
          [
            0.8232068131036229,
            0.7749964077395384
          ],
          [
            0.8493579546941651,
            0.7691798726882607
          ],
          [
            0.8738746499352985,
            0.7808129427908153
          ],
          [
            0.8591646327906185,
            0.7895377453677312
          ],
          [
            0.8820468816823429,
            0.783721210316454
          ],
          [
            0.8804124353329339,
            0.7924460128933697
          ],
          [
            0.8755090962847075,
            0.8040790829959241
          ],
          [
            0.8624335254894363,
            0.8273452232010331
          ],
          [
            0.8853157743811607,
            0.8244369556753943
          ],
          [
            0.8787779889835251,
            0.8302534907266715
          ],
          [
            0.8689713108870719,
            0.83316175825231
          ],
          [
            0.8607990791400275,
            0.8593361659830573
          ],
          [
            0.8836813280317519,
            0.8593361659830573
          ],
          [
            0.8755090962847075,
            0.8593361659830573
          ],
          [
            0.8640679718388451,
            0.8593361659830573
          ],
          [
            0.8542612937423919,
            0.8942353762907208
          ],
          [
            0.8722402035858895,
            0.8971436438163591
          ],
          [
            0.8689713108870719,
            0.8942353762907208
          ],
          [
            0.8640679718388451,
            0.8913271087650819
          ]
        ],
        "dw_hand_2": [
          [
            0.4865108651253912,
            0.934951121649661
          ],
          [
            0.5110275603665245,
            0.8913271087650819
          ],
          [
            0.5371787019570669,
            0.8506113634061416
          ],
          [
            0.5682331825958359,
            0.841886560829226
          ],
          [
            0.5911154314875603,
            0.8477030958805029
          ],
          [
            0.5159308994147512,
            0.841886560829226
          ],
          [
            0.5388131483064758,
            0.8186204206241171
          ],
          [
            0.5665987362464271,
            0.8244369556753943
          ],
          [
            0.5894809851381515,
            0.841886560829226
          ],
          [
            0.5110275603665245,
            0.8884188412394435
          ],
          [
            0.5404475946558845,
            0.8826023061881663
          ],
          [
            0.5731365216440625,
            0.8971436438163591
          ],
          [
            0.5992876632346047,
            0.9087767139189137
          ],
          [
            0.5061242213182979,
            0.9378593891752994
          ],
          [
            0.5371787019570669,
            0.9465841917522155
          ],
          [
            0.5682331825958359,
            0.9553089943291312
          ],
          [
            0.5927498778369691,
            0.95821726185477
          ],
          [
            0.5061242213182979,
            0.9785751345342397
          ],
          [
            0.5322753629088401,
            0.9843916695855174
          ],
          [
            0.5551576118005646,
            0.9902082046367942
          ],
          [
            0.5764054143428803,
            0.9902082046367942
          ]
        ],
        "dw_face": [
          [
            0.43911192099253343,
            0.06828739900935912
          ],
          [
            0.4374774746431244,
            0.1090031443682996
          ],
          [
            0.43584302829371563,
            0.14390235467596263
          ],
          [
            0.43584302829371563,
            0.18170983250926448
          ],
          [
            0.43911192099253343,
            0.2166090428169275
          ],
          [
            0.4489185990889866,
            0.2485999855989521
          ],
          [
            0.46035972353484894,
            0.2747743933296995
          ],
          [
            0.475069740679529,
            0.30094880106044686
          ],
          [
            0.4914142041736179,
            0.321306673739917
          ],
          [
            0.5093931140171157,
            0.3387562788937487
          ],
          [
            0.5273720238606134,
            0.3358480113681101
          ],
          [
            0.5420820410052934,
            0.3067653361117241
          ],
          [
            0.5535231654511559,
            0.2805909283809767
          ],
          [
            0.5616953971982003,
            0.2485999855989521
          ],
          [
            0.5715020752946535,
            0.21951731034256633
          ],
          [
            0.5747709679934715,
            0.1846181000349031
          ],
          [
            0.5796743070416981,
            0.14971888972723987
          ],
          [
            0.5012208822700712,
            0.05374606138116623
          ],
          [
            0.5142964530653423,
            0.05374606138116623
          ],
          [
            0.5290064702100223,
            0.059562596432443264
          ],
          [
            0.5404475946558845,
            0.07119566653499775
          ],
          [
            0.550254272752338,
            0.08573700416319063
          ],
          [
            0.5698676289452447,
            0.1090031443682996
          ],
          [
            0.5747709679934715,
            0.1090031443682996
          ],
          [
            0.5796743070416981,
            0.11191141189393801
          ],
          [
            0.5829431997405159,
            0.11481967941957684
          ],
          [
            0.5845776460899247,
            0.12354448199649248
          ],
          [
            0.5551576118005646,
            0.13517755209904697
          ],
          [
            0.5567920581499733,
            0.1555354247785171
          ],
          [
            0.5600609508487915,
            0.17298502993234863
          ],
          [
            0.5616953971982003,
            0.19334290261181894
          ],
          [
            0.5306409165594311,
            0.20788424024001184
          ],
          [
            0.5404475946558845,
            0.21370077529128909
          ],
          [
            0.5486198264029292,
            0.2166090428169275
          ],
          [
            0.5551576118005646,
            0.22242557786820474
          ],
          [
            0.5600609508487915,
            0.21951731034256633
          ],
          [
            0.504489774968889,
            0.10027834179138374
          ],
          [
            0.5159308994147512,
            0.10027834179138374
          ],
          [
            0.5257375775112045,
            0.10609487684266097
          ],
          [
            0.5322753629088401,
            0.12063621447085388
          ],
          [
            0.5208342384629779,
            0.12063621447085388
          ],
          [
            0.5110275603665245,
            0.11191141189393801
          ],
          [
            0.5600609508487915,
            0.14681062220160124
          ],
          [
            0.5665987362464271,
            0.14099408715032422
          ],
          [
            0.5715020752946535,
            0.14681062220160124
          ],
          [
            0.5747709679934715,
            0.1555354247785171
          ],
          [
            0.5682331825958359,
            0.15844369230415573
          ],
          [
            0.5633298435476091,
            0.1555354247785171
          ],
          [
            0.5110275603665245,
            0.2485999855989521
          ],
          [
            0.5257375775112045,
            0.2485999855989521
          ],
          [
            0.5420820410052934,
            0.2485999855989521
          ],
          [
            0.5453509337041111,
            0.25150825312459074
          ],
          [
            0.5486198264029292,
            0.25441652065022935
          ],
          [
            0.550254272752338,
            0.26314132322714523
          ],
          [
            0.5486198264029292,
            0.27186612580406105
          ],
          [
            0.5469853800535202,
            0.2776826608553381
          ],
          [
            0.5437164873547023,
            0.2805909283809767
          ],
          [
            0.5388131483064758,
            0.2834991959066153
          ],
          [
            0.5290064702100223,
            0.2747743933296995
          ],
          [
            0.5191997921135691,
            0.26314132322714523
          ],
          [
            0.5142964530653423,
            0.25150825312459074
          ],
          [
            0.5273720238606134,
            0.25732478817586796
          ],
          [
            0.5420820410052934,
            0.26314132322714523
          ],
          [
            0.5453509337041111,
            0.2689578582784222
          ],
          [
            0.5469853800535202,
            0.27186612580406105
          ],
          [
            0.5453509337041111,
            0.26604959075278384
          ],
          [
            0.5420820410052934,
            0.26314132322714523
          ],
          [
            0.5273720238606134,
            0.25732478817586796
          ]
        ],
        "dw_foot_1": [
          [
            0.8232068131036229,
            0.6499409041370785
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "005124",
  "objects": [
    {
      "box": [
        0.5433842539787292,
        0.7073318362236023,
        0.6812558770179749,
        0.9962645173072815
      ],
      "name": "glass of water",
      "possible_names": [
        "glass of water"
      ]
    }
  ],
  "mask_file": "./person_labeling/./005124.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A cozy indoor setting features a person seated on a gray sofa with a white pillow holding a glass of water and using a laptop against a backdrop of white shutters and soft natural light creating a calm and relaxed atmosphere with neutral tones and a casual style.",
  "overall_past": "Before the current scene, the individual likely settled into the space after arriving home or returning from a brief outing, perhaps having just finished a light snack or drink. They may have taken a moment to unwind by adjusting the white shutters to let in soft natural light, creating a serene ambiance. The act of placing the glass of water on a nearby surface before picking up the laptop suggests a deliberate transition from relaxation to focused activity—possibly preparing to work, read, or engage in an online task. The casual yet intentional arrangement of their clothing and posture indicates a routine of balancing comfort with productivity, implying this moment is part of a familiar, daily rhythm.",
  "overall_past_clean": "The individual entered the space, moved with purpose toward a designated area, paused briefly to adjust the environment for comfort and clarity, then transitioned seamlessly into a state of focused readiness.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to set down the glass of water, close the laptop, and stretch slightly, signaling a brief pause in their activity. The calm and focused demeanor suggests they’ve just finished reviewing something important—perhaps a work task, an article, or a personal project—and are now taking a moment to relax, savoring the quiet ambiance before deciding whether to continue or shift to another activity, such as reading a book or stepping outside for a breath of fresh air.",
  "overall_future_clean": "A soft breath escapes, followed by a deliberate shift in posture as the body releases tension, fingers uncurling from the edge of the surface, then rising to stretch upward, arms reaching toward the ceiling before settling back down, the mind already turning toward the next movement—whether it’s the quiet rustle of a page turning or the steady click of a door closing behind a step into the open air.",
  "future_scene_ok": true
}