{
  "video_path": "./ref_datasets/part2/5901085000.mp4",
  "start_time": 0.0,
  "end_time": 6.006,
  "image_path": "./003128.jpg",
  "represents_multiple_types": true,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/5901085000.mp4",
      "start_time": 0.0,
      "end_time": 6.006,
      "image_path": "./ref_datasets/extracted_frames/person_6432481472850785947_1_5901085000.mp4_0.00_6.01.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/5901085000.mp4",
      "start_time": 0.0,
      "end_time": 6.006,
      "image_path": "./ref_datasets/extracted_frames/face_6432481472850785947_1_5901085000.mp4_0.00_6.01.jpg",
      "type": "face"
    },
    {
      "video_path": "./ref_datasets/part2/5901085001.mp4",
      "start_time": 0.0,
      "end_time": 0.9009,
      "image_path": "./ref_datasets/extracted_frames/person_2059225732629080132_1_5901085001.mp4_0.00_0.90.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/5901085001.mp4",
      "start_time": 0.0,
      "end_time": 0.9009,
      "image_path": "./ref_datasets/extracted_frames/face_2059225732629080132_1_5901085001.mp4_0.00_0.90.jpg",
      "type": "face"
    }
  ],
  "cross_video_duplicate": true,
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a black beret, a white blouse with a ruffled collar, a black textured blazer with gold buttons, and black trousers. The outfit is formal and stylish.",
        "clothing": [
          {
            "possible_names": [
              "beret",
              "hat"
            ],
            "name": "beret",
            "type": "headwear",
            "color": [
              "black"
            ]
          },
          {
            "possible_names": [
              "blouse",
              "shirt"
            ],
            "name": "blouse",
            "type": "top",
            "color": [
              "white"
            ]
          },
          {
            "possible_names": [
              "blazer",
              "jacket"
            ],
            "name": "blazer",
            "type": "top",
            "color": [
              "black"
            ]
          },
          {
            "possible_names": [
              "trousers",
              "pants"
            ],
            "name": "trousers",
            "type": "bottom",
            "color": [
              "black"
            ]
          }
        ],
        "objects": [],
        "description": "The person is an adult female standing in the foreground against a light-colored wall. She is dressed in a formal and stylish outfit consisting of a black beret, a white blouse with a ruffled collar, a black textured blazer with gold buttons, and black trousers. Her expression is neutral, and she appears to be posing for the photo.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a calm and composed expression, suggesting a neutral emotional state.",
        "meaningful": true,
        "story": "The person is dressed in a stylish outfit consisting of a black beret, a textured black jacket with gold buttons, a white blouse, and black trousers. The setting suggests an urban environment, possibly during a casual outing or a photoshoot. The individual's pose and attire convey a sense of fashion and confidence.",
        "race": "asian",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is standing against a plain wall, wearing a black beret, a textured black blazer with gold buttons, a white blouse, and black trousers. They have one hand raised to their face, possibly adjusting their hair or simply posing for the photograph. Their posture suggests confidence and style, as they seem to be showcasing their outfit. The overall appearance indicates a fashion-conscious individual who may be modeling or simply enjoying a moment of self-expression through their attire.",
        "intention": "The individual is deliberately showcasing their outfit to express personal style and confidence through intentional posture and gesture",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.5377204974965444,
            0.3416669887623617
          ],
          [
            0.5380807080123791,
            0.36028526047510756
          ],
          [
            0.5399469417869729,
            0.38034532204979943
          ],
          [
            0.5467260102273295,
            0.3992782735753627
          ],
          [
            0.5612502991522431,
            0.4118289458964552
          ],
          [
            0.5819588216208907,
            0.42054119078176366
          ],
          [
            0.6055765982342776,
            0.4281899416375728
          ],
          [
            0.626015129985002,
            0.4329627274047761
          ],
          [
            0.6477655228483613,
            0.43261941756520955
          ],
          [
            0.6570275646038156,
            0.42353007289625355
          ],
          [
            0.660591636069868,
            0.4126351704554898
          ],
          [
            0.6682860371927736,
            0.40588991861967816
          ],
          [
            0.6753760435593822,
            0.3958334526490598
          ],
          [
            0.6832001237011461,
            0.38606649310815905
          ],
          [
            0.6853782726974084,
            0.3717037004019533
          ],
          [
            0.6842405832633771,
            0.36176519865791
          ],
          [
            0.6853637969683086,
            0.3494010974253927
          ],
          [
            0.6047318843306687,
            0.3306197497816313
          ],
          [
            0.6208499179630683,
            0.3248902063816786
          ],
          [
            0.6338401286374955,
            0.3237910437974192
          ],
          [
            0.6473219336025298,
            0.3262291109987668
          ],
          [
            0.659339830862782,
            0.3309419941334497
          ],
          [
            0.6761266799200149,
            0.33248975642380263
          ],
          [
            0.6786401514653806,
            0.32932221843373205
          ],
          [
            0.6820550127004189,
            0.3273655013846499
          ],
          [
            0.6850941369142481,
            0.3265310162589664
          ],
          [
            0.6882208650074307,
            0.3256509122039591
          ],
          [
            0.6658401827332835,
            0.34720482620454973
          ],
          [
            0.6716769877564971,
            0.3553582783433653
          ],
          [
            0.6773681096298985,
            0.36477755088181724
          ],
          [
            0.6807892167378986,
            0.3751445386736166
          ],
          [
            0.6524189186474634,
            0.3840955048799515
          ],
          [
            0.6600788719439633,
            0.38402800013621646
          ],
          [
            0.6677461145416138,
            0.38571422855768883
          ],
          [
            0.6724181891749146,
            0.3840516330585593
          ],
          [
            0.6760508476741731,
            0.3835350025977407
          ],
          [
            0.6172337191760856,
            0.34430878502982004
          ],
          [
            0.6259036007381621,
            0.34201285977448737
          ],
          [
            0.6359875993753867,
            0.34138497798925355
          ],
          [
            0.6401578144421652,
            0.34800055559192383
          ],
          [
            0.6344228832810014,
            0.34954903175433477
          ],
          [
            0.6254954292660667,
            0.347073323457014
          ],
          [
            0.6713821972488726,
            0.34866189543335213
          ],
          [
            0.6754759334382556,
            0.34269851510013855
          ],
          [
            0.679860212941649,
            0.34067734291865714
          ],
          [
            0.6818202119655711,
            0.3454769301982153
          ],
          [
            0.6793940503761251,
            0.347076166421175
          ],
          [
            0.6761121013177135,
            0.3482658780401662
          ],
          [
            0.62330012983746,
            0.3986429775399821
          ],
          [
            0.6445316449674979,
            0.39784395432188396
          ],
          [
            0.6627906536299085,
            0.39494198926147955
          ],
          [
            0.666800092578565,
            0.3968688551868711
          ],
          [
            0.6680000056034673,
            0.3955974991477671
          ],
          [
            0.670185958266889,
            0.39777671258364405
          ],
          [
            0.6690023286002023,
            0.39757437368943577
          ],
          [
            0.6672405809321732,
            0.4022837250360421
          ],
          [
            0.6645210984522703,
            0.407052803678172
          ],
          [
            0.6595236211857467,
            0.41097516743909746
          ],
          [
            0.6509322980093578,
            0.4092994216652144
          ],
          [
            0.6377690840019751,
            0.4054313121807008
          ],
          [
            0.6263542882349125,
            0.3983186917645591
          ],
          [
            0.6536019310749397,
            0.4007801727170036
          ],
          [
            0.6620556833882811,
            0.4025855676758857
          ],
          [
            0.6645678616705395,
            0.40099047692049117
          ],
          [
            0.6676969558473618,
            0.3980048886367253
          ],
          [
            0.6643742396087242,
            0.4001826367562725
          ],
          [
            0.6611899906996066,
            0.4023553126269863
          ],
          [
            0.6507630422001793,
            0.40025080527578083
          ]
        ],
        "visibility": [
          0.7676810026168823,
          0.9997057318687439,
          0.8896207809448242,
          4.3060466850874946e-05,
          7.566929707536474e-05,
          6.898302672198042e-05,
          2.6453129976289347e-05,
          1.2389439474347341e-09,
          0.9995924830436707,
          0.11601655930280685,
          9.154172744274547e-07,
          0.00422345194965601,
          0.9248161911964417,
          0.00020370492711663246,
          0.03884726017713547,
          1.4251145330490544e-05,
          7.648290193174034e-05,
          5.930932729825145e-06,
          9.333956718649006e-09,
          1.0,
          1.3440082380355989e-11,
          5.053333751448008e-08,
          3.6673910436269e-11,
          0.3478296995162964,
          4.527666897001861e-14,
          8.606628604246325e-11,
          2.794046244369852e-11,
          1.9751166036030554e-08,
          0.0004607160808518529
        ],
        "headpose": {
          "pitch": -10.727471204759931,
          "yaw": -48.0593556796091,
          "roll": 7.045581746810042
        },
        "attributes": {
          "5 oClock Shadow": 0.0005148759228177369,
          "Arched Eyebrows": 0.3037877678871155,
          "Attractive": 0.44049200415611267,
          "Bags Under Eyes": 0.2547367215156555,
          "Bald": 3.0273843094619224e-06,
          "Bangs": 0.007759059779345989,
          "Big Lips": 0.5401512384414673,
          "Big Nose": 0.11638388782739639,
          "Black Hair": 0.692335307598114,
          "Blond Hair": 0.000473413267172873,
          "Blurry": 0.001235793810337782,
          "Brown Hair": 0.015201279893517494,
          "Bushy Eyebrows": 0.028180941939353943,
          "Chubby": 0.006432437803596258,
          "Double Chin": 0.00043585675302892923,
          "Eyeglasses": 8.381121733691543e-05,
          "Goatee": 3.4037995646940544e-05,
          "Gray Hair": 5.9359943406889215e-05,
          "Heavy Makeup": 0.12364795804023743,
          "High Cheekbones": 0.17414280772209167,
          "Male": 0.017390970140695572,
          "Mouth Slightly Open": 0.023751573637127876,
          "Mustache": 2.6539977625361644e-05,
          "Narrow Eyes": 0.1814318150281906,
          "No Beard": 0.9994484782218933,
          "Oval Face": 0.050273261964321136,
          "Pale Skin": 0.01854586973786354,
          "Pointy Nose": 0.20159278810024261,
          "Receding Hairline": 0.003705222625285387,
          "Rosy Cheeks": 0.0014198579592630267,
          "Sideburns": 2.0324538127169944e-05,
          "Smiling": 0.023797735571861267,
          "Straight Hair": 0.07833119481801987,
          "Wavy Hair": 0.25576189160346985,
          "Wearing Earrings": 0.027135156095027924,
          "Wearing Hat": 0.08249359577894211,
          "Wearing Lipstick": 0.4194950759410858,
          "Wearing Necklace": 0.01580086722970009,
          "Wearing Necktie": 0.0009820215636864305,
          "Young": 0.9880512952804565
        },
        "age": [
          0.003636109409853816,
          0.8406141400337219,
          0.9971828460693359,
          0.8872013688087463,
          0.1254863739013672,
          0.000310200935928151,
          5.529821464733686e-06,
          1.529483739659554e-08
        ],
        "race": [
          0.06786341965198517,
          0.16461612284183502,
          0.7963988780975342,
          0.9019754528999329,
          0.48021572828292847
        ],
        "gender": [
          0.0016873738495633006,
          0.998863935470581
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 0.0021389695754269085,
          "disgust": 3.0629208848347013e-07,
          "fear": 0.0010157648529108604,
          "happy": 0.005952062219740857,
          "sad": 91.42154557448082,
          "surprise": 1.3844283442955723e-09,
          "neutral": 8.569344601709295
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 232,
          "h": 352,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 30,
        "gender": {
          "Woman": 99.90234375,
          "Man": 0.09765215800143778
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 42.677703499794006,
          "indian": 4.075915738940239,
          "black": 1.581331342458725,
          "white": 22.783680260181427,
          "middle eastern": 7.180320471525192,
          "latino hispanic": 21.701054275035858
        },
        "dominant_race": "asian"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.2297196090221405,
        0.25463858246803284,
        0.9762946963310242,
        0.9987673759460449
      ]
    ],
    "face_boxes": [
      [
        0.5491536259651184,
        0.30243945121765137,
        0.6932836174964905,
        0.42505258321762085
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.5759137001326075,
            0.4680894207706054
          ],
          [
            0.4114316373285732,
            0.48189523339271545
          ],
          [
            0.4285206828147067,
            0.648765490303437
          ],
          [
            0.47765168858734036,
            0.523912923981746
          ],
          [
            0.7403957629366418,
            0.45428360814849533
          ],
          [
            0.8514745585965092,
            0.6163518432776132
          ],
          [
            0.8771081268257094,
            0.7796205838521321
          ],
          [
            0.5011491261307739,
            0.7400039041539033
          ],
          [
            0.47337942721580695,
            0.970500949670871
          ],
          [
            0.4648349044727401,
            1.0857494724293548
          ],
          [
            0.7104899333359084,
            0.7520089586079121
          ],
          [
            0.6699034503063416,
            0.9680999387800694
          ],
          [
            0.652814404820208,
            1.0857494724293548
          ],
          [
            0.6271808365910079,
            0.34863912895321847
          ],
          [
            0.680584103735175,
            0.34863912895321847
          ],
          [
            0.5289188250457405,
            0.3558421616256237
          ],
          [
            0.6827202344209414,
            0.35464165618022275
          ]
        ],
        "dw_hand_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.5374633477888073,
            0.48189523339271545
          ],
          [
            0.526782694359974,
            0.47949422250191365
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.5182381716169072,
            0.4951007932921251
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_hand_2": [
          [
            0.4947407340734737,
            0.5227124185363451
          ],
          [
            0.5118297795596072,
            0.5047048368553321
          ],
          [
            0.526782694359974,
            0.4866972551743189
          ],
          [
            0.5374633477888073,
            0.47589270616571105
          ],
          [
            0.5588246546464742,
            0.46748916804790497
          ],
          [
            0.5182381716169072,
            0.47349169527490936
          ],
          [
            0.5310549557315073,
            0.4638876517117023
          ],
          [
            0.5417356091603406,
            0.4662886626025041
          ],
          [
            0.5460078705318742,
            0.4686896734933058
          ],
          [
            0.520374302302674,
            0.4806947279473146
          ],
          [
            0.5331910864172739,
            0.47349169527490936
          ],
          [
            0.5438717398461074,
            0.47949422250191365
          ],
          [
            0.5460078705318742,
            0.48789776061971984
          ],
          [
            0.5182381716169072,
            0.4890982660651207
          ],
          [
            0.5289188250457405,
            0.4854967497289181
          ],
          [
            0.5374633477888073,
            0.4914992769559225
          ],
          [
            0.5395994784745741,
            0.4975018041829268
          ],
          [
            0.5182381716169072,
            0.4975018041829268
          ],
          [
            0.5246465636742073,
            0.4951007932921251
          ],
          [
            0.5331910864172739,
            0.49870230962832773
          ],
          [
            0.5331910864172739,
            0.5035043314099312
          ]
        ],
        "dw_face": [
          [
            0.5438717398461074,
            0.3474386235078175
          ],
          [
            0.5417356091603406,
            0.3594436779618263
          ],
          [
            0.5460078705318742,
            0.37144873241583515
          ],
          [
            0.5481440012176406,
            0.3834537868698437
          ],
          [
            0.5566885239607074,
            0.3942583358784516
          ],
          [
            0.5695053080753075,
            0.4038623794416586
          ],
          [
            0.5844582228756744,
            0.4110654121140639
          ],
          [
            0.6036833990475745,
            0.4170679393410683
          ],
          [
            0.6207724445337078,
            0.4218699611226717
          ],
          [
            0.6421337513913747,
            0.4230704665680727
          ],
          [
            0.6592227968775081,
            0.41826844478646913
          ],
          [
            0.6677673196205747,
            0.4062633903324604
          ],
          [
            0.6741757116778749,
            0.39665934676925335
          ],
          [
            0.680584103735175,
            0.3846542923152447
          ],
          [
            0.6848563651067082,
            0.3726492378612359
          ],
          [
            0.6848563651067082,
            0.36064418340722726
          ],
          [
            0.6869924957924748,
            0.34863912895321847
          ],
          [
            0.6015472683618077,
            0.3366340744992096
          ],
          [
            0.6143640524764078,
            0.334233063608408
          ],
          [
            0.6293169672767744,
            0.334233063608408
          ],
          [
            0.6421337513913747,
            0.33543356905380894
          ],
          [
            0.652814404820208,
            0.3378345799446106
          ],
          [
            0.6763118423636414,
            0.34023559083541227
          ],
          [
            0.680584103735175,
            0.33903508539001154
          ],
          [
            0.6827202344209414,
            0.3378345799446106
          ],
          [
            0.6869924957924748,
            0.3378345799446106
          ],
          [
            0.6912647571640083,
            0.33903508539001154
          ],
          [
            0.6656311889348081,
            0.3510401398440201
          ],
          [
            0.6699034503063416,
            0.3582431725164254
          ],
          [
            0.6763118423636414,
            0.36664671063423154
          ],
          [
            0.680584103735175,
            0.3738497433066368
          ],
          [
            0.6506782741344415,
            0.382253281424443
          ],
          [
            0.6592227968775081,
            0.3834537868698437
          ],
          [
            0.6677673196205747,
            0.3834537868698437
          ],
          [
            0.6763118423636414,
            0.3834537868698437
          ],
          [
            0.6827202344209414,
            0.3798522705336411
          ],
          [
            0.6100917911048743,
            0.3498396343986194
          ],
          [
            0.6207724445337078,
            0.3474386235078175
          ],
          [
            0.6335892286483079,
            0.3474386235078175
          ],
          [
            0.639997620705608,
            0.3510401398440201
          ],
          [
            0.6293169672767744,
            0.353441150734822
          ],
          [
            0.618636313847941,
            0.35224064528942106
          ],
          [
            0.6720395809921081,
            0.35224064528942106
          ],
          [
            0.6741757116778749,
            0.34863912895321847
          ],
          [
            0.680584103735175,
            0.34863912895321847
          ],
          [
            0.6848563651067082,
            0.3510401398440201
          ],
          [
            0.680584103735175,
            0.353441150734822
          ],
          [
            0.6763118423636414,
            0.353441150734822
          ],
          [
            0.6314530979625413,
            0.3978598522146543
          ],
          [
            0.646406012762908,
            0.39545884132385256
          ],
          [
            0.6613589275632749,
            0.3942583358784516
          ],
          [
            0.6677673196205747,
            0.3942583358784516
          ],
          [
            0.6699034503063416,
            0.3942583358784516
          ],
          [
            0.6720395809921081,
            0.39665934676925335
          ],
          [
            0.6720395809921081,
            0.3978598522146543
          ],
          [
            0.6699034503063416,
            0.40146136855085696
          ],
          [
            0.6677673196205747,
            0.4038623794416586
          ],
          [
            0.6634950582490413,
            0.40506288488705955
          ],
          [
            0.6506782741344415,
            0.4038623794416586
          ],
          [
            0.639997620705608,
            0.40146136855085696
          ],
          [
            0.6335892286483079,
            0.3978598522146543
          ],
          [
            0.6506782741344415,
            0.3978598522146543
          ],
          [
            0.6634950582490413,
            0.3978598522146543
          ],
          [
            0.6677673196205747,
            0.39906035766005515
          ],
          [
            0.6699034503063416,
            0.39906035766005515
          ],
          [
            0.6656311889348081,
            0.39906035766005515
          ],
          [
            0.6634950582490413,
            0.39906035766005515
          ],
          [
            0.6485421434486746,
            0.39906035766005515
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "003128",
  "objects": [],
  "mask_file": "./person_labeling/./003128.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A person stands against a light gray wall wearing a black beret white blouse black textured jacket with gold buttons and black pants creating a chic monochromatic look with subtle accents of gold and white.",
  "overall_past": "Before the current scene, the individual likely spent time carefully selecting and arranging their outfit, possibly trying on different pieces to achieve the desired monochromatic yet refined look. They may have paused in front of a mirror to adjust the fit of the black blazer, ensuring the gold buttons caught the light just right, and styled their hair to complement the black beret. The deliberate positioning against the wall and the raised hand suggest a moment of intentional self-presentation—perhaps preparing for a photoshoot, a social media post, or a special event—indicating that this pose was chosen after a brief moment of reflection and adjustment to perfect their image.",
  "overall_past_clean": "The individual stood in front of a mirror, meticulously adjusting their silhouette, testing the balance of form and detail, pausing to refine every element until the alignment of posture, gesture, and presence felt unmistakably intentional.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to turn slightly, perhaps toward a nearby mirror or reflective surface, to check their overall appearance and ensure the outfit’s polished look is perfectly aligned—confirming the subtle interplay of black, white, and gold in the lighting. This moment of self-assessment would naturally lead to a confident stride forward, as if stepping into a new scene, perhaps a photoshoot, a fashion event, or a quiet moment of personal empowerment in a cityscape.",
  "overall_future_clean": "A decisive step forward cuts through the air, the momentum carrying the figure into a new frame of presence—sharp, unapologetic, as if the world itself has shifted to accommodate the weight of that movement.",
  "future_scene_ok": true
}