{
  "video_path": "./ref_datasets/part2/4788140007.mp4",
  "start_time": 0.0,
  "end_time": 6.08,
  "image_path": "./001599.jpg",
  "represents_multiple_types": true,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/4788140007.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/person_3397165204458686302_1_4788140007.mp4_0.00_6.08.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/4788140007.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/face_3397165204458686302_1_4788140007.mp4_0.00_6.08.jpg",
      "type": "face"
    }
  ],
  "cross_video_duplicate": false,
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "unknown",
        "emotion": "neutral",
        "clothing_description": "The person appears to be unclothed from the shoulders up, showing bare skin.",
        "clothing": [],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "flowers",
              "floral arrangement"
            ],
            "name": "flowers",
            "position": "head"
          }
        ],
        "description": "The person is an adult with a shaved head and a neutral expression. They are unclothed from the shoulders up, revealing bare skin. There is a floral arrangement consisting of various small flowers placed on the side of their face, extending from the forehead down towards the cheek. The background is plain and light-colored.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a neutral expression, neither displaying strong emotions nor engaging directly with the viewer.",
        "meaningful": true,
        "story": "The person seems to be part of an artistic or conceptual photoshoot, possibly exploring themes of nature, beauty, or identity. The flowers adorning their face suggest a connection to nature or a symbolic representation of growth and change.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person in the image appears to be engaged in a creative or artistic endeavor, as evidenced by the delicate arrangement of small flowers adorning their face. Their expression is serene and contemplative, suggesting a deep connection with the artistry involved. The positioning of the flowers around their eye and cheek indicates a deliberate and thoughtful placement, possibly aiming to evoke a sense of beauty and nature intertwined with human form. The overall atmosphere conveys a sense of calm and introspection, hinting at a motivation rooted in self-expression and the exploration of aesthetic boundaries.",
        "intention": "The intention is to merge natural elements with the human form as a means of expressing inner tranquility and pushing the boundaries of aesthetic perception",
        "intention_ok": true
      },
      "hoi": [
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "head",
            "action": [
              "wear"
            ]
          },
          "object": 0,
          "deleted": true
        },
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "head",
            "action": [
              [
                "head",
                "wear"
              ]
            ]
          },
          "object": 1
        },
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "head",
            "action": [
              "wear"
            ]
          },
          "object": 2,
          "deleted": true
        }
      ],
      "facex_detailing": {
        "landmarks": [
          [
            0.5532999272691086,
            0.421043975012643
          ],
          [
            0.5606453563502458,
            0.48678725106375564
          ],
          [
            0.5687783694135891,
            0.5527055263519287
          ],
          [
            0.5790894552025877,
            0.6178708076477051
          ],
          [
            0.5876367076167038,
            0.6844393866402763
          ],
          [
            0.6060192894074135,
            0.7477068219866071
          ],
          [
            0.6262308066444737,
            0.8057468278067452
          ],
          [
            0.6473732485070026,
            0.8634065900530133
          ],
          [
            0.6798154706567792,
            0.8856771332877023
          ],
          [
            0.7273981794881235,
            0.8701788357325962
          ],
          [
            0.7718326692535942,
            0.8104601587568011
          ],
          [
            0.8184300808102958,
            0.7475157465253558
          ],
          [
            0.856436682083378,
            0.6712367194039481
          ],
          [
            0.8800445522813658,
            0.5719735281808036
          ],
          [
            0.8851076787437446,
            0.4693272454398019
          ],
          [
            0.8846839988670712,
            0.36540024621146067
          ],
          [
            0.8823613904948746,
            0.26081069878169466
          ],
          [
            0.5315992481607412,
            0.3421802520751953
          ],
          [
            0.5361357878926876,
            0.29376254762922016
          ],
          [
            0.5547332654158319,
            0.2849658557346889
          ],
          [
            0.5773774166840927,
            0.2850586005619594
          ],
          [
            0.5981529754686302,
            0.293830190386091
          ],
          [
            0.6449682873374384,
            0.2633837120873587
          ],
          [
            0.6763022634466844,
            0.22382569313049316
          ],
          [
            0.7113688322964922,
            0.19684253420148576
          ],
          [
            0.7480430561284135,
            0.19853036744253977
          ],
          [
            0.7816304669915033,
            0.2253230128969465
          ],
          [
            0.6245125967876187,
            0.3482494354248047
          ],
          [
            0.6217100409558043,
            0.4025084972381592
          ],
          [
            0.6198716137691268,
            0.4516455445970808
          ],
          [
            0.6151692075821172,
            0.5049361501421247
          ],
          [
            0.6176414815792148,
            0.5699763298034668
          ],
          [
            0.6268249281316197,
            0.569859504699707
          ],
          [
            0.639012237353849,
            0.5728754316057477
          ],
          [
            0.6549515666556545,
            0.5567446776798793
          ],
          [
            0.6740338570089079,
            0.5464421340397426
          ],
          [
            0.5620587550136926,
            0.4009420871734619
          ],
          [
            0.5682849354883989,
            0.3666463920048305
          ],
          [
            0.5902372908229674,
            0.35831165313720703
          ],
          [
            0.6085282329336873,
            0.37835683141435894
          ],
          [
            0.5923656599479727,
            0.3933932100023542
          ],
          [
            0.5735483871789516,
            0.40249763216291157
          ],
          [
            0.6889020878006704,
            0.341259275163923
          ],
          [
            0.7028798021492548,
            0.3013812133244106
          ],
          [
            0.72465718339663,
            0.2878474167415074
          ],
          [
            0.7484725403067256,
            0.2999518598828997
          ],
          [
            0.73195732185351,
            0.32584987367902485
          ],
          [
            0.7072959026221983,
            0.33436107635498047
          ],
          [
            0.6202224838031855,
            0.6899828229631696
          ],
          [
            0.6230942303248282,
            0.6619746344430106
          ],
          [
            0.6331978806161455,
            0.6372081211635044
          ],
          [
            0.6460216485845324,
            0.6415999276297433
          ],
          [
            0.659112414428299,
            0.6272679056440081
          ],
          [
            0.6922432316101289,
            0.6396726880754743
          ],
          [
            0.7294097967928141,
            0.6558330399649483
          ],
          [
            0.7019070865519876,
            0.6929582187107631
          ],
          [
            0.6752503703464754,
            0.7203225408281598
          ],
          [
            0.656436477729585,
            0.7307893208095005
          ],
          [
            0.6426124920170488,
            0.7291902133396694
          ],
          [
            0.6297285641693244,
            0.7163713318961007
          ],
          [
            0.6265320157565709,
            0.6859948975699288
          ],
          [
            0.6396142458626335,
            0.6746058464050293
          ],
          [
            0.6499595599598251,
            0.6685357775006976
          ],
          [
            0.6684460387498673,
            0.6661334037780762
          ],
          [
            0.7195916498562187,
            0.6594531195504325
          ],
          [
            0.6701540227929529,
            0.6771861485072544
          ],
          [
            0.6518027842310923,
            0.6823761122567313
          ],
          [
            0.6378763696661086,
            0.6800063678196498
          ]
        ],
        "visibility": [
          0.9999371767044067,
          3.170022300214015e-10,
          1.2528083971119486e-05,
          2.7687474166669668e-14,
          0.9906478524208069,
          0.9980236291885376,
          1.2807266358549896e-10,
          2.77472814690094e-13,
          0.9982006549835205,
          7.42298410238984e-12,
          2.458877474964538e-07,
          1.6541771424849472e-11,
          0.1335715353488922,
          0.0015015238896012306,
          2.131146636941139e-08,
          3.1609866633919292e-12,
          3.8049526551731105e-07,
          2.5542280096546577e-11,
          1.9894898228844937e-10,
          1.0149368845357998e-10,
          5.380757772278854e-18,
          3.027737314453195e-21,
          4.1136324568924465e-08,
          8.9420510926419e-12,
          2.2635868600046282e-17,
          8.532851753706701e-17,
          9.335521721984263e-13,
          1.356287857631061e-13,
          2.433596033024621e-11
        ],
        "headpose": {
          "pitch": -4.085131019942749,
          "yaw": 24.99873141886762,
          "roll": -11.376741303298527
        },
        "attributes": {
          "5 oClock Shadow": 0.13866785168647766,
          "Arched Eyebrows": 0.06527069956064224,
          "Attractive": 0.30894598364830017,
          "Bags Under Eyes": 0.5322553515434265,
          "Bald": 0.07234527170658112,
          "Bangs": 3.104798088315874e-05,
          "Big Lips": 0.5952094793319702,
          "Big Nose": 0.2691423296928406,
          "Black Hair": 0.009626648388803005,
          "Blond Hair": 0.039262428879737854,
          "Blurry": 0.000331491872202605,
          "Brown Hair": 0.003681372618302703,
          "Bushy Eyebrows": 0.0365961454808712,
          "Chubby": 0.023060135543346405,
          "Double Chin": 0.006866297218948603,
          "Eyeglasses": 0.004254805389791727,
          "Goatee": 0.007038035895675421,
          "Gray Hair": 0.03525281324982643,
          "Heavy Makeup": 0.005942649208009243,
          "High Cheekbones": 0.08104594796895981,
          "Male": 0.9893842339515686,
          "Mouth Slightly Open": 0.9946746826171875,
          "Mustache": 0.0011987026082351804,
          "Narrow Eyes": 0.06434345990419388,
          "No Beard": 0.957832932472229,
          "Oval Face": 0.10991790145635605,
          "Pale Skin": 0.20927342772483826,
          "Pointy Nose": 0.21998535096645355,
          "Receding Hairline": 0.18814469873905182,
          "Rosy Cheeks": 0.0023831576108932495,
          "Sideburns": 0.0012512076646089554,
          "Smiling": 0.04645852744579315,
          "Straight Hair": 0.13617295026779175,
          "Wavy Hair": 0.0023744520731270313,
          "Wearing Earrings": 0.026325678452849388,
          "Wearing Hat": 0.0013020836049690843,
          "Wearing Lipstick": 0.01727324351668358,
          "Wearing Necklace": 0.005383507814258337,
          "Wearing Necktie": 0.24671657383441925,
          "Young": 0.9062896370887756
        },
        "age": [
          0.008726769126951694,
          0.3644874691963196,
          0.9768490195274353,
          0.857273519039154,
          0.2910977602005005,
          0.006962710991501808,
          0.0014228189829736948,
          5.418612636276521e-05
        ],
        "race": [
          0.9984588623046875,
          0.00466343155130744,
          0.4190969169139862,
          0.02677985653281212,
          0.06852050870656967
        ],
        "gender": [
          0.9747621417045593,
          0.03041940927505493
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 2.267903834581375,
          "disgust": 8.834869049678673e-05,
          "fear": 9.491771459579468,
          "happy": 6.610580533742905,
          "sad": 65.67848324775696,
          "surprise": 0.012281208182685077,
          "neutral": 15.9388929605484
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 2052,
          "h": 2159,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 38,
        "gender": {
          "Woman": 24.614757299423218,
          "Man": 75.38524866104126
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 1.4446931118072825e-05,
          "indian": 1.4056016084396106e-05,
          "black": 2.058638370883159e-07,
          "white": 99.88101720809937,
          "middle eastern": 0.06297843065112829,
          "latino hispanic": 0.055975792929530144
        },
        "dominant_race": "white"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.4865335524082184,
        0.0033075488172471523,
        0.9991901516914368,
        0.9843593835830688
      ]
    ],
    "face_boxes": [
      [
        0.5289028286933899,
        0.019074028357863426,
        0.8631482124328613,
        0.8897875547409058
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.8714915609889561,
            0.9203502217249957
          ],
          [
            1.0628490859799913,
            0.93521426152811
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.5827766987217796,
            0.37462761752494345
          ],
          [
            0.718181731025378,
            0.3194183268276621
          ],
          [
            0.5525623526705635,
            0.4298369082222251
          ],
          [
            0.893872558063931,
            0.36613388049459245
          ]
        ],
        "dw_hand_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_hand_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_face": [
          [
            0.5480861532555686,
            0.3873682230704699
          ],
          [
            0.5548004523780611,
            0.4744290276315679
          ],
          [
            0.5626338013543023,
            0.5551195294199024
          ],
          [
            0.5794195491605335,
            0.6400568997234125
          ],
          [
            0.5973243468205135,
            0.7143770987389837
          ],
          [
            0.6230624934567345,
            0.799314469042494
          ],
          [
            0.6454434905317095,
            0.8608940625125387
          ],
          [
            0.6879673849741619,
            0.8842518393460042
          ],
          [
            0.7304912794166142,
            0.8672643652853018
          ],
          [
            0.7685389744440713,
            0.8226722458759592
          ],
          [
            0.8043485697640312,
            0.7632160866635022
          ],
          [
            0.8345629158152473,
            0.6995130589358696
          ],
          [
            0.8591820125977196,
            0.6166991228899471
          ],
          [
            0.8681344114277099,
            0.540255489616788
          ],
          [
            0.8726106108427047,
            0.45107125079810256
          ],
          [
            0.8726106108427047,
            0.36613388049459245
          ],
          [
            0.8703725111352073,
            0.28119651019108255
          ],
          [
            0.53801470457183,
            0.3321589323731883
          ],
          [
            0.5503242529630661,
            0.3109245897973108
          ],
          [
            0.5671100007692973,
            0.30667772128213544
          ],
          [
            0.5838957485755284,
            0.3109245897973108
          ],
          [
            0.6006814963817596,
            0.31517145831248644
          ],
          [
            0.6555149392154482,
            0.28331994444867026
          ],
          [
            0.682372135705418,
            0.2557152991000292
          ],
          [
            0.7125864817566342,
            0.23023408800897632
          ],
          [
            0.745038927515348,
            0.2217403509786253
          ],
          [
            0.7741342237128152,
            0.23448095652415174
          ],
          [
            0.629776792579227,
            0.3597635777218293
          ],
          [
            0.6264196430179808,
            0.41072599990393527
          ],
          [
            0.6241815433104833,
            0.4616884220860413
          ],
          [
            0.620824393749237,
            0.5105274100105596
          ],
          [
            0.611871994919247,
            0.5678601349654289
          ],
          [
            0.625300593164232,
            0.5742304377381922
          ],
          [
            0.6398482412629658,
            0.5699835692230167
          ],
          [
            0.6611101884841919,
            0.5614898321926656
          ],
          [
            0.6812530858516693,
            0.550872660904727
          ],
          [
            0.5615147515005535,
            0.3937385258432332
          ],
          [
            0.5749433497455385,
            0.36401044623700474
          ],
          [
            0.593967197259267,
            0.3597635777218293
          ],
          [
            0.6096338952117496,
            0.3809979202977068
          ],
          [
            0.5950862471130159,
            0.39586196010082114
          ],
          [
            0.5783004993067847,
            0.40223226287358427
          ],
          [
            0.6834911855591668,
            0.3470229721763027
          ],
          [
            0.7013959832191468,
            0.3088011555397231
          ],
          [
            0.727134129855368,
            0.2981839842517844
          ],
          [
            0.7517532266378403,
            0.3109245897973108
          ],
          [
            0.7327293791241116,
            0.33852923514595185
          ],
          [
            0.7081102823416393,
            0.3491464064338904
          ],
          [
            0.6185862940417396,
            0.6973896246782818
          ],
          [
            0.6241815433104833,
            0.6719084135872287
          ],
          [
            0.6364910917017195,
            0.652797505268939
          ],
          [
            0.6465625403854582,
            0.6506740710113512
          ],
          [
            0.6588720887766945,
            0.6421803339810005
          ],
          [
            0.6935626342429054,
            0.6443037682385879
          ],
          [
            0.727134129855368,
            0.6570443737841144
          ],
          [
            0.709229332195388,
            0.6973896246782818
          ],
          [
            0.6868483351204131,
            0.729241138542098
          ],
          [
            0.6599911386304431,
            0.7462286126028002
          ],
          [
            0.6420863409704632,
            0.7398583098300368
          ],
          [
            0.6286577427254784,
            0.720747401511747
          ],
          [
            0.6230624934567345,
            0.6973896246782818
          ],
          [
            0.6364910917017195,
            0.6867724533903431
          ],
          [
            0.6521577896542019,
            0.6804021506175798
          ],
          [
            0.6857292852666642,
            0.6676615450720533
          ],
          [
            0.7204198307328754,
            0.66129124229929
          ],
          [
            0.6879673849741619,
            0.6825255848751675
          ],
          [
            0.6543958893616993,
            0.6995130589358696
          ],
          [
            0.638729191409217,
            0.6995130589358696
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "001599",
  "objects": [
    {
      "box": [
        0.5463984608650208,
        0.17142058908939362,
        0.57832270860672,
        0.24817417562007904
      ],
      "name": "flowers",
      "possible_names": [
        "flowers"
      ],
      "deleted": true
    },
    {
      "box": [
        0.47704052925109863,
        0.16930055618286133,
        0.6194547414779663,
        0.7499322891235352
      ],
      "name": "flowers",
      "possible_names": [
        "flowers"
      ]
    },
    {
      "box": [
        0.4957254230976105,
        0.18522489070892334,
        0.5354564785957336,
        0.27772992849349976
      ],
      "name": "flowers",
      "possible_names": [
        "flowers"
      ],
      "deleted": true
    }
  ],
  "mask_file": "./person_labeling/./001599.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A serene setting with soft lighting and a neutral backdrop features delicate flowers adorning the side creating an artistic and ethereal atmosphere",
  "overall_past": "Before the current scene, the individual likely spent time carefully selecting and arranging the delicate flowers, perhaps gathering them from a nearby garden or natural setting. They may have been inspired by a moment of quiet reflection or a creative vision, leading them to experiment with floral adornment as a form of personal expression. The deliberate placement of the flowers around their face suggests a process of trial and adjustment, aiming to achieve a harmonious blend of nature and self, possibly in preparation for a photo, performance, or private ritual. This act of creation was likely preceded by a meditative state, where the individual sought to connect with beauty, impermanence, and the subtle interplay between human presence and the natural world.",
  "overall_past_clean": "The individual moved with quiet intention through a sun-dappled space, pausing to pluck and examine each bloom with focused care, their hands tracing the edges of petals and stems as if listening to the silent language of growth, then arranging them in deliberate patterns that mirrored a vision forming in stillness.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual may slowly rise, the delicate flowers still gently resting in place, and step forward into a soft, diffused light that spills across the space—perhaps signaling a transition from introspection to expression. As they move, the flowers might begin to subtly shift, their petals catching the light and casting faint, ephemeral shadows, symbolizing the fleeting nature of beauty and the moment’s artistic culmination. This motion could mark the beginning of a quiet performance or a gesture of release—perhaps placing the flowers down, allowing them to fall like silent confessions, or stepping into a new space where the artistry continues in a different form, such as a painted canvas or a recorded moment, preserving the ethereal essence of the scene.",
  "overall_future_clean": "The figure rises with deliberate grace, each step dissolving the stillness into motion, the air itself seeming to ripple as light enfolds them, petals trembling like whispered secrets before drifting downward in a slow, inevitable descent, marking the moment when silence yields to creation and the ephemeral becomes eternal.",
  "future_scene_ok": true
}