{
  "video_path": "./ref_datasets/part2/5821502000.mp4",
  "start_time": 0.0,
  "end_time": 6.08,
  "image_path": "./003000.jpg",
  "represents_multiple_types": true,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/5821502000.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/person_5516082401647180436_1_5821502000.mp4_0.00_6.08.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/5821502000.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/face_5516082401647180436_1_5821502000.mp4_0.00_6.08.jpg",
      "type": "face"
    }
  ],
  "cross_video_duplicate": false,
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a loose-fitting gray coat over a white t-shirt. The coat appears to be made of a soft material, possibly wool or a similar fabric. The t-shirt is plain with no visible patterns or designs. The person also seems to be wearing dark-colored pants, though only a small portion is visible.",
        "clothing": {
          "vague": false,
          "clothing": [
            {
              "possible_names": [
                "jacket",
                "coat"
              ],
              "name": "jacket",
              "type": "top",
              "color": [
                "gray"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "t-shirt",
                "shirt"
              ],
              "name": "t-shirt",
              "type": "top",
              "color": [
                "white"
              ],
              "belonging_confident": true,
              "existence_confident": true
            }
          ]
        },
        "objects": [],
        "description": "The person is an adult female sitting in the foreground against a red wall. She is dressed in a neutral manner, wearing a gray coat over a white t-shirt and dark pants. Her expression is neutral, and she does not appear to be holding or interacting with any objects. The setting suggests an outdoor environment, possibly during the day given the lighting.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a calm and composed expression, suggesting a neutral emotional state.",
        "meaningful": true,
        "story": "The person is sitting against a red wall, possibly taking a moment to rest or reflect. The setting suggests an urban environment, and her attire indicates a casual yet stylish appearance.",
        "race": "asian",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is sitting against a vibrant red wall, wearing a gray coat over a white shirt, with their legs crossed and hands resting on their knees. Their posture suggests a relaxed yet contemplative state, possibly indicating they are deep in thought or simply enjoying a moment of solitude. The bright sunlight casts shadows on the wall, adding to the serene atmosphere, and the person's calm demeanor implies they might be taking a break from daily activities to reflect or meditate. The presence of a padlock on the wall hints at a secure location, perhaps a private space where the individual feels safe and undisturbed.",
        "intention": "The individual seeks a moment of quiet introspection in a secure and peaceful environment to recharge mentally and emotionally",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.39623888865822837,
            0.15793235024447164
          ],
          [
            0.39745479878925144,
            0.17902941583956358
          ],
          [
            0.399148773490673,
            0.20418261819415623
          ],
          [
            0.4024910660726684,
            0.2256017358845504
          ],
          [
            0.4070740304532505,
            0.24639190820159104
          ],
          [
            0.41680943132156417,
            0.26250559659231276
          ],
          [
            0.42886184262377874,
            0.26597452510601627
          ],
          [
            0.4437398476260049,
            0.27135200916774693
          ],
          [
            0.457768323804651,
            0.2732098039495882
          ],
          [
            0.4709324441495396,
            0.2758082088339266
          ],
          [
            0.48151534738994783,
            0.2673565748507384
          ],
          [
            0.49349373295193627,
            0.2594505687239309
          ],
          [
            0.5015440763462158,
            0.24575640221752185
          ],
          [
            0.506849959776515,
            0.22790643588575735
          ],
          [
            0.5090396933612369,
            0.20716373283396322
          ],
          [
            0.5120971742130461,
            0.18458411475968742
          ],
          [
            0.5144962236994789,
            0.16165311216677306
          ],
          [
            0.4072638049721718,
            0.08151272207340866
          ],
          [
            0.4150307366535777,
            0.06291178972632797
          ],
          [
            0.42553018821137295,
            0.05712793404778476
          ],
          [
            0.4378237864800862,
            0.05855551622216664
          ],
          [
            0.44965981592734655,
            0.06879816894178037
          ],
          [
            0.46639910680907115,
            0.07371624791748309
          ],
          [
            0.4770624570903324,
            0.06547905969872046
          ],
          [
            0.48821133729957394,
            0.0691522739867054
          ],
          [
            0.49810361578350976,
            0.07934078487454269
          ],
          [
            0.504733559631166,
            0.09393649236865777
          ],
          [
            0.45790167720544905,
            0.09641576507104137
          ],
          [
            0.4585492671955199,
            0.10695653933065909
          ],
          [
            0.4592860154452778,
            0.11570792381094877
          ],
          [
            0.4592402787435622,
            0.12706635616443776
          ],
          [
            0.45140295099644434,
            0.16713946206229074
          ],
          [
            0.45630805109228406,
            0.1662127254185853
          ],
          [
            0.4594560748054867,
            0.16600737606406843
          ],
          [
            0.463629802493822,
            0.16683223291679664
          ],
          [
            0.46710786592392695,
            0.16927597084373394
          ],
          [
            0.42078255152418503,
            0.11165034282144415
          ],
          [
            0.42754179586966834,
            0.10500092875389826
          ],
          [
            0.4353244514692397,
            0.1047638063392942
          ],
          [
            0.4416952505707741,
            0.11209064264776845
          ],
          [
            0.4342189563172204,
            0.109311294776422
          ],
          [
            0.42830873067889896,
            0.10848281055531175
          ],
          [
            0.4739815893627348,
            0.1148412514615942
          ],
          [
            0.47993539912360056,
            0.11037115807886477
          ],
          [
            0.4853598986353193,
            0.11264382752161176
          ],
          [
            0.4917421389193762,
            0.11899936877230488
          ],
          [
            0.48562346625895725,
            0.11510096655951606
          ],
          [
            0.4806664912473588,
            0.11279595308202915
          ],
          [
            0.44088491102059685,
            0.2118668174617505
          ],
          [
            0.4475091707138788,
            0.19166860031703162
          ],
          [
            0.45600896030664445,
            0.1789315328711555
          ],
          [
            0.4601321192014785,
            0.18228909893641396
          ],
          [
            0.4637558292774927,
            0.17768131109772536
          ],
          [
            0.47024651694865455,
            0.19353156745749173
          ],
          [
            0.47680246588729674,
            0.21490382044403641
          ],
          [
            0.4696815994523821,
            0.21382407378898097
          ],
          [
            0.462926912520613,
            0.21183282767654096
          ],
          [
            0.45947015626089915,
            0.21357107603991474
          ],
          [
            0.4551974547760827,
            0.2115550205190346
          ],
          [
            0.44843133226746607,
            0.21197042137226732
          ],
          [
            0.44524370446091605,
            0.20895139849375166
          ],
          [
            0.45546154933316363,
            0.19656185309092203
          ],
          [
            0.45963175105197085,
            0.1978598911926229
          ],
          [
            0.46313001733450665,
            0.19924055268524815
          ],
          [
            0.47194397697846097,
            0.2112046659938873
          ],
          [
            0.4623953207617715,
            0.19974518232244662
          ],
          [
            0.4594069186420668,
            0.1988034995775374
          ],
          [
            0.454177698422046,
            0.19703092556151133
          ]
        ],
        "visibility": [
          0.9999972581863403,
          1.949672423506854e-08,
          3.965174073528033e-06,
          2.027636786499764e-15,
          0.0007644668221473694,
          5.168967163626803e-06,
          1.4448901426861894e-17,
          2.2796024389368235e-23,
          5.040501491748728e-06,
          3.268854329920525e-17,
          2.5690249927379227e-09,
          6.51366601715081e-13,
          2.8862192397481135e-16,
          5.751177312163236e-08,
          4.49970371361086e-18,
          5.611787701198523e-10,
          1.5689315402411808e-09,
          1.6405016234344316e-09,
          2.8776869048168535e-17,
          2.4892468728637818e-14,
          2.3196369955055807e-13,
          1.7565150722820277e-11,
          7.519541327383195e-07,
          4.817672343416894e-14,
          9.597206022077089e-20,
          1.6671146699410038e-20,
          1.8006398238776256e-12,
          0.00014214393740985543,
          2.3294553841424204e-07
        ],
        "headpose": {
          "pitch": 19.307548009940778,
          "yaw": 0.9471318734785016,
          "roll": 1.476127249931639
        },
        "attributes": {
          "5 oClock Shadow": 0.0009162682690657675,
          "Arched Eyebrows": 0.016949312761425972,
          "Attractive": 0.22061926126480103,
          "Bags Under Eyes": 0.0058224075473845005,
          "Bald": 1.1310600029901252e-06,
          "Bangs": 0.002042581094428897,
          "Big Lips": 0.2972870171070099,
          "Big Nose": 0.012246845290064812,
          "Black Hair": 0.6257500648498535,
          "Blond Hair": 0.0003667958080768585,
          "Blurry": 0.01601380482316017,
          "Brown Hair": 0.06952325254678726,
          "Bushy Eyebrows": 0.03747539222240448,
          "Chubby": 0.03377196565270424,
          "Double Chin": 0.003975164610892534,
          "Eyeglasses": 0.0013206701260060072,
          "Goatee": 8.348529081558809e-05,
          "Gray Hair": 6.919352017575875e-05,
          "Heavy Makeup": 0.2865348160266876,
          "High Cheekbones": 0.05919934809207916,
          "Male": 0.01954597793519497,
          "Mouth Slightly Open": 0.7782623171806335,
          "Mustache": 3.0118975701043382e-05,
          "Narrow Eyes": 0.7093637585639954,
          "No Beard": 0.9985976815223694,
          "Oval Face": 0.3224371075630188,
          "Pale Skin": 0.0013125613331794739,
          "Pointy Nose": 0.16380761563777924,
          "Receding Hairline": 0.010529011487960815,
          "Rosy Cheeks": 0.004446213599294424,
          "Sideburns": 5.544755913433619e-05,
          "Smiling": 0.0072577940300107,
          "Straight Hair": 0.1267569661140442,
          "Wavy Hair": 0.31294992566108704,
          "Wearing Earrings": 0.11058002710342407,
          "Wearing Hat": 0.0008336496539413929,
          "Wearing Lipstick": 0.599696159362793,
          "Wearing Necklace": 0.015344735234975815,
          "Wearing Necktie": 0.0022644363343715668,
          "Young": 0.9858642816543579
        },
        "age": [
          0.09696927666664124,
          0.97117018699646,
          0.9946880340576172,
          0.7699450254440308,
          0.016444457694888115,
          2.9345605071284808e-05,
          2.345962457184214e-06,
          1.7794276274685217e-08
        ],
        "race": [
          0.8144521713256836,
          0.0011980354320257902,
          0.9890797734260559,
          0.07241061329841614,
          0.8415583372116089
        ],
        "gender": [
          0.015435714274644852,
          0.9866698384284973
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 0.04246453754603863,
          "disgust": 2.4453422398096336e-06,
          "fear": 0.18149235984310508,
          "happy": 0.350607861764729,
          "sad": 94.39008235931396,
          "surprise": 7.555980729989642e-07,
          "neutral": 5.03535158932209
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 315,
          "h": 354,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 30,
        "gender": {
          "Woman": 99.33987855911255,
          "Man": 0.6601161789149046
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 96.89509254068687,
          "indian": 0.863704975021182,
          "black": 0.035017925888437086,
          "white": 0.683769345061144,
          "middle eastern": 0.11350134831302454,
          "latino hispanic": 1.4089140018173458
        },
        "dominant_race": "asian"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.11588120460510254,
        0.003310200059786439,
        0.6627176403999329,
        0.987483561038971
      ]
    ],
    "face_boxes": [
      [
        0.4072180688381195,
        0.015498989261686802,
        0.517257809638977,
        0.2663429379463196
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.4607348450554742,
            0.4797581349874778
          ],
          [
            0.3398794940312704,
            0.4846087765344852
          ],
          [
            0.3162536359363132,
            0.8645756977167277
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.581590196079678,
            0.4749074934404704
          ],
          [
            0.6133942358228897,
            0.8564912951383821
          ],
          [
            0.5879510040283203,
            0.953504126078529
          ],
          [
            0.3944007050196329,
            0.9842248558762424
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.5570556511349148,
            0.977757333813566
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.4316568658616808,
            0.10625873586791178
          ],
          [
            0.4843607031504314,
            0.10464185535224267
          ],
          [
            0.4025788866678873,
            0.17578459804168375
          ],
          [
            0.518890803443061,
            0.17740147855735294
          ]
        ],
        "dw_hand_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_hand_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_face": [
          [
            0.4062136340671116,
            0.1272781825716102
          ],
          [
            0.40530494721730553,
            0.15638203185365432
          ],
          [
            0.4071223209169176,
            0.18225212010436023
          ],
          [
            0.4098483814663357,
            0.20650532783939696
          ],
          [
            0.414391815715366,
            0.22914165505876458
          ],
          [
            0.42438737106323243,
            0.24692734073112493
          ],
          [
            0.43347423956129283,
            0.2630961458878161
          ],
          [
            0.44710454230838353,
            0.2695636679504926
          ],
          [
            0.46073484505547413,
            0.27118054846616163
          ],
          [
            0.47527383465237083,
            0.2679467874348235
          ],
          [
            0.48799545054965554,
            0.261479265372147
          ],
          [
            0.4961736321979099,
            0.24531046021545574
          ],
          [
            0.5061691875457763,
            0.22914165505876458
          ],
          [
            0.5107126217948066,
            0.20812220835506615
          ],
          [
            0.5143473691940308,
            0.18386900062002934
          ],
          [
            0.5170734297434489,
            0.1596157928849926
          ],
          [
            0.5170734297434489,
            0.1321288241186176
          ],
          [
            0.414391815715366,
            0.08685616967988233
          ],
          [
            0.42166131051381434,
            0.07553800607019857
          ],
          [
            0.4289308053122627,
            0.07230424503886028
          ],
          [
            0.4371089869605171,
            0.07068736452319119
          ],
          [
            0.4452871686087715,
            0.07230424503886028
          ],
          [
            0.4680043398539226,
            0.07230424503886028
          ],
          [
            0.47709120835198293,
            0.06907048400752198
          ],
          [
            0.48617807685004344,
            0.07068736452319119
          ],
          [
            0.49435625849829784,
            0.07553800607019857
          ],
          [
            0.5025344401465522,
            0.08523928916421324
          ],
          [
            0.45800878450605614,
            0.10625873586791178
          ],
          [
            0.45800878450605614,
            0.11596001896192644
          ],
          [
            0.4589174713558621,
            0.1272781825716102
          ],
          [
            0.4589174713558621,
            0.13859634618129407
          ],
          [
            0.4480132291581896,
            0.16446643443199999
          ],
          [
            0.4534653502570259,
            0.16446643443199999
          ],
          [
            0.4598261582056682,
            0.1628495539163309
          ],
          [
            0.46618696615431054,
            0.1628495539163309
          ],
          [
            0.4725477741029526,
            0.1628495539163309
          ],
          [
            0.42166131051381434,
            0.11272625793058814
          ],
          [
            0.4289308053122627,
            0.10787561638358087
          ],
          [
            0.4362003001107109,
            0.10625873586791178
          ],
          [
            0.44346979490915933,
            0.10949249689924996
          ],
          [
            0.4362003001107109,
            0.11272625793058814
          ],
          [
            0.4289308053122627,
            0.11434313844625735
          ],
          [
            0.4725477741029526,
            0.10787561638358087
          ],
          [
            0.47981726890140114,
            0.10464185535224267
          ],
          [
            0.4870867636998494,
            0.10625873586791178
          ],
          [
            0.49435625849829784,
            0.10949249689924996
          ],
          [
            0.4870867636998494,
            0.11272625793058814
          ],
          [
            0.47981726890140114,
            0.11110937741491905
          ],
          [
            0.44074373435974123,
            0.20650532783939696
          ],
          [
            0.4480132291581896,
            0.1919534031983749
          ],
          [
            0.456191410806444,
            0.18548588113569842
          ],
          [
            0.46073484505547413,
            0.18548588113569842
          ],
          [
            0.4652782793045044,
            0.18548588113569842
          ],
          [
            0.4734564609527588,
            0.1919534031983749
          ],
          [
            0.480725955751207,
            0.20488844732372785
          ],
          [
            0.47436514780256495,
            0.20973908887073525
          ],
          [
            0.4680043398539226,
            0.21297284990207344
          ],
          [
            0.46073484505547413,
            0.21297284990207344
          ],
          [
            0.4534653502570259,
            0.21297284990207344
          ],
          [
            0.44710454230838353,
            0.20973908887073525
          ],
          [
            0.44346979490915933,
            0.20488844732372785
          ],
          [
            0.4516479765574137,
            0.19842092526105137
          ],
          [
            0.46073484505547413,
            0.1968040447453823
          ],
          [
            0.46982171355353464,
            0.19842092526105137
          ],
          [
            0.478908582051595,
            0.20488844732372785
          ],
          [
            0.46982171355353464,
            0.20003780577672048
          ],
          [
            0.46073484505547413,
            0.20003780577672048
          ],
          [
            0.4516479765574137,
            0.20165468629238958
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "003000",
  "objects": [],
  "mask_file": "./person_labeling/./003000.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A person sits against a vibrant red wall with two padlocks attached to it wearing a gray coat over a white shirt and blue pants in an urban setting with strong sunlight casting shadows on the wall",
  "overall_past": "Before the current scene, the individual likely arrived at this secluded urban spot after a period of movement—perhaps walking through the city, seeking a quiet corner away from the noise and rush. The gray coat suggests they were prepared for the weather, possibly having left home earlier in the day. The presence of two padlocks on the red wall indicates this is a secured or private area, possibly a gate, fence, or enclosure that has been locked for some time. It’s plausible that the person unlocked one of the padlocks, entered or accessed this space, and then chose to sit there, perhaps drawn by the contrast of the vivid red wall against the bright sunlight and the sense of enclosure it provides. The act of sitting with legs crossed and hands resting calmly on knees suggests a deliberate pause—perhaps after a journey, a decision, or a moment of emotional weight—leading to this reflective stillness. The sunlight casting long shadows may symbolize the passage of time or the transition from action to introspection.",
  "overall_past_clean": "The figure moved swiftly through the city’s winding alleys, shoulders tense with purpose, until reaching the secluded spot where they halted, breath steady, hands briefly gripping the cold metal of a padlock before turning it with a decisive click, stepping into the quiet enclosure as if crossing a threshold into stillness.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual may slowly rise from the wall, adjusting their coat as they take a deep breath, signaling a transition from reflection to action. The sunlight, now shifting slightly, casts a longer shadow across the ground, suggesting the passage of time. They might glance at the padlock briefly—perhaps checking its security or simply acknowledging the boundary it represents—before turning away and walking down the urban path, their steps deliberate yet unhurried. This moment of stillness has likely provided clarity, and they are now moving forward with renewed purpose, perhaps toward a destination that had been lingering in their thoughts during the pause.",
  "overall_future_clean": "The figure strides forward with unwavering resolve, each step echoing the weight of decision made, the city’s pulse now syncing with the rhythm of purpose-driven motion.",
  "future_scene_ok": true
}