{
  "video_path": "./ref_datasets/part2/4820997001.mp4",
  "start_time": 0.0,
  "end_time": 6.08,
  "image_path": "./001492.jpg",
  "represents_multiple_types": true,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/4769799000.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/person_6303405833719979819_1_4769799000.mp4_0.00_6.08.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/4769799000.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/face_6303405833719979819_1_4769799000.mp4_0.00_6.08.jpg",
      "type": "face"
    },
    {
      "video_path": "./ref_datasets/part2/4769799001.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/person_5919362314109869334_1_4769799001.mp4_0.00_6.08.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/4769799001.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/face_5919362314109869334_1_4769799001.mp4_0.00_6.08.jpg",
      "type": "face"
    },
    {
      "video_path": "./ref_datasets/part2/4820997000.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/person_-5568736687890508324_1_4820997000.mp4_0.00_6.08.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/4820997000.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/face_-5568736687890508324_1_4820997000.mp4_0.00_6.08.jpg",
      "type": "face"
    },
    {
      "video_path": "./ref_datasets/part2/4820997001.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/person_-1011199542531272048_1_4820997001.mp4_0.00_6.08.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/4820997001.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/face_-1011199542531272048_1_4820997001.mp4_0.00_6.08.jpg",
      "type": "face"
    }
  ],
  "cross_video_duplicate": true,
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a sleeveless, ribbed tank top in a mustard yellow color. The top fits closely to the body, highlighting the shoulders and arms.",
        "clothing": [
          {
            "possible_names": [
              "sleeveless top",
              "tank top",
              "ribbed top"
            ],
            "name": "tank top",
            "type": "top",
            "color": [
              "mustard yellow"
            ]
          }
        ],
        "objects": [],
        "description": "The person is an adult female with a neutral expression. She has shoulder-length braided hair with a mix of dark roots and lighter tips. She is wearing a mustard yellow ribbed tank top that fits closely to her body. There are no additional objects or accessories visible in the image.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to have a calm and composed expression, with no strong emotions displayed.",
        "meaningful": false,
        "story": "unknown",
        "race": "black",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is standing against a plain background wearing a yellow sleeveless top and has long braided hair that appears to be dyed at the ends. They seem to be posing for a photograph, possibly for identification or a profile picture, as they are looking directly at the camera with a neutral expression. The individual's posture is upright and relaxed, suggesting confidence or a desire to present themselves clearly. There are no other people or objects in the image, focusing all attention on the person and their appearance.",
        "intention": "They are intentionally presenting themselves clearly and confidently for identification or a professional profile to make a strong and neutral impression",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.3455105236913792,
            0.4187803872284435
          ],
          [
            0.35248058618061123,
            0.44698270089214753
          ],
          [
            0.36567069392986395,
            0.4720778664662725
          ],
          [
            0.37841041138563203,
            0.49916435622033617
          ],
          [
            0.39792344538623065,
            0.5233990880350272
          ],
          [
            0.4266657995799231,
            0.5403138383513405
          ],
          [
            0.45563785298160775,
            0.5524388654246216
          ],
          [
            0.48543580398357733,
            0.5641348672055063
          ],
          [
            0.5158290193194434,
            0.5684403616757621
          ],
          [
            0.5533582191618662,
            0.5663557705425081
          ],
          [
            0.5884097262034341,
            0.5539794733836537
          ],
          [
            0.6265338104237954,
            0.5352495249183405
          ],
          [
            0.6554158775894731,
            0.510844200885012
          ],
          [
            0.6747399309955577,
            0.48060947010914484
          ],
          [
            0.6770685227459701,
            0.4465372357340086
          ],
          [
            0.6781583314219479,
            0.41277749345061326
          ],
          [
            0.6761366807594502,
            0.37356433398312044
          ],
          [
            0.35968199435365267,
            0.3879009067302659
          ],
          [
            0.3796575693226365,
            0.37588464397759663
          ],
          [
            0.40356838772536585,
            0.37612488683135736
          ],
          [
            0.42997306288865506,
            0.3773513062014466
          ],
          [
            0.4547027655379482,
            0.3832588864579087
          ],
          [
            0.505568087037909,
            0.38213453966946825
          ],
          [
            0.5334462630685675,
            0.36988281387658345
          ],
          [
            0.5619619102074356,
            0.36013501023962385
          ],
          [
            0.5921869633689759,
            0.3568835252452464
          ],
          [
            0.6234751649634548,
            0.3668640856054567
          ],
          [
            0.48348157967209193,
            0.4105074724803368
          ],
          [
            0.48471263697538425,
            0.4293950874713205
          ],
          [
            0.4875711248034522,
            0.4473766652423711
          ],
          [
            0.49029540902092345,
            0.4672165941269625
          ],
          [
            0.46816639408232674,
            0.48185889990556807
          ],
          [
            0.4830579921051308,
            0.48477068153165637
          ],
          [
            0.49610911513131767,
            0.4861658754448096
          ],
          [
            0.5120269267016618,
            0.4803707756456875
          ],
          [
            0.5235982795871754,
            0.47869024706028757
          ],
          [
            0.39475317203178606,
            0.41294282114221936
          ],
          [
            0.41198875002129365,
            0.40441264471127875
          ],
          [
            0.4354246868027581,
            0.40558963677003274
          ],
          [
            0.4538407562901734,
            0.41743647869498957
          ],
          [
            0.4328838104924197,
            0.41729912974295164
          ],
          [
            0.4132828325190872,
            0.41708733687798183
          ],
          [
            0.5292499344815652,
            0.4104615189489864
          ],
          [
            0.5458169483003162,
            0.3970147051271938
          ],
          [
            0.5658470548649944,
            0.3941898622505722
          ],
          [
            0.5900302383634779,
            0.3976923211167256
          ],
          [
            0.5716428080563823,
            0.4043090506678536
          ],
          [
            0.549842391695295,
            0.4080246892181181
          ],
          [
            0.4496948193620752,
            0.5078205312291781
          ],
          [
            0.46765823465175727,
            0.5003007131318251
          ],
          [
            0.48503303483680443,
            0.4954800490112532
          ],
          [
            0.5002087765900546,
            0.4963553607818626
          ],
          [
            0.5166347634224664,
            0.4938089723388354
          ],
          [
            0.541976733434768,
            0.49890864292780557
          ],
          [
            0.5710885473029322,
            0.5044010930118107
          ],
          [
            0.544040337567607,
            0.5170582816359542
          ],
          [
            0.5191681039396417,
            0.5266279530667124
          ],
          [
            0.5017906282313916,
            0.5283536407919157
          ],
          [
            0.48592164100162566,
            0.5258617826160931
          ],
          [
            0.4677578464386955,
            0.519103907190618
          ],
          [
            0.4576669444482793,
            0.5086485295778229
          ],
          [
            0.4859317098345076,
            0.508572995059547
          ],
          [
            0.5017589968979043,
            0.5119605499009291
          ],
          [
            0.5162407649257196,
            0.5117547351689565
          ],
          [
            0.5605590811482182,
            0.5055304754348028
          ],
          [
            0.5159507793724222,
            0.5096552525602636
          ],
          [
            0.5011574157962093,
            0.5076143933548815
          ],
          [
            0.48533817113391936,
            0.5060090222883792
          ]
        ],
        "visibility": [
          1.0,
          0.5125251412391663,
          7.493295761662466e-09,
          1.1741085534366924e-11,
          0.9984081387519836,
          0.9968405961990356,
          0.0042717354372143745,
          4.019320840598084e-06,
          0.10977649688720703,
          0.006629678420722485,
          1.346070493819659e-19,
          1.6784417411486174e-08,
          4.215502031001961e-06,
          7.007252173256082e-14,
          0.16577965021133423,
          1.8599963149540377e-12,
          4.320898361873972e-14,
          2.735109250195933e-09,
          4.765531028062993e-15,
          2.144697042183452e-08,
          4.134658049204449e-27,
          3.238403697092007e-20,
          0.00011410584556870162,
          0.9995864033699036,
          2.1597818206185032e-13,
          4.2182824074032954e-12,
          1.9168506781852557e-09,
          8.67619073374043e-13,
          9.980112337948117e-15
        ],
        "headpose": {
          "pitch": -12.646803880404997,
          "yaw": 5.9348657754926775,
          "roll": -7.923479621210121
        },
        "attributes": {
          "5 oClock Shadow": 0.0009335445356555283,
          "Arched Eyebrows": 0.25839006900787354,
          "Attractive": 0.24913078546524048,
          "Bags Under Eyes": 0.25676849484443665,
          "Bald": 2.2876029106555507e-05,
          "Bangs": 3.147896859445609e-05,
          "Big Lips": 0.6069541573524475,
          "Big Nose": 0.7615763545036316,
          "Black Hair": 0.4790264070034027,
          "Blond Hair": 0.00033967685885727406,
          "Blurry": 0.00015701589290983975,
          "Brown Hair": 0.023078709840774536,
          "Bushy Eyebrows": 0.37132591009140015,
          "Chubby": 0.12241042405366898,
          "Double Chin": 0.0037875911220908165,
          "Eyeglasses": 0.0006957040168344975,
          "Goatee": 0.00017392149311490357,
          "Gray Hair": 6.972227856749669e-05,
          "Heavy Makeup": 0.27233976125717163,
          "High Cheekbones": 0.2983691394329071,
          "Male": 0.0065236459486186504,
          "Mouth Slightly Open": 0.0014145815512165427,
          "Mustache": 0.00026310308021493256,
          "Narrow Eyes": 0.12352827936410904,
          "No Beard": 0.9940949082374573,
          "Oval Face": 0.28701719641685486,
          "Pale Skin": 0.00041557158692739904,
          "Pointy Nose": 0.00997774675488472,
          "Receding Hairline": 0.6091948747634888,
          "Rosy Cheeks": 0.0010230609914287925,
          "Sideburns": 2.277680869156029e-05,
          "Smiling": 0.10837001353502274,
          "Straight Hair": 0.47815096378326416,
          "Wavy Hair": 0.037187326699495316,
          "Wearing Earrings": 0.6921045780181885,
          "Wearing Hat": 0.0003934930427931249,
          "Wearing Lipstick": 0.42482757568359375,
          "Wearing Necklace": 0.10160627216100693,
          "Wearing Necktie": 7.660625851713121e-05,
          "Young": 0.9981076717376709
        },
        "age": [
          0.13385462760925293,
          0.9976534247398376,
          0.9787769913673401,
          0.06559431552886963,
          0.0026049416046589613,
          3.388160257600248e-05,
          3.7567199342447566e-06,
          1.8463323669948295e-07
        ],
        "race": [
          0.012948361225426197,
          0.7213417291641235,
          0.572789192199707,
          0.912446141242981,
          0.43540170788764954
        ],
        "gender": [
          0.0011775571620091796,
          0.9992241859436035
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 0.2494944660595696,
          "disgust": 4.9469300531817306e-08,
          "fear": 0.04704422338711042,
          "happy": 0.1142138129851147,
          "sad": 29.108044015402314,
          "surprise": 4.613247615754889e-05,
          "neutral": 70.48115486131252
        },
        "dominant_emotion": "neutral",
        "region": {
          "x": 0,
          "y": 0,
          "w": 501,
          "h": 758,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 30,
        "gender": {
          "Woman": 87.03020215034485,
          "Man": 12.969796359539032
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 7.17295695269621,
          "indian": 12.595283973779205,
          "black": 5.814076639523907,
          "white": 16.183849730032716,
          "middle eastern": 15.9383441879339,
          "latino hispanic": 42.29548367315726
        },
        "dominant_race": "latino hispanic"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.007321741431951523,
        0.23813235759735107,
        0.9989981055259705,
        0.9906550049781799
      ]
    ],
    "face_boxes": [
      [
        0.3558739125728607,
        0.29839256405830383,
        0.6657851934432983,
        0.5619357824325562
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.5271458785764405,
            0.6768157752851645
          ],
          [
            0.17445432881726342,
            0.6725201450785
          ],
          [
            0.09146808181510416,
            0.9805781970421474
          ],
          [
            0.11767426507894403,
            0.9695322907964389
          ],
          [
            0.8798374283356174,
            0.6811114054918289
          ],
          [
            0.9256982490473371,
            0.9805781970421474
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.2945660021098625,
            1.0849006449182828
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.7422549662004586,
            1.0849006449182828
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.4212292212184214,
            0.41969162434339524
          ],
          [
            0.5719147749855,
            0.40987304101387656
          ],
          [
            0.3513460658481819,
            0.44178343683481214
          ],
          [
            0.681107205251499,
            0.420918947259585
          ]
        ],
        "dw_hand_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_hand_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_face": [
          [
            0.353529914453502,
            0.420918947259585
          ],
          [
            0.36008146026946175,
            0.44546540558338166
          ],
          [
            0.3688168546907418,
            0.4700118639071783
          ],
          [
            0.3819199463226617,
            0.4921036763985952
          ],
          [
            0.39939073516522144,
            0.5141954888900121
          ],
          [
            0.42559691842906117,
            0.5338326555490494
          ],
          [
            0.4561707989035412,
            0.5510151763757071
          ],
          [
            0.49329622519398075,
            0.5620610826214156
          ],
          [
            0.5369731973003803,
            0.5632884055376053
          ],
          [
            0.57846632080146,
            0.5546971451242766
          ],
          [
            0.6112240498812598,
            0.5387419472138086
          ],
          [
            0.6374302331450995,
            0.5191047805547714
          ],
          [
            0.6527171733823395,
            0.4970129680633545
          ],
          [
            0.6636364164089393,
            0.47369383265574777
          ],
          [
            0.6658202650142592,
            0.4491473743319511
          ],
          [
            0.6680041136195793,
            0.4233735930919647
          ],
          [
            0.6636364164089393,
            0.3988271347681681
          ],
          [
            0.36226530887478187,
            0.407418395181497
          ],
          [
            0.3819199463226617,
            0.4012817806005478
          ],
          [
            0.40594228098118135,
            0.400054457684358
          ],
          [
            0.43214846424502135,
            0.400054457684358
          ],
          [
            0.4561707989035412,
            0.4025091035167376
          ],
          [
            0.5216862570631406,
            0.3975998118519783
          ],
          [
            0.5478924403269803,
            0.392690520187219
          ],
          [
            0.5740986235908202,
            0.3877812285224596
          ],
          [
            0.6024886554599796,
            0.38655390560626984
          ],
          [
            0.6286948387238197,
            0.3902358743548393
          ],
          [
            0.49111237658866086,
            0.4184643014272054
          ],
          [
            0.49329622519398075,
            0.435646822253863
          ],
          [
            0.49548007379930087,
            0.4540566659967104
          ],
          [
            0.4976639224046206,
            0.4712391868233681
          ],
          [
            0.46927389053546087,
            0.48351241598526634
          ],
          [
            0.4845608307727007,
            0.48596706181764604
          ],
          [
            0.5020316196152608,
            0.48596706181764604
          ],
          [
            0.5216862570631406,
            0.48351241598526634
          ],
          [
            0.5391570459057003,
            0.4798304472366968
          ],
          [
            0.39283918934926165,
            0.4233735930919647
          ],
          [
            0.4124938267971415,
            0.4160096555948257
          ],
          [
            0.43651616145566136,
            0.41478233267863596
          ],
          [
            0.4583546475088609,
            0.4233735930919647
          ],
          [
            0.43651616145566136,
            0.428282884756724
          ],
          [
            0.4124938267971415,
            0.428282884756724
          ],
          [
            0.5369731973003803,
            0.4184643014272054
          ],
          [
            0.5544439861429403,
            0.407418395181497
          ],
          [
            0.5806501694067802,
            0.4037364264329275
          ],
          [
            0.6046725040652998,
            0.4086457180976868
          ],
          [
            0.58501786661742,
            0.41723697851101554
          ],
          [
            0.5609955319589003,
            0.41969162434339524
          ],
          [
            0.44961925308758105,
            0.5129681659738222
          ],
          [
            0.471457739140781,
            0.5080588743090629
          ],
          [
            0.49329622519398075,
            0.5043769055604934
          ],
          [
            0.5063993168259007,
            0.5043769055604934
          ],
          [
            0.5195024084578205,
            0.5031495826443037
          ],
          [
            0.5500762889323003,
            0.5031495826443037
          ],
          [
            0.57846632080146,
            0.5043769055604934
          ],
          [
            0.5609955319589003,
            0.515422811806202
          ],
          [
            0.5391570459057003,
            0.5240140722195307
          ],
          [
            0.5129508626418606,
            0.5276960409681002
          ],
          [
            0.48892852798334074,
            0.5264687180519104
          ],
          [
            0.46927389053546087,
            0.5215594263871511
          ],
          [
            0.4583546475088609,
            0.5141954888900121
          ],
          [
            0.4845608307727007,
            0.5129681659738222
          ],
          [
            0.5085831654312205,
            0.5129681659738222
          ],
          [
            0.5391570459057003,
            0.5092861972252527
          ],
          [
            0.5719147749855,
            0.5068315513928732
          ],
          [
            0.5413408945110205,
            0.5117408430576325
          ],
          [
            0.5107670140365407,
            0.5141954888900121
          ],
          [
            0.4845608307727007,
            0.515422811806202
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "001492",
  "objects": [],
  "mask_file": "./person_labeling/./001492.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A person stands against a plain light-colored wall wearing a mustard yellow sleeveless top with braided hair visible and small earrings noticeable in a simple indoor setting with no other notable objects around.",
  "overall_past": "Before the current scene, the person likely prepared for a photo session—possibly for a professional profile, social media update, or official identification—by selecting their outfit (the mustard yellow sleeveless top), styling their hair into a neat braid (possibly with intentional dye at the ends for a distinctive look), and choosing small earrings to add subtle detail. They may have adjusted their posture in front of a mirror or a camera preview, ensuring their face was centered and their expression neutral to convey professionalism and clarity. The plain background suggests they chose a simple, uncluttered setting to avoid distractions, indicating a deliberate effort to present themselves in a clean, focused manner.",
  "overall_past_clean": "They meticulously rehearsed their stance, adjusted their expression to project calm confidence, and aligned their features with precision, all while mentally preparing to make a clear, composed impression.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the person is likely to step forward or adjust their position slightly to ensure the photograph is properly framed, then may smile or make a small gesture—such as raising a hand or tilting their head—to add a touch of warmth or personality to the image, transforming the neutral profile into a more engaging and personal representation, possibly for a social media post, job application, or online identity.",
  "overall_future_clean": "They confidently shift their stance to center themselves within the frame, then lift their chin slightly and offer a poised, genuine smile that radiates approachability and intent, instantly elevating the image from static to expressive.",
  "future_scene_ok": true
}