{
  "video_path": "./ref_datasets/part2/5426208003.mp4",
  "start_time": 0.0,
  "end_time": 5.88,
  "image_path": "./002491.jpg",
  "represents_multiple_types": true,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/5426208003.mp4",
      "start_time": 0.0,
      "end_time": 5.88,
      "image_path": "./ref_datasets/extracted_frames/person_1762649743365297810_1_5426208003.mp4_0.00_5.88.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/5426208003.mp4",
      "start_time": 0.0,
      "end_time": 5.88,
      "image_path": "./ref_datasets/extracted_frames/face_1762649743365297810_1_5426208003.mp4_0.00_5.88.jpg",
      "type": "face"
    }
  ],
  "cross_video_duplicate": false,
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 1,
      "skeleton": 1,
      "face_box": 1,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "male",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a dark gray medical scrub top with a stethoscope around his neck. He also has on a white head covering and glasses.",
        "clothing": {
          "vague": false,
          "clothing": [
            {
              "possible_names": [
                "scrubs",
                "medical uniform"
              ],
              "name": "scrubs",
              "type": "top",
              "color": [
                "gray"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "stethoscope"
              ],
              "name": "stethoscope",
              "type": "accessory",
              "color": [
                "blue",
                "silver"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "medical cap"
              ],
              "name": "medical cap",
              "type": "headwear",
              "color": [
                "gray"
              ],
              "belonging_confident": true,
              "existence_confident": true
            }
          ]
        },
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "tablet",
              "digital tablet"
            ],
            "name": "tablet",
            "position": "hand"
          }
        ],
        "description": "The person is an adult male who appears to be a medical professional, as indicated by his dark gray scrub top, stethoscope, and white medical cap. He is wearing clear-framed glasses and has a neutral expression. He is holding a tablet in his hand, possibly reviewing medical records or notes.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to be focused and engaged in a professional interaction, possibly discussing medical information.",
        "meaningful": true,
        "story": "A male healthcare professional is consulting with another individual, likely a patient or colleague, using a tablet for reference. The setting suggests a medical office environment.",
        "race": "black",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person in the green bounding box is engaged in a focused discussion with another individual, likely a patient, as indicated by the medical setting and the stethoscope around their neck. They are holding a tablet, possibly reviewing medical records or discussing treatment options, which suggests they are providing professional advice or care. Their expression appears serious and attentive, indicating a commitment to understanding the patient's concerns and offering appropriate guidance. The presence of medical equipment on the table further supports the context of a healthcare consultation, where the individual is actively involved in delivering medical services.",
        "intention": "The individual is motivated to provide accurate medical guidance and ensure patient understanding through attentive communication and use of relevant tools and equipment",
        "intention_ok": true
      },
      "hoi": [
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "both hands",
            "action": [
              "holding",
              "reviewing"
            ]
          },
          "object": 0,
          "deleted": true
        }
      ],
      "without_face": false,
      "facex_detailing": {
        "landmarks": [
          [
            0.739231301099062,
            0.08488846582079691
          ],
          [
            0.7404858442466883,
            0.13033689090183803
          ],
          [
            0.737790018036252,
            0.17541796517750574
          ],
          [
            0.7316614100620861,
            0.21146111639719162
          ],
          [
            0.7250935389172463,
            0.25517563592819936
          ],
          [
            0.7262759990812767,
            0.2947212930709596
          ],
          [
            0.7279769404303459,
            0.32827545196290997
          ],
          [
            0.7290801688851345,
            0.35587432195269875
          ],
          [
            0.7333618789379085,
            0.40228802211700926
          ],
          [
            0.7516266093367622,
            0.4276192468310159
          ],
          [
            0.7741254772103968,
            0.4259594659956675
          ],
          [
            0.8006383066021261,
            0.4154430873810299
          ],
          [
            0.8219440494264876,
            0.39262193649534194
          ],
          [
            0.845335254924638,
            0.3574243257916163
          ],
          [
            0.8583116162390937,
            0.3058494704110282
          ],
          [
            0.8698669697557176,
            0.25421497405521454
          ],
          [
            0.8767503982498532,
            0.19698904052613272
          ],
          [
            0.7434465122542211,
            0.08953882550436354
          ],
          [
            0.7461609018700464,
            0.07878161990453325
          ],
          [
            0.74832495944131,
            0.09126218159993489
          ],
          [
            0.7511709739409742,
            0.08502047326829698
          ],
          [
            0.7524026158310118,
            0.0852382777229188
          ],
          [
            0.7548654065955254,
            0.0849754117784046
          ],
          [
            0.7670267994914736,
            0.0893123952169267
          ],
          [
            0.7749520041048527,
            0.10167223006959945
          ],
          [
            0.7847862813799155,
            0.1186265786488851
          ],
          [
            0.793901022984868,
            0.14647158516777886
          ],
          [
            0.7469580532539459,
            0.11824289881993853
          ],
          [
            0.7367227009719327,
            0.14763684726896742
          ],
          [
            0.7230863767010826,
            0.17053419446188306
          ],
          [
            0.715425003887642,
            0.19886038492596342
          ],
          [
            0.7309151762298175,
            0.23502182582068065
          ],
          [
            0.7284938569757201,
            0.23304737181890578
          ],
          [
            0.730811095166774,
            0.23326638615320597
          ],
          [
            0.7344481873725142,
            0.2393998320140536
          ],
          [
            0.7397150965850977,
            0.23907156293354334
          ],
          [
            0.7478384420985267,
            0.11792126231723361
          ],
          [
            0.7468716248869895,
            0.11832764262244815
          ],
          [
            0.749787907799085,
            0.12321152649228535
          ],
          [
            0.7455764045317967,
            0.11634720015147375
          ],
          [
            0.7483539925799484,
            0.11476123938484799
          ],
          [
            0.7498550263898713,
            0.11454664676908463
          ],
          [
            0.7647349687204474,
            0.15023500730120945
          ],
          [
            0.7659506697739874,
            0.14883215616619777
          ],
          [
            0.7720878781307312,
            0.16239377581883993
          ],
          [
            0.7767603509482883,
            0.17049438158671062
          ],
          [
            0.7721399871366365,
            0.1597081214662582
          ],
          [
            0.7630875709156195,
            0.14650680224100748
          ],
          [
            0.7263117084723143,
            0.29010244248405337
          ],
          [
            0.7264717878862506,
            0.29287468592325844
          ],
          [
            0.7244328501323859,
            0.2729806082589286
          ],
          [
            0.7239823879762775,
            0.270404086794172
          ],
          [
            0.725019117533451,
            0.2728233761257596
          ],
          [
            0.7375088724884249,
            0.2914007217165024
          ],
          [
            0.7471413591787929,
            0.3121763925703745
          ],
          [
            0.7406760968977496,
            0.3184275536310105
          ],
          [
            0.7327496015422401,
            0.33942100282699345
          ],
          [
            0.7240917826514868,
            0.3386451827155219
          ],
          [
            0.7248178268117564,
            0.3227181525457473
          ],
          [
            0.7290612596841085,
            0.30281745971195284
          ],
          [
            0.727512184246665,
            0.28860894611903604
          ],
          [
            0.726443689422948,
            0.2969730271233453
          ],
          [
            0.725299975488867,
            0.29084807653275746
          ],
          [
            0.7352078935397522,
            0.2947765471443297
          ],
          [
            0.7452493092488675,
            0.30804100642128596
          ],
          [
            0.7385451398435093,
            0.3143733947996109
          ],
          [
            0.7283235851497877,
            0.31117920799860876
          ],
          [
            0.727222801230493,
            0.30099330932374985
          ]
        ],
        "visibility": [
          1.5188968063739594e-05,
          0.9931453466415405,
          1.5102120414667297e-05,
          3.6858112048565594e-12,
          5.97523853312909e-12,
          3.005425227263492e-13,
          1.095546071396003e-12,
          8.785901783880945e-09,
          0.01960720866918564,
          0.7858121991157532,
          8.088644972303882e-05,
          0.15176935493946075,
          9.921191472528346e-13,
          2.3407912976836087e-06,
          1.140527050580431e-08,
          0.9938541650772095,
          8.43005873440994e-11,
          0.0015198809560388327,
          0.0001343295443803072,
          0.9864214658737183,
          7.66598784451844e-10,
          1.087799364474229e-10,
          0.8710127472877502,
          0.7448218464851379,
          6.192639716989801e-13,
          0.00022140750661492348,
          0.9176528453826904,
          0.07046913355588913,
          0.02853117696940899
        ],
        "headpose": {
          "pitch": 3.189015963809188,
          "yaw": 76.30621087903296,
          "roll": 1.415710811628291
        },
        "attributes": {
          "5 oClock Shadow": 0.00037612050073221326,
          "Arched Eyebrows": 0.0065024360083043575,
          "Attractive": 0.1302834153175354,
          "Bags Under Eyes": 0.0076186214573681355,
          "Bald": 4.9481215683044866e-05,
          "Bangs": 0.001157703110948205,
          "Big Lips": 0.17782197892665863,
          "Big Nose": 0.00560496561229229,
          "Black Hair": 0.12266221642494202,
          "Blond Hair": 0.005462938919663429,
          "Blurry": 0.08128581941127777,
          "Brown Hair": 0.10520204901695251,
          "Bushy Eyebrows": 0.011848715133965015,
          "Chubby": 0.001996703213080764,
          "Double Chin": 0.0001325403864029795,
          "Eyeglasses": 0.0007086404366418719,
          "Goatee": 7.822216866770759e-05,
          "Gray Hair": 0.00014017488865647465,
          "Heavy Makeup": 0.02888931706547737,
          "High Cheekbones": 0.018773198127746582,
          "Male": 0.00814603641629219,
          "Mouth Slightly Open": 0.19883973896503448,
          "Mustache": 2.3861328372731805e-05,
          "Narrow Eyes": 0.3512366712093353,
          "No Beard": 0.9981291890144348,
          "Oval Face": 0.03258640691637993,
          "Pale Skin": 0.0018036582041531801,
          "Pointy Nose": 0.22462336719036102,
          "Receding Hairline": 0.022403404116630554,
          "Rosy Cheeks": 0.000652759918011725,
          "Sideburns": 9.120192407863215e-05,
          "Smiling": 0.0047704000025987625,
          "Straight Hair": 0.04911591112613678,
          "Wavy Hair": 0.1486586630344391,
          "Wearing Earrings": 0.18943509459495544,
          "Wearing Hat": 0.14756061136722565,
          "Wearing Lipstick": 0.04987020790576935,
          "Wearing Necklace": 0.11914379894733429,
          "Wearing Necktie": 9.166665404336527e-05,
          "Young": 0.9890177249908447
        },
        "age": [
          0.4624761641025543,
          0.9696081876754761,
          0.98183673620224,
          0.29201605916023254,
          0.010502031072974205,
          8.471275214105844e-05,
          1.9689801774802618e-05,
          8.882747692950943e-07
        ],
        "race": [
          0.9112319350242615,
          0.004423316568136215,
          0.6956657767295837,
          0.2654523253440857,
          0.8340857625007629
        ],
        "gender": [
          0.004722564946860075,
          0.9968957901000977
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 5.766780143186763e-07,
          "disgust": 7.799926846560313e-14,
          "fear": 8.174287298406684,
          "happy": 2.827639451901704e-08,
          "sad": 91.82568885973825,
          "surprise": 1.9627339234897073e-14,
          "neutral": 1.9045990601265585e-05
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 385,
          "h": 551,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 34,
        "gender": {
          "Woman": 84.56310629844666,
          "Man": 15.436895191669464
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 7.180435844607849,
          "indian": 6.4730144771320255,
          "black": 44.12526856359618,
          "white": 12.831583579589894,
          "middle eastern": 10.314025245425077,
          "latino hispanic": 19.075662603895353
        },
        "dominant_race": "black"
      }
    },
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "male",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a dark gray medical scrub top with short sleeves. A stethoscope hangs around his neck, and he has on a white medical cap. He also wears clear-framed glasses.",
        "clothing": {
          "vague": false,
          "clothing": [
            {
              "possible_names": [
                "scrubs",
                "medical uniform"
              ],
              "name": "scrubs",
              "type": "top",
              "color": [
                "gray"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "stethoscope"
              ],
              "name": "stethoscope",
              "type": "accessory",
              "color": [
                "blue",
                "silver"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "glasses",
                "eyewear"
              ],
              "name": "glasses",
              "type": "accessory",
              "color": [
                "black",
                "transparent"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "cap",
                "medical cap"
              ],
              "name": "cap",
              "type": "headwear",
              "color": [
                "gray"
              ],
              "belonging_confident": true,
              "existence_confident": true
            }
          ]
        },
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "tablet",
              "digital tablet"
            ],
            "name": "tablet",
            "position": "hand"
          }
        ],
        "description": "The person is an adult male who appears to be a medical professional, given his attire which includes a dark gray scrub top, a stethoscope around his neck, a white medical cap, and clear-framed glasses. His expression is neutral as he interacts with a digital tablet using both hands. The setting suggests a professional environment, likely a medical office.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to be focused and engaged in a professional interaction, possibly discussing medical information.",
        "meaningful": true,
        "story": "A male healthcare professional is consulting with another individual, likely a patient or colleague, using a digital tablet. The setting suggests a medical office or clinic environment.",
        "race": "black",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person in the green bounding box appears to be engaged in a professional interaction, likely discussing medical information as they point at a tablet screen held by another individual. Their focused gaze and hand gesture suggest they are explaining or highlighting specific details on the device, possibly sharing insights or treatment plans. Wearing a stethoscope around their neck and medical attire indicates their role as a healthcare provider, and their serious expression implies a commitment to providing accurate and important information. The setting, which includes medical equipment like a blood pressure monitor, further supports the context of a clinical consultation where collaboration and communication are essential for patient care.",
        "intention": "The individual is focused on accurately conveying critical medical information to support informed decision making and effective patient care",
        "intention_ok": true
      },
      "hoi": [
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "left hand",
            "action": [
              [
                "left hand",
                "holds"
              ]
            ]
          },
          "object": 0
        }
      ],
      "facex_detailing": {
        "landmarks": [
          [
            0.5430477584933951,
            0.18204087599244698
          ],
          [
            0.5506780809944585,
            0.21507728207048288
          ],
          [
            0.556418519582422,
            0.24724515909871095
          ],
          [
            0.5650413580061424,
            0.27764933386807716
          ],
          [
            0.5742787499867734,
            0.30394945573554466
          ],
          [
            0.5867971683541934,
            0.32687565990225975
          ],
          [
            0.5991601728257678,
            0.3512494957636273
          ],
          [
            0.6141388512438252,
            0.3636079180177557
          ],
          [
            0.6285950072464489,
            0.3616749893420587
          ],
          [
            0.6441056820253531,
            0.3442346015304485
          ],
          [
            0.6547884616823424,
            0.3150951792954137
          ],
          [
            0.6630031000645389,
            0.2826970279532135
          ],
          [
            0.6682401323247523,
            0.24784326389353112
          ],
          [
            0.6713422041208972,
            0.20955704728131574
          ],
          [
            0.669709403954801,
            0.17165207875468746
          ],
          [
            0.6642773182619185,
            0.13483015929580366
          ],
          [
            0.659614283520551,
            0.09913251166621213
          ],
          [
            0.5497589091992094,
            0.17650513674216295
          ],
          [
            0.5548119890193145,
            0.1495095038540149
          ],
          [
            0.5649690196272873,
            0.14528192962918965
          ],
          [
            0.5753120484983637,
            0.14093536050231367
          ],
          [
            0.5847405258388747,
            0.13878882297132383
          ],
          [
            0.6028418441258726,
            0.12156145616813942
          ],
          [
            0.6108702302333854,
            0.11239039841152372
          ],
          [
            0.6208566886328516,
            0.10464776445318151
          ],
          [
            0.6309544590257463,
            0.10046057530811855
          ],
          [
            0.6425256201553912,
            0.1126097387737698
          ],
          [
            0.5990587260928891,
            0.16750102749577275
          ],
          [
            0.6023985046715964,
            0.1911683889923903
          ],
          [
            0.6050791094700495,
            0.2137882073720296
          ],
          [
            0.608917348015876,
            0.23630931156652946
          ],
          [
            0.5962995767948173,
            0.2548836118960507
          ],
          [
            0.6042406103795483,
            0.2553687031306917
          ],
          [
            0.6116925275041943,
            0.2556361440628294
          ],
          [
            0.6201289317260186,
            0.24575987581222775
          ],
          [
            0.6270865217206024,
            0.23788934107179996
          ],
          [
            0.5659128854672114,
            0.19297667943611346
          ],
          [
            0.5699838810023807,
            0.18460537264586754
          ],
          [
            0.5809114111143917,
            0.17637551650799138
          ],
          [
            0.5878923427136172,
            0.17962404647201455
          ],
          [
            0.5817964973016864,
            0.1878762407908364
          ],
          [
            0.571269447338723,
            0.19416352756439692
          ],
          [
            0.616223531145425,
            0.15933861208971214
          ],
          [
            0.6209497255228815,
            0.14961437573508612
          ],
          [
            0.6307016145260562,
            0.14164280481439417
          ],
          [
            0.6366023584490731,
            0.14255161607076253
          ],
          [
            0.6321562770576705,
            0.15265028148731855
          ],
          [
            0.6235627220500083,
            0.16040210055295753
          ],
          [
            0.5944546769594863,
            0.29818200194646444
          ],
          [
            0.5998286832478784,
            0.2844488997938771
          ],
          [
            0.6084428063283364,
            0.2777097351336606
          ],
          [
            0.6151512040978386,
            0.27478778349659433
          ],
          [
            0.6213082525701751,
            0.27042831113098786
          ],
          [
            0.6326771792911348,
            0.2684275449268402
          ],
          [
            0.6420420095679306,
            0.2734357063101713
          ],
          [
            0.6365884907898448,
            0.2947269025933806
          ],
          [
            0.6280490608442396,
            0.30874884330406394
          ],
          [
            0.6203056894597553,
            0.31662784303937636
          ],
          [
            0.6104201903655415,
            0.31998077460697716
          ],
          [
            0.6013953099648158,
            0.31271977828293246
          ],
          [
            0.5961338033456177,
            0.29798160494950715
          ],
          [
            0.6073860838299706,
            0.2935233743102462
          ],
          [
            0.6166400964061419,
            0.2910306390631136
          ],
          [
            0.6261197124563512,
            0.2829339302406109
          ],
          [
            0.6401700677971045,
            0.2750474354577443
          ],
          [
            0.6269225950042406,
            0.28548071800716335
          ],
          [
            0.617718622709314,
            0.2947993841120805
          ],
          [
            0.6069653376759518,
            0.29867091418574093
          ]
        ],
        "visibility": [
          0.8935046195983887,
          3.977957021561451e-05,
          0.9690208435058594,
          4.216905047371711e-09,
          0.9997766613960266,
          1.0,
          9.63047909863235e-07,
          0.06419133394956589,
          1.0,
          8.210897794924676e-05,
          0.08859454095363617,
          1.2229602361912839e-05,
          1.0,
          0.9872544407844543,
          0.9996868371963501,
          1.5857277730901842e-06,
          0.8687284588813782,
          2.407097963441629e-05,
          0.0668792724609375,
          0.9997453093528748,
          2.471453759960579e-14,
          1.5336074140520942e-17,
          0.0005643731565214694,
          9.064224926191855e-09,
          1.692415207976694e-09,
          3.7506835744854916e-14,
          2.401109283053709e-15,
          5.152843407700363e-16,
          7.168088814069051e-06
        ],
        "headpose": {
          "pitch": -8.966051648951915,
          "yaw": 3.7976227445675246,
          "roll": -17.438907290768256
        },
        "attributes": {
          "5 oClock Shadow": 0.15429021418094635,
          "Arched Eyebrows": 0.0011553955264389515,
          "Attractive": 0.006040500942617655,
          "Bags Under Eyes": 0.04268253967165947,
          "Bald": 0.01259829942137003,
          "Bangs": 6.332514021778479e-05,
          "Big Lips": 0.8539285659790039,
          "Big Nose": 0.9065536856651306,
          "Black Hair": 0.05673818290233612,
          "Blond Hair": 0.00011644869664451107,
          "Blurry": 0.020956382155418396,
          "Brown Hair": 0.00010210990876657888,
          "Bushy Eyebrows": 0.007149947807192802,
          "Chubby": 0.6417942047119141,
          "Double Chin": 0.20793360471725464,
          "Eyeglasses": 0.2263825684785843,
          "Goatee": 0.869382381439209,
          "Gray Hair": 0.0013015002477914095,
          "Heavy Makeup": 4.1208546463167295e-05,
          "High Cheekbones": 0.16597560048103333,
          "Male": 0.9999195337295532,
          "Mouth Slightly Open": 0.5826452970504761,
          "Mustache": 0.47558796405792236,
          "Narrow Eyes": 0.03561205044388771,
          "No Beard": 0.009133902378380299,
          "Oval Face": 0.26678502559661865,
          "Pale Skin": 3.2108204322867095e-05,
          "Pointy Nose": 0.000864935340359807,
          "Receding Hairline": 0.010694529861211777,
          "Rosy Cheeks": 4.205202276352793e-05,
          "Sideburns": 0.6935667395591736,
          "Smiling": 0.019837094470858574,
          "Straight Hair": 0.0003725984424818307,
          "Wavy Hair": 0.0030099297873675823,
          "Wearing Earrings": 0.006704063154757023,
          "Wearing Hat": 0.492744117975235,
          "Wearing Lipstick": 0.00011271544644841924,
          "Wearing Necklace": 0.030787993222475052,
          "Wearing Necktie": 0.005278581287711859,
          "Young": 0.6458026766777039
        },
        "age": [
          0.00021686431136913598,
          0.02355503849685192,
          0.9817274808883667,
          0.9825830459594727,
          0.7442214488983154,
          0.013750627636909485,
          0.0005079323309473693,
          8.51303502713563e-06
        ],
        "race": [
          0.02626657858490944,
          0.9982141256332397,
          0.6225522756576538,
          0.12871213257312775,
          0.028884518891572952
        ],
        "gender": [
          0.9999438524246216,
          0.00020125770242884755
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 0.016450199473183602,
          "disgust": 2.181657965394379e-07,
          "fear": 0.051509978948161006,
          "happy": 98.01695942878723,
          "sad": 1.6401512548327446,
          "surprise": 4.64521754395264e-06,
          "neutral": 0.2749264007434249
        },
        "dominant_emotion": "happy",
        "region": {
          "x": 0,
          "y": 0,
          "w": 386,
          "h": 465,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 46,
        "gender": {
          "Woman": 2.083873748779297,
          "Man": 97.91613221168518
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 0.773531058343116,
          "indian": 0.17173577658002237,
          "black": 98.99908894295031,
          "white": 0.00231145563837668,
          "middle eastern": 0.009448900363389051,
          "latino hispanic": 0.04388746426794465
        },
        "dominant_race": "black"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.3154868185520172,
        0.0016226887237280607,
        0.8316462635993958,
        0.8148908019065857
      ],
      [
        0.42630207538604736,
        0.003497710917145014,
        0.9997365474700928,
        0.9853532910346985
      ]
    ],
    "face_boxes": [
      [
        0.5396186709403992,
        0.044605646282434464,
        0.6738179922103882,
        0.3543657660484314
      ],
      [
        0.7204469442367554,
        0.043899014592170715,
        0.8543336391448975,
        0.4178767204284668
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.6262872154580222,
            0.37976124763677316
          ],
          [
            0.5121125973330605,
            0.38172412380582016
          ],
          [
            0.3499515455034044,
            0.5956776262319526
          ],
          [
            0.4746059594949086,
            0.6683040444866949
          ],
          [
            0.7404618335829841,
            0.3777983714677262
          ],
          [
            0.7669371073510911,
            0.7468190912485783
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.5275565070311229,
            0.919552194124722
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.6753767855697208,
            0.9234779464628159
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.5705788269042968,
            0.18347363073206466
          ],
          [
            0.6323544656965467,
            0.15206761202731117
          ],
          [
            0.5430004167291853,
            0.20899102092967675
          ],
          [
            0.6742736491627163,
            0.1422532311820758
          ]
        ],
        "dw_hand_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_hand_2": [
          [
            0.48232791434393996,
            0.6879328061771656
          ],
          [
            0.5121125973330605,
            0.6898956823462128
          ],
          [
            0.5418972803221809,
            0.6938214346843069
          ],
          [
            0.56396000846227,
            0.6879328061771656
          ],
          [
            0.5805070545673371,
            0.6957843108533541
          ],
          [
            0.5518255079852211,
            0.6133435117533764
          ],
          [
            0.5716819633113014,
            0.6368980257819414
          ],
          [
            0.5760945089393192,
            0.6741926729938362
          ],
          [
            0.5738882361253103,
            0.7036358155295425
          ],
          [
            0.5407941439151764,
            0.6133435117533764
          ],
          [
            0.5584443264272478,
            0.6526010351343181
          ],
          [
            0.5562380536132389,
            0.6977471870224011
          ],
          [
            0.5474129623572033,
            0.7173759487128718
          ],
          [
            0.5275565070311229,
            0.6211950164295649
          ],
          [
            0.5418972803221809,
            0.6624154159795536
          ],
          [
            0.5396910075081719,
            0.7036358155295425
          ],
          [
            0.5319690526591407,
            0.719338824881919
          ],
          [
            0.5121125973330605,
            0.6349351496128943
          ],
          [
            0.5242470978101094,
            0.6663411683176477
          ],
          [
            0.5253502342171139,
            0.6957843108533541
          ],
          [
            0.5198345521820915,
            0.7114873202057307
          ]
        ],
        "dw_face": [
          [
            0.5418972803221809,
            0.1893622592392058
          ],
          [
            0.5474129623572033,
            0.2207682779439592
          ],
          [
            0.5540317807992299,
            0.25021142047966544
          ],
          [
            0.5628568720552656,
            0.27769168684632467
          ],
          [
            0.5716819633113014,
            0.30320907704393674
          ],
          [
            0.5860227366023594,
            0.32480071490345486
          ],
          [
            0.6003635098934174,
            0.34246660042487864
          ],
          [
            0.6158074195914799,
            0.3522809812701141
          ],
          [
            0.6334576021035513,
            0.34835522893201976
          ],
          [
            0.6489015118016137,
            0.33265221957964314
          ],
          [
            0.6599328758716583,
            0.30713482938203107
          ],
          [
            0.668757967127694,
            0.27965456301537184
          ],
          [
            0.6731705127557119,
            0.24824854431061844
          ],
          [
            0.6753767855697208,
            0.21684252560586503
          ],
          [
            0.6731705127557119,
            0.18543650690111163
          ],
          [
            0.6720673763487074,
            0.15403048819635826
          ],
          [
            0.6676548307206895,
            0.12262446949160495
          ],
          [
            0.5474129623572033,
            0.16777062137968787
          ],
          [
            0.5551349172062344,
            0.1579562405344526
          ],
          [
            0.56396000846227,
            0.15206761202731117
          ],
          [
            0.5738882361253103,
            0.1501047358582641
          ],
          [
            0.5838164637883505,
            0.14814185968921703
          ],
          [
            0.6091886011494531,
            0.13243885033684033
          ],
          [
            0.6191168288124932,
            0.12458734566065202
          ],
          [
            0.6290450564755333,
            0.11673584098446362
          ],
          [
            0.6389732841385735,
            0.11281008864636947
          ],
          [
            0.6500046482086181,
            0.11673584098446362
          ],
          [
            0.6003635098934174,
            0.16777062137968787
          ],
          [
            0.6025697827074262,
            0.1893622592392058
          ],
          [
            0.6058791919284396,
            0.20899102092967675
          ],
          [
            0.6080854647424486,
            0.2286197826201477
          ],
          [
            0.5981572370794085,
            0.2521742966487126
          ],
          [
            0.6047760555214352,
            0.25021142047966544
          ],
          [
            0.6124980103704665,
            0.24824854431061844
          ],
          [
            0.6191168288124932,
            0.24235991580347713
          ],
          [
            0.6268387836615245,
            0.23647128729633599
          ],
          [
            0.5595474628342522,
            0.19132513540825297
          ],
          [
            0.5661662812762791,
            0.17954787839397032
          ],
          [
            0.5760945089393192,
            0.17562212605587638
          ],
          [
            0.5849196001953548,
            0.1815107545630175
          ],
          [
            0.5771976453463236,
            0.1893622592392058
          ],
          [
            0.568372554090288,
            0.19328801157730013
          ],
          [
            0.6191168288124932,
            0.16188199287254654
          ],
          [
            0.62573564725452,
            0.14814185968921703
          ],
          [
            0.6345607385105556,
            0.1422532311820758
          ],
          [
            0.6455921025806003,
            0.14421610735112278
          ],
          [
            0.6378701477315691,
            0.1559933643654053
          ],
          [
            0.6290450564755333,
            0.16188199287254654
          ],
          [
            0.5948478278583951,
            0.2914318200296543
          ],
          [
            0.6014666463004219,
            0.27965456301537184
          ],
          [
            0.6102917375564575,
            0.27180305833918356
          ],
          [
            0.6158074195914799,
            0.2698401821701364
          ],
          [
            0.6213231016265022,
            0.26787730600108917
          ],
          [
            0.6323544656965467,
            0.2659144298320422
          ],
          [
            0.6433858297665914,
            0.2698401821701364
          ],
          [
            0.6378701477315691,
            0.28554319152251295
          ],
          [
            0.6312513292895423,
            0.2973204485367956
          ],
          [
            0.6213231016265022,
            0.3051719532129839
          ],
          [
            0.611394873963462,
            0.30713482938203107
          ],
          [
            0.6025697827074262,
            0.3012462008748898
          ],
          [
            0.5981572370794085,
            0.2914318200296543
          ],
          [
            0.6069823283354441,
            0.28554319152251295
          ],
          [
            0.6180136924054888,
            0.281617439184419
          ],
          [
            0.6290450564755333,
            0.2757288106772775
          ],
          [
            0.6411795569525826,
            0.27180305833918356
          ],
          [
            0.6301481928825379,
            0.281617439184419
          ],
          [
            0.6191168288124932,
            0.2875060676915601
          ],
          [
            0.6080854647424486,
            0.2914318200296543
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      },
      {
        "dw_body": [
          [
            0.7333861577510834,
            0.23523137549629977
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.9169060062037574,
            0.5283375091352872
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.5045391178131103,
            0.9040641636658018
          ],
          [
            0.8914785573217605,
            0.5637463038030844
          ],
          [
            0.6139877021312714,
            0.939472958333599
          ],
          [
            0.5244388604164123,
            0.9119327847030898
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.4249401473999023,
            0.9040641636658018
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.4249401473999023,
            0.9119327847030898
          ],
          [
            0.4249401473999023,
            0.8902940768505472
          ],
          [
            0.7499692765871683,
            0.16834809667934963
          ],
          [
            0.7742911842134262,
            0.1742495624573159
          ],
          [
            0.8903730160660214,
            0.22146128868104537
          ],
          [
            0.8892674748102822,
            0.22146128868104537
          ]
        ],
        "dw_hand_1": [
          [
            0.5255444016721513,
            0.9040641636658018
          ],
          [
            0.5321776492065853,
            0.8391480401081736
          ],
          [
            0.5443386030197144,
            0.8194764875149528
          ],
          [
            0.5465496855311924,
            0.8273451085522412
          ],
          [
            0.5454441442754534,
            0.8273451085522412
          ],
          [
            0.5277554841836294,
            0.8293122638115631
          ],
          [
            0.5310721079508464,
            0.8391480401081736
          ],
          [
            0.5498663092984093,
            0.8116078664776645
          ],
          [
            0.5587106393443214,
            0.789969158625122
          ],
          [
            0.5167000716262394,
            0.8391480401081736
          ],
          [
            0.5277554841836294,
            0.8411151953674956
          ],
          [
            0.5310721079508464,
            0.8411151953674956
          ],
          [
            0.5332831904623243,
            0.8352137295895293
          ],
          [
            0.5144889891147614,
            0.8529181269234279
          ],
          [
            0.5211222366491953,
            0.8529181269234279
          ],
          [
            0.5255444016721513,
            0.8411151953674956
          ],
          [
            0.5244388604164123,
            0.8391480401081736
          ],
          [
            0.5133834478590223,
            0.8902940768505472
          ],
          [
            0.5200166953934563,
            0.8568524374420721
          ],
          [
            0.5244388604164123,
            0.8529181269234279
          ],
          [
            0.5244388604164123,
            0.8411151953674956
          ]
        ],
        "dw_hand_2": [
          [
            0.4956947877671984,
            0.7368559666234262
          ],
          [
            0.5144889891147614,
            0.7211187245488497
          ],
          [
            0.5365998142295414,
            0.7073486377335954
          ],
          [
            0.5564995568328434,
            0.6798084641030863
          ],
          [
            0.5631328043672773,
            0.6916113956590189
          ],
          [
            0.5487607680426704,
            0.6050565642488478
          ],
          [
            0.5697660519017113,
            0.640465358916645
          ],
          [
            0.5730826756689283,
            0.6896442403996967
          ],
          [
            0.5708715931574503,
            0.7211187245488497
          ],
          [
            0.5332831904623243,
            0.6129251852861362
          ],
          [
            0.5542884743213654,
            0.6640712220285099
          ],
          [
            0.5542884743213654,
            0.7034143272149511
          ],
          [
            0.5498663092984093,
            0.73095450084546
          ],
          [
            0.5200166953934563,
            0.6247281168420685
          ],
          [
            0.5388108967410195,
            0.6739069983251202
          ],
          [
            0.5343887317180633,
            0.705381482474273
          ],
          [
            0.5277554841836294,
            0.7211187245488497
          ],
          [
            0.5067502003245884,
            0.642432514175967
          ],
          [
            0.5200166953934563,
            0.6798084641030863
          ],
          [
            0.5189111541377174,
            0.7014471719556291
          ],
          [
            0.5167000716262394,
            0.7132501035115614
          ]
        ],
        "dw_face": [
          [
            0.7488637353314294,
            0.1585123203827394
          ],
          [
            0.7466526528199515,
            0.19982258082850263
          ],
          [
            0.7433360290527343,
            0.23916568601494395
          ],
          [
            0.7400194052855175,
            0.2765416359420632
          ],
          [
            0.7400194052855175,
            0.31391758586918245
          ],
          [
            0.7466526528199515,
            0.34932638053697956
          ],
          [
            0.7532859003543854,
            0.38473517520477674
          ],
          [
            0.7654468541675145,
            0.41030819357596365
          ],
          [
            0.7875576792822945,
            0.41227534883528555
          ],
          [
            0.8074574218855964,
            0.39850526202003117
          ],
          [
            0.8251460819774205,
            0.3788337094268105
          ],
          [
            0.8395181183020273,
            0.35522784631494564
          ],
          [
            0.8538901546266343,
            0.3276876726844368
          ],
          [
            0.8638400259282852,
            0.29227887801663965
          ],
          [
            0.8693677322069803,
            0.25687008334884254
          ],
          [
            0.8726843559741974,
            0.21949413342172328
          ],
          [
            0.8760009797414146,
            0.18211818349460404
          ],
          [
            0.7488637353314294,
            0.12113637045562016
          ],
          [
            0.7488637353314294,
            0.12113637045562016
          ],
          [
            0.7488637353314294,
            0.12310352571494214
          ],
          [
            0.7477581940756904,
            0.12310352571494214
          ],
          [
            0.7477581940756904,
            0.12507068097426413
          ],
          [
            0.7521803590986464,
            0.11916921519629797
          ],
          [
            0.7621302304002975,
            0.1152349046776539
          ],
          [
            0.7720801017019485,
            0.1152349046776539
          ],
          [
            0.7820299730035994,
            0.12113637045562016
          ],
          [
            0.7919798443052505,
            0.1329393020115525
          ],
          [
            0.7488637353314294,
            0.17031525193867172
          ],
          [
            0.7400194052855175,
            0.19195395979121446
          ],
          [
            0.7300695339838664,
            0.21359266764375703
          ],
          [
            0.7212252039379543,
            0.23523137549629977
          ],
          [
            0.7234362864494324,
            0.2549029280895204
          ],
          [
            0.7311750752396053,
            0.26277154912680856
          ],
          [
            0.7400194052855175,
            0.26670585964545274
          ],
          [
            0.7455471115642124,
            0.268673014904775
          ],
          [
            0.7510748178429073,
            0.26670585964545274
          ],
          [
            0.7488637353314294,
            0.16638094142002754
          ],
          [
            0.7488637353314294,
            0.16834809667934963
          ],
          [
            0.7488637353314294,
            0.16834809667934963
          ],
          [
            0.7488637353314294,
            0.16638094142002754
          ],
          [
            0.7488637353314294,
            0.16834809667934963
          ],
          [
            0.7488637353314294,
            0.16834809667934963
          ],
          [
            0.7665523954232535,
            0.176216717716638
          ],
          [
            0.7720801017019485,
            0.1742495624573159
          ],
          [
            0.7787133492363824,
            0.176216717716638
          ],
          [
            0.7853465967708164,
            0.18015102823528195
          ],
          [
            0.7787133492363824,
            0.18605249401324822
          ],
          [
            0.7709745604462094,
            0.18605249401324822
          ],
          [
            0.7433360290527343,
            0.3217862069064708
          ],
          [
            0.7389138640297783,
            0.31391758586918245
          ],
          [
            0.7378083227740394,
            0.3021146543132499
          ],
          [
            0.7378083227740394,
            0.3021146543132499
          ],
          [
            0.7400194052855175,
            0.300147499053928
          ],
          [
            0.7510748178429073,
            0.31195043060986033
          ],
          [
            0.7621302304002975,
            0.32572051742511476
          ],
          [
            0.7566025241216026,
            0.3355562937217252
          ],
          [
            0.7510748178429073,
            0.3434249147590133
          ],
          [
            0.7444415703084732,
            0.34539207001833544
          ],
          [
            0.7411249465412564,
            0.3375234489810471
          ],
          [
            0.7422304877969955,
            0.32965482794375894
          ],
          [
            0.7433360290527343,
            0.3217862069064708
          ],
          [
            0.7422304877969955,
            0.31981905164714847
          ],
          [
            0.7422304877969955,
            0.3178518963878266
          ],
          [
            0.7510748178429073,
            0.31981905164714847
          ],
          [
            0.7599191478888192,
            0.32572051742511476
          ],
          [
            0.7532859003543854,
            0.32572051742511476
          ],
          [
            0.7455471115642124,
            0.32572051742511476
          ],
          [
            0.7444415703084732,
            0.32375336216579265
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "002491",
  "objects": [
    {
      "box": [
        0.3457936644554138,
        0.6524607539176941,
        0.5762557983398438,
        0.8248737454414368
      ],
      "name": "tablet",
      "possible_names": [
        "tablet"
      ]
    }
  ],
  "mask_file": "./person_labeling/./002491.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A medical consultation takes place in a bright and modern office, with a laptop, stethoscope, and decorative plant visible on the desk, suggesting a professional and organized environment with a focus on technology and healthcare tools.",
  "overall_past": "Before the current scene, the healthcare provider likely conducted an initial assessment of the patient, including taking vital signs such as blood pressure and listening to heart and lung sounds using the stethoscope. They may have reviewed the patient’s medical history and symptoms, possibly entering notes into the laptop or tablet, which would explain the device’s presence and the provider’s focused engagement with the screen. This preparatory phase would have set the stage for the current moment, where the provider is now sharing detailed information or treatment recommendations with the patient, using the tablet as a visual aid to enhance understanding and ensure clarity in the care plan.",
  "overall_past_clean": "The provider swiftly reviewed the patient’s medical records, confirmed vital signs, and assessed cardiac and pulmonary function, then documented findings and synthesized clinical insights prior to delivering the care plan.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the healthcare provider is likely to conclude the consultation by summarizing the diagnosis or treatment plan, confirming the patient’s understanding, and possibly scheduling follow-up appointments or prescribing medication. The focused interaction, use of digital tools like the tablet and laptop, and the presence of medical equipment such as the stethoscope suggest a tech-integrated, patient-centered approach. The provider may then hand over a printed or digital copy of the plan, ensuring the patient feels informed and supported before leaving the appointment.",
  "overall_future_clean": "The provider confirms the diagnosis, outlines the treatment steps, ensures clarity through verbal recap and written documentation, and schedules the next appointment before handing over the plan, leaving the patient with clear direction and confidence in their care.",
  "future_scene_ok": true
}