{
  "video_path": "./ref_datasets/part2/7580054001.mp4",
  "start_time": 0.0,
  "end_time": 4.0,
  "image_path": "./007901.jpg",
  "represents_multiple_types": true,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/7580054000.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/person_5625994110277055662_1_7580054000.mp4_0.00_6.08.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/7580054000.mp4",
      "start_time": 0.0,
      "end_time": 6.08,
      "image_path": "./ref_datasets/extracted_frames/face_5625994110277055662_1_7580054000.mp4_0.00_6.08.jpg",
      "type": "face"
    },
    {
      "video_path": "./ref_datasets/part2/7580054001.mp4",
      "start_time": 0.0,
      "end_time": 4.0,
      "image_path": "./ref_datasets/extracted_frames/person_7660395427457142168_1_7580054001.mp4_0.00_4.00.jpg",
      "type": "person"
    },
    {
      "video_path": "./ref_datasets/part2/7580054001.mp4",
      "start_time": 0.0,
      "end_time": 4.0,
      "image_path": "./ref_datasets/extracted_frames/face_7660395427457142168_1_7580054001.mp4_0.00_4.00.jpg",
      "type": "face"
    }
  ],
  "cross_video_duplicate": true,
  "types": [
    "person",
    "face"
  ],
  "persons": [
    {
      "body_box": 1,
      "skeleton": 0,
      "face_box": 1,
      "qwen_detailing": {
        "background": false,
        "age": "child",
        "gender": "male",
        "emotion": "neutral",
        "clothing_description": "The child is wearing a light yellow hoodie with a drawstring at the neck. The hoodie appears soft and casual, suitable for a relaxed setting. There are no visible accessories or additional layers of clothing on the child.",
        "clothing": {
          "vague": false,
          "clothing": [
            {
              "possible_names": [
                "jacket",
                "blazer"
              ],
              "name": "jacket",
              "type": "top",
              "color": [
                "beige"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "shirt",
                "blouse"
              ],
              "name": "shirt",
              "type": "top",
              "color": [
                "gray"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "bracelet"
              ],
              "name": "bracelet",
              "type": "accessory",
              "color": [
                "beige",
                "brown"
              ],
              "belonging_confident": true,
              "existence_confident": true
            }
          ]
        },
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "pencil",
              "pen"
            ],
            "name": "pencil",
            "position": "hand"
          },
          {
            "standalone": false,
            "possible_names": [
              "notebook",
              "writing pad"
            ],
            "name": "notebook",
            "position": "hand"
          }
        ],
        "description": "A child, likely a boy based on appearance, is seated at a table engaged in writing or drawing. He is wearing a light yellow hoodie and holding a pencil in his hand while interacting with a notebook. His expression is neutral, suggesting focus on the task at hand. The setting appears to be indoors, possibly a classroom or a home environment, given the presence of another individual who seems to be teaching or guiding him.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The child appears to be focused and engaged in writing, showing a neutral expression typical for concentration.",
        "meaningful": true,
        "story": "The child seems to be participating in a music lesson or practice session, possibly learning about musical notation as he writes while observing the adult playing a recorder.",
        "race": "black",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person in the green bounding box is playing a recorder while sitting at a table with another individual who appears to be taking notes. The person playing the recorder seems focused on producing music, possibly demonstrating a technique or teaching a lesson. Their posture and hand placement suggest they are experienced with the instrument, and their expression indicates concentration and engagement in the activity. The interaction between the two individuals suggests a learning environment, where the person playing the recorder is likely instructing or guiding the other person through musical practice or theory.",
        "intention": "The individual is demonstrating a musical technique to facilitate learning and skill development in a structured educational setting",
        "intention_ok": true
      },
      "hoi": [
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "both hands",
            "action": [
              "writing",
              "holding"
            ]
          },
          "object": 0,
          "deleted": true
        },
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "left hand",
            "action": [
              [
                "left hand",
                "pressing"
              ],
              [
                "left hand",
                "holding"
              ]
            ]
          },
          "object": 1
        },
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "right hand",
            "action": [
              [
                "right hand",
                "holding"
              ],
              [
                "right hand",
                "writing"
              ]
            ]
          },
          "object": 2
        }
      ],
      "without_face": false,
      "deleted": false,
      "facex_detailing": {
        "landmarks": [
          [
            0.5877966450951086,
            0.3866984956764749
          ],
          [
            0.5927384512449699,
            0.40474557429552077
          ],
          [
            0.5960452463891771,
            0.4284100486763886
          ],
          [
            0.5968673542693809,
            0.4484732901411397
          ],
          [
            0.5965154108231661,
            0.45922920459083144
          ],
          [
            0.6011310034012668,
            0.4705742920083659
          ],
          [
            0.6077603265091225,
            0.48116192732538493
          ],
          [
            0.6111968355834799,
            0.4947475644094604
          ],
          [
            0.6168984485050989,
            0.512115839017289
          ],
          [
            0.634808974038987,
            0.517453135656459
          ],
          [
            0.6510411384244444,
            0.5101951535258974
          ],
          [
            0.6647722647934364,
            0.5008863936577524
          ],
          [
            0.68261530714691,
            0.4884849961314882
          ],
          [
            0.7039002976089558,
            0.4724868534931115
          ],
          [
            0.7105906523093974,
            0.4516653421201876
          ],
          [
            0.7181670740167931,
            0.43466370893376216
          ],
          [
            0.7261968627808586,
            0.4246483632496425
          ],
          [
            0.5929788394264444,
            0.3891139311449868
          ],
          [
            0.5873601610698397,
            0.3860916181866612
          ],
          [
            0.5933193205210266,
            0.3834706831989544
          ],
          [
            0.5969373489498461,
            0.37756506430783443
          ],
          [
            0.6063253514350407,
            0.3807658452008452
          ],
          [
            0.6052238277026585,
            0.3945971084492547
          ],
          [
            0.6163166247978412,
            0.39460319131612775
          ],
          [
            0.6250988602007508,
            0.4051633523511035
          ],
          [
            0.6305189159181382,
            0.4099758192364658
          ],
          [
            0.6381677765064139,
            0.42736401185393336
          ],
          [
            0.6044278351402788,
            0.40431138601686273
          ],
          [
            0.594850787977693,
            0.4186569556593895
          ],
          [
            0.5844112837440754,
            0.4287491887807846
          ],
          [
            0.5840893651127185,
            0.4433858371206692
          ],
          [
            0.5920049158038285,
            0.45098375688706127
          ],
          [
            0.593714907781157,
            0.4538849194134985
          ],
          [
            0.5975664445332118,
            0.4538216102868319
          ],
          [
            0.6019899761866009,
            0.45229072166340695
          ],
          [
            0.6070497922481053,
            0.45205315867705004
          ],
          [
            0.5968701961494627,
            0.39460013298583885
          ],
          [
            0.5956654225392317,
            0.39671594670840676
          ],
          [
            0.5982671163384877,
            0.40481196202869923
          ],
          [
            0.5961194840057817,
            0.3999261188719954
          ],
          [
            0.5984846073483664,
            0.3955152597544449
          ],
          [
            0.6011553413968868,
            0.3947440840303898
          ],
          [
            0.6184178050863679,
            0.4178299696317741
          ],
          [
            0.6196021318435669,
            0.42491344107048856
          ],
          [
            0.6248790412352829,
            0.43122321915413653
          ],
          [
            0.6249497486800744,
            0.43299344831279346
          ],
          [
            0.6241206538740289,
            0.42926459684967994
          ],
          [
            0.6124491778000322,
            0.416704193183354
          ],
          [
            0.5935148473769899,
            0.46673907823860644
          ],
          [
            0.5965498284688071,
            0.472906476684979
          ],
          [
            0.5941973207488892,
            0.46558828093111515
          ],
          [
            0.592106146692599,
            0.46450914655412945
          ],
          [
            0.5960032055302271,
            0.46288594704653535
          ],
          [
            0.6067721506590565,
            0.4700701710368905
          ],
          [
            0.6116494806986007,
            0.4813641894076552
          ],
          [
            0.6105367056907169,
            0.4821024466838155
          ],
          [
            0.6015428863505207,
            0.49056214647633684
          ],
          [
            0.5937160732884886,
            0.4842759496399334
          ],
          [
            0.5948869645910919,
            0.4764145876680102
          ],
          [
            0.5958795302128665,
            0.4682372680732182
          ],
          [
            0.5897489861205772,
            0.46854523686426025
          ],
          [
            0.5971824052787962,
            0.47226130078945844
          ],
          [
            0.5958141119076461,
            0.47252867658223424
          ],
          [
            0.6034013229703146,
            0.47546219996043615
          ],
          [
            0.6099223732002198,
            0.48098711924893517
          ],
          [
            0.6096408282322859,
            0.4810731445040021
          ],
          [
            0.599705759242729,
            0.4752723063741412
          ],
          [
            0.5961083765067752,
            0.4685892227504935
          ]
        ],
        "visibility": [
          1.982915136977681e-06,
          1.0,
          0.0003353091888129711,
          0.9994986057281494,
          0.035221926867961884,
          1.195812018295328e-07,
          0.7491574287414551,
          0.9999741315841675,
          3.9747569124948257e-10,
          0.9976734519004822,
          1.1371445907570887e-05,
          0.002400739351287484,
          7.133251021113063e-12,
          2.5569979467121584e-10,
          0.32139334082603455,
          0.9858742952346802,
          1.1386110110311876e-10,
          0.06430041044950485,
          2.597117236291524e-05,
          3.204424137948081e-05,
          5.282784059090773e-07,
          4.382974339023349e-08,
          0.9865343570709229,
          1.0730727950658547e-07,
          0.005958583205938339,
          0.9999798536300659,
          0.9903067350387573,
          0.8050872087478638,
          0.007868981920182705
        ],
        "headpose": {
          "pitch": -56.25865285365632,
          "yaw": 86.78719080193089,
          "roll": -38.96009228995349
        },
        "attributes": {
          "5 oClock Shadow": 0.0006328374147415161,
          "Arched Eyebrows": 0.004104466177523136,
          "Attractive": 0.07798033207654953,
          "Bags Under Eyes": 0.0010394200216978788,
          "Bald": 9.315682518717949e-07,
          "Bangs": 0.019174724817276,
          "Big Lips": 0.02329222299158573,
          "Big Nose": 0.001994472462683916,
          "Black Hair": 0.2590888440608978,
          "Blond Hair": 0.0011400007642805576,
          "Blurry": 0.1638975888490677,
          "Brown Hair": 0.2275247871875763,
          "Bushy Eyebrows": 0.003925705328583717,
          "Chubby": 0.001718332408927381,
          "Double Chin": 0.000159439179697074,
          "Eyeglasses": 0.0034507070668041706,
          "Goatee": 0.00037519654142670333,
          "Gray Hair": 0.0009769049938768148,
          "Heavy Makeup": 0.023046892136335373,
          "High Cheekbones": 0.0248776376247406,
          "Male": 0.16323454678058624,
          "Mouth Slightly Open": 0.06359129399061203,
          "Mustache": 0.00019770651124417782,
          "Narrow Eyes": 0.21240903437137604,
          "No Beard": 0.9914789795875549,
          "Oval Face": 0.03192754462361336,
          "Pale Skin": 0.0017497411463409662,
          "Pointy Nose": 0.2494494616985321,
          "Receding Hairline": 0.003578804200515151,
          "Rosy Cheeks": 0.0003492900577839464,
          "Sideburns": 0.0003308332816231996,
          "Smiling": 0.005968869663774967,
          "Straight Hair": 0.10268829017877579,
          "Wavy Hair": 0.3631778359413147,
          "Wearing Earrings": 0.13888618350028992,
          "Wearing Hat": 0.0005079495022073388,
          "Wearing Lipstick": 0.01295485906302929,
          "Wearing Necklace": 0.008800312876701355,
          "Wearing Necktie": 0.0007599920500069857,
          "Young": 0.8290356397628784
        },
        "age": [
          0.25790372490882874,
          0.06464561820030212,
          0.8026047348976135,
          0.11631053686141968,
          0.13223454356193542,
          0.010804598219692707,
          0.01067599467933178,
          0.00035546335857361555
        ],
        "race": [
          0.7705550193786621,
          0.0010378871811553836,
          0.9339179396629333,
          0.4223235845565796,
          0.7872510552406311
        ],
        "gender": [
          0.3626042306423187,
          0.6818490028381348
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 0.020153339354202677,
          "disgust": 7.214293948234846e-11,
          "fear": 51.13458023851153,
          "happy": 0.38707866375700667,
          "sad": 48.433795758033305,
          "surprise": 7.217107994638072e-09,
          "neutral": 0.02439153322752914
        },
        "dominant_emotion": "fear",
        "region": {
          "x": 0,
          "y": 0,
          "w": 193,
          "h": 380,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 37,
        "gender": {
          "Woman": 9.036266058683395,
          "Man": 90.96373319625854
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 28.16648055115226,
          "indian": 9.99958574769412,
          "black": 47.935414191211116,
          "white": 3.005681366067014,
          "middle eastern": 1.4257416047597888,
          "latino hispanic": 9.467094955867228
        },
        "dominant_race": "black"
      }
    },
    {
      "body_box": 0,
      "skeleton": 1,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a beige blazer over a gray top. She also has a bracelet on her left wrist.",
        "clothing": {
          "vague": false,
          "clothing": [
            {
              "possible_names": [
                "jacket",
                "coat"
              ],
              "name": "jacket",
              "type": "top",
              "color": [
                "beige"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "shirt",
                "blouse"
              ],
              "name": "shirt",
              "type": "top",
              "color": [
                "gray"
              ],
              "belonging_confident": true,
              "existence_confident": true
            },
            {
              "possible_names": [
                "bracelet"
              ],
              "name": "bracelet",
              "type": "accessory",
              "color": [
                "beige",
                "green"
              ],
              "belonging_confident": true,
              "existence_confident": true
            }
          ]
        },
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "recorder",
              "flute"
            ],
            "name": "recorder",
            "position": "hand"
          }
        ],
        "description": "A female adult is sitting at a table, playing a recorder with both hands. She is dressed in a beige blazer over a gray top and wears a bracelet on her left wrist. Her expression appears neutral as she focuses on playing the instrument.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears focused and engaged in playing the recorder, showing a calm and concentrated expression.",
        "meaningful": true,
        "story": "A woman is teaching a child how to play the recorder. She is demonstrating the technique while the child attentively writes notes, possibly learning music theory or practicing what she has been taught.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person in the green bounding box is playing a recorder while sitting at a table, likely teaching or demonstrating to the child beside them who appears to be writing or drawing. Their focused expression suggests they are concentrating on producing the correct notes, possibly as part of a music lesson. The interaction seems educational, with the adult guiding the child's learning process through practical demonstration, fostering an environment conducive to musical education and skill development.",
        "intention": "The individual is demonstrating proper recorder technique to facilitate the learner's musical skill development through hands on instruction",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.326372055559562,
            0.26335170432215643
          ],
          [
            0.33256411380553375,
            0.2812544128547112
          ],
          [
            0.34294598681270766,
            0.29704301424679297
          ],
          [
            0.3534211307606369,
            0.3124909277827967
          ],
          [
            0.36459957695511913,
            0.3275150412250133
          ],
          [
            0.38079939642280497,
            0.34111212761629195
          ],
          [
            0.3984916811897641,
            0.35182884136835735
          ],
          [
            0.41695574566170024,
            0.36003088443761777
          ],
          [
            0.4372284597820706,
            0.36063491311811263
          ],
          [
            0.4592836066528603,
            0.35673683629859065
          ],
          [
            0.4792319866715285,
            0.34701053493079687
          ],
          [
            0.4965271012492912,
            0.3330274973951635
          ],
          [
            0.5086456158173778,
            0.31436842491938954
          ],
          [
            0.5145768308134936,
            0.29564268422268686
          ],
          [
            0.5137097938981636,
            0.2767308213171505
          ],
          [
            0.5130068312246332,
            0.25827776202488517
          ],
          [
            0.5145837153076495,
            0.23699234418925785
          ],
          [
            0.3384424717022628,
            0.25514991808505283
          ],
          [
            0.3487725202841733,
            0.2485382473184949
          ],
          [
            0.36360187420138607,
            0.24822946747853644
          ],
          [
            0.37785332600275673,
            0.2486515035409303
          ],
          [
            0.39202502000899536,
            0.2500820992071004
          ],
          [
            0.4237800935273448,
            0.2469588241761639
          ],
          [
            0.437408880045805,
            0.2406756417382331
          ],
          [
            0.4512496066471887,
            0.23643388969912416
          ],
          [
            0.4666364510854085,
            0.23470558501070454
          ],
          [
            0.4832186855967083,
            0.2381810445161093
          ],
          [
            0.4080607466281406,
            0.26413638739004025
          ],
          [
            0.40871286638199333,
            0.27437528519048576
          ],
          [
            0.4120345603852045,
            0.2846568779576392
          ],
          [
            0.413288087220419,
            0.2957785619511491
          ],
          [
            0.40364671598666557,
            0.30419437047981085
          ],
          [
            0.410978646442373,
            0.306061405085382
          ],
          [
            0.41764008298752797,
            0.3064951810808409
          ],
          [
            0.42515652718998137,
            0.30297851353174166
          ],
          [
            0.43062051761718023,
            0.29994546093401453
          ],
          [
            0.35911414691064725,
            0.2683405473118737
          ],
          [
            0.36830455121539885,
            0.2675890158684481
          ],
          [
            0.3792249591262252,
            0.26619675578106017
          ],
          [
            0.38987302947296665,
            0.26779992913916
          ],
          [
            0.3795150940380399,
            0.2682658970178593
          ],
          [
            0.3693324247996012,
            0.2683311459031843
          ],
          [
            0.4345033444109417,
            0.2611189677601769
          ],
          [
            0.4417884137895372,
            0.258638158369632
          ],
          [
            0.4524702646744945,
            0.2584197226202204
          ],
          [
            0.46320207465893376,
            0.2571398401189418
          ],
          [
            0.45444710065448096,
            0.25897956265225297
          ],
          [
            0.4444950061500388,
            0.2599164660842646
          ],
          [
            0.40099112470313986,
            0.3227874100563072
          ],
          [
            0.4062228564862852,
            0.31918694763666106
          ],
          [
            0.41490434316731006,
            0.31555250226741743
          ],
          [
            0.4216798576413008,
            0.3149425529298328
          ],
          [
            0.429354961523934,
            0.31403528657697494
          ],
          [
            0.4419077574260651,
            0.31519728987699464
          ],
          [
            0.45639572881516954,
            0.3170084161772614
          ],
          [
            0.4464721398378806,
            0.3247748583910011
          ],
          [
            0.43571599223626356,
            0.330317188196239
          ],
          [
            0.4277025154658726,
            0.33128437754653745
          ],
          [
            0.41949442148839355,
            0.33107793856234774
          ],
          [
            0.4108391703121246,
            0.32866898810579664
          ],
          [
            0.40529982258403113,
            0.3228400336135001
          ],
          [
            0.4151380624405291,
            0.3198400582940806
          ],
          [
            0.42438446838389,
            0.3205507669420469
          ],
          [
            0.43161233133739896,
            0.31916272430902437
          ],
          [
            0.45203899763248584,
            0.31764914482122375
          ],
          [
            0.43461993424980727,
            0.3237719288184529
          ],
          [
            0.4255193493353627,
            0.3250503852253869
          ],
          [
            0.4171707093400299,
            0.3232194422965958
          ]
        ],
        "visibility": [
          0.9999997615814209,
          0.036167435348033905,
          2.820162262651138e-05,
          9.60868682886011e-17,
          0.8378458619117737,
          0.9970335960388184,
          1.932349169564418e-09,
          3.6753732501892955e-07,
          0.00016800528101157397,
          1.9033778642096877e-07,
          4.4067666630680775e-18,
          7.922583758739749e-15,
          3.3140571758849546e-05,
          2.9040346719694764e-15,
          4.1701048303366406e-07,
          7.56052189712815e-14,
          1.127959947666568e-08,
          0.0006410811911337078,
          1.550882767478376e-14,
          8.994801464723423e-05,
          3.129191751294591e-28,
          2.8564500550586243e-15,
          0.0055906218476593494,
          0.999997615814209,
          0.017538808286190033,
          0.8287779688835144,
          0.9999747276306152,
          0.9999972581863403,
          0.9998738765716553
        ],
        "headpose": {
          "pitch": -17.536843665729776,
          "yaw": 4.955895615528395,
          "roll": -10.039537966650832
        },
        "attributes": {
          "5 oClock Shadow": 8.056967635639012e-05,
          "Arched Eyebrows": 0.02728884108364582,
          "Attractive": 0.3196876645088196,
          "Bags Under Eyes": 0.15311601758003235,
          "Bald": 6.200748885021312e-06,
          "Bangs": 0.0002553433587308973,
          "Big Lips": 0.05076625570654869,
          "Big Nose": 0.04190309718251228,
          "Black Hair": 0.0035425794776529074,
          "Blond Hair": 0.0928548127412796,
          "Blurry": 0.0005950127961114049,
          "Brown Hair": 0.4002242386341095,
          "Bushy Eyebrows": 0.009924781508743763,
          "Chubby": 0.004296877887099981,
          "Double Chin": 0.00017779531481210142,
          "Eyeglasses": 0.001541860867291689,
          "Goatee": 4.2574891267577186e-05,
          "Gray Hair": 0.0006380611448548734,
          "Heavy Makeup": 0.04556046426296234,
          "High Cheekbones": 0.01603756472468376,
          "Male": 0.005428714212030172,
          "Mouth Slightly Open": 0.1485307663679123,
          "Mustache": 4.541295311355498e-06,
          "Narrow Eyes": 0.5362783074378967,
          "No Beard": 0.9996167421340942,
          "Oval Face": 0.21983110904693604,
          "Pale Skin": 0.02786986157298088,
          "Pointy Nose": 0.05155074968934059,
          "Receding Hairline": 0.15994258224964142,
          "Rosy Cheeks": 0.0003794469521380961,
          "Sideburns": 3.0088804123806767e-05,
          "Smiling": 0.003080558031797409,
          "Straight Hair": 0.4286966919898987,
          "Wavy Hair": 0.03330668807029724,
          "Wearing Earrings": 0.03306646645069122,
          "Wearing Hat": 9.143137140199542e-05,
          "Wearing Lipstick": 0.07133150845766068,
          "Wearing Necklace": 0.021567827090620995,
          "Wearing Necktie": 0.00010794967238325626,
          "Young": 0.9976293444633484
        },
        "age": [
          0.8029531240463257,
          0.9954981803894043,
          0.6812718510627747,
          0.019906247034668922,
          0.011274107731878757,
          0.0001863449433585629,
          3.943829869967885e-05,
          1.1559301128727384e-05
        ],
        "race": [
          0.9998992681503296,
          0.0001731959928292781,
          0.5674434304237366,
          0.0026808222755789757,
          0.03562126308679581
        ],
        "gender": [
          0.014399136416614056,
          0.9861838221549988
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 2.4771992457317538e-06,
          "disgust": 4.4636254040137475e-14,
          "fear": 5.324900520520259e-08,
          "happy": 0.008919289393816143,
          "sad": 0.05118090775795281,
          "surprise": 4.0786913776957867e-10,
          "neutral": 99.9398946762085
        },
        "dominant_emotion": "neutral",
        "region": {
          "x": 0,
          "y": 0,
          "w": 294,
          "h": 380,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 24,
        "gender": {
          "Woman": 99.41205382347107,
          "Man": 0.5879483185708523
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 2.4556609190540257e-06,
          "indian": 1.4687999261298046e-06,
          "black": 2.207531379916361e-09,
          "white": 99.98557567596436,
          "middle eastern": 0.005683980998583138,
          "latino hispanic": 0.00873482131282799
        },
        "dominant_race": "white"
      }
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.1807510256767273,
        0.15896619856357574,
        0.6426462531089783,
        0.612978458404541
      ],
      [
        0.39854806661605835,
        0.3131081461906433,
        0.9993806481361389,
        0.9983499646186829
      ]
    ],
    "face_boxes": [
      [
        0.32958465814590454,
        0.20934553444385529,
        0.5117393136024475,
        0.34155187010765076
      ],
      [
        0.5898063778877258,
        0.38786187767982483,
        0.7093296051025391,
        0.5203732252120972
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.8375342890602556,
            0.552887864112854
          ],
          [
            0.7518360303672892,
            0.5372070757548014
          ],
          [
            0.6482009268316086,
            0.5999302291870117
          ],
          [
            0.5027131853295957,
            0.6044104544321695
          ],
          [
            0.923232547753222,
            0.5685686524709066
          ],
          [
            0.7279202372436704,
            0.6503327631950379
          ],
          [
            0.5326079267341189,
            0.6301717495918274
          ],
          [
            0.7657869096893999,
            0.8172211535771687
          ],
          [
            0.40705001283512143,
            0.8161010972658794
          ],
          [
            0.5565237198577375,
            0.9684287556012471
          ],
          [
            0.9092816684311112,
            0.8553030681610108
          ],
          [
            0.45488159908235837,
            0.8788242506980896
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.606348288865276,
            0.4408822329839071
          ],
          [
            0.6163132026667837,
            0.44424240191777553
          ],
          [
            0.7358921682848765,
            0.4532028524080912
          ],
          [
            0.7119763751612581,
            0.46328335920969643
          ]
        ],
        "dw_hand_1": [
          [
            0.5306149439738173,
            0.6290516932805381
          ],
          [
            0.5346009094944204,
            0.6167310738563537
          ],
          [
            0.5326079267341189,
            0.6021703418095908
          ],
          [
            0.5166640646517064,
            0.5999302291870117
          ],
          [
            0.5086921336105001,
            0.6021703418095908
          ],
          [
            0.4827833577265803,
            0.6021703418095908
          ],
          [
            0.4787973922059771,
            0.6021703418095908
          ],
          [
            0.4847763404868818,
            0.612250848611196
          ],
          [
            0.5007202025692942,
            0.617851130167643
          ],
          [
            0.46883247840446934,
            0.6133709049224854
          ],
          [
            0.46484651288386636,
            0.6167310738563537
          ],
          [
            0.4768044094456755,
            0.6256915243466696
          ],
          [
            0.4967342370486911,
            0.6301717495918274
          ],
          [
            0.46285353012356467,
            0.6256915243466696
          ],
          [
            0.45687458184266005,
            0.6312918059031167
          ],
          [
            0.4668394956441679,
            0.6357720311482749
          ],
          [
            0.4827833577265803,
            0.6391322000821433
          ],
          [
            0.4608605473632632,
            0.6380121437708536
          ],
          [
            0.4528886163220569,
            0.6447324816385903
          ],
          [
            0.4588675646029615,
            0.6492127068837485
          ],
          [
            0.46883247840446934,
            0.6503327631950379
          ]
        ],
        "dw_hand_2": [
          [
            0.49872721980899254,
            0.6167310738563537
          ],
          [
            0.5007202025692942,
            0.6055305107434592
          ],
          [
            0.5047061680898972,
            0.5932098913192749
          ],
          [
            0.5027131853295957,
            0.590969778696696
          ],
          [
            0.4967342370486911,
            0.590969778696696
          ],
          [
            0.46285353012356467,
            0.5842494408289591
          ],
          [
            0.45089563356175544,
            0.5842494408289591
          ],
          [
            0.45687458184266005,
            0.5965700602531433
          ],
          [
            0.4668394956441679,
            0.6077706233660378
          ],
          [
            0.4429237025205493,
            0.5920898350079855
          ],
          [
            0.42897282319843855,
            0.5943299476305642
          ],
          [
            0.44491668528085077,
            0.6088906796773276
          ],
          [
            0.4588675646029615,
            0.617851130167643
          ],
          [
            0.42897282319843855,
            0.6021703418095908
          ],
          [
            0.41701492663662904,
            0.6055305107434592
          ],
          [
            0.4329587887190415,
            0.6156110175450644
          ],
          [
            0.45089563356175544,
            0.6245714680353799
          ],
          [
            0.41900790939693056,
            0.6144909612337747
          ],
          [
            0.4130289611160261,
            0.6167310738563537
          ],
          [
            0.4249868576778354,
            0.6223313554128013
          ],
          [
            0.43694475423964446,
            0.6290516932805381
          ]
        ],
        "dw_face": [
          [
            0.6003693405843714,
            0.44424240191777553
          ],
          [
            0.6023623233446729,
            0.45432290871938075
          ],
          [
            0.606348288865276,
            0.46440341552098596
          ],
          [
            0.606348288865276,
            0.47336386601130165
          ],
          [
            0.6103342543858791,
            0.48344437281290686
          ],
          [
            0.6183061854270854,
            0.4935248796145121
          ],
          [
            0.6282710992285929,
            0.5013652737935385
          ],
          [
            0.6342500475094976,
            0.5103257242838541
          ],
          [
            0.6482009268316086,
            0.5125658369064331
          ],
          [
            0.6621518061537195,
            0.5080856116612753
          ],
          [
            0.6721167199552271,
            0.5024853301048279
          ],
          [
            0.6820816337567347,
            0.4946449359258016
          ],
          [
            0.6860675992773381,
            0.4868045417467753
          ],
          [
            0.690053564797941,
            0.47672403494517007
          ],
          [
            0.690053564797941,
            0.4677635844548544
          ],
          [
            0.690053564797941,
            0.4588031339645386
          ],
          [
            0.690053564797941,
            0.4487226271629334
          ],
          [
            0.5983763578240697,
            0.43528195142745973
          ],
          [
            0.5983763578240697,
            0.43640200773874926
          ],
          [
            0.5983763578240697,
            0.43528195142745973
          ],
          [
            0.6003693405843714,
            0.43416189511617015
          ],
          [
            0.6003693405843714,
            0.43416189511617015
          ],
          [
            0.6023623233446729,
            0.43528195142745973
          ],
          [
            0.606348288865276,
            0.43528195142745973
          ],
          [
            0.6123272371461808,
            0.43640200773874926
          ],
          [
            0.6183061854270854,
            0.4386421203613281
          ],
          [
            0.6222921509476885,
            0.4408822329839071
          ],
          [
            0.6043553061049746,
            0.44536245822906495
          ],
          [
            0.6003693405843714,
            0.4509627397855123
          ],
          [
            0.5943903923034668,
            0.45544296503067017
          ],
          [
            0.5904044267828639,
            0.46104324658711754
          ],
          [
            0.5963833750637685,
            0.4655234718322754
          ],
          [
            0.6023623233446729,
            0.4677635844548544
          ],
          [
            0.606348288865276,
            0.4677635844548544
          ],
          [
            0.6103342543858791,
            0.4688836407661438
          ],
          [
            0.6123272371461808,
            0.4677635844548544
          ],
          [
            0.6023623233446729,
            0.44536245822906495
          ],
          [
            0.6023623233446729,
            0.44536245822906495
          ],
          [
            0.6023623233446729,
            0.44536245822906495
          ],
          [
            0.6023623233446729,
            0.44424240191777553
          ],
          [
            0.6023623233446729,
            0.44424240191777553
          ],
          [
            0.6023623233446729,
            0.44424240191777553
          ],
          [
            0.6103342543858791,
            0.44648251454035437
          ],
          [
            0.6123272371461808,
            0.44648251454035437
          ],
          [
            0.6163132026667837,
            0.4476025708516439
          ],
          [
            0.6183061854270854,
            0.4476025708516439
          ],
          [
            0.6163132026667837,
            0.4487226271629334
          ],
          [
            0.6123272371461808,
            0.4487226271629334
          ],
          [
            0.6183061854270854,
            0.4868045417467753
          ],
          [
            0.6123272371461808,
            0.4845644291241964
          ],
          [
            0.6103342543858791,
            0.48008420387903844
          ],
          [
            0.6103342543858791,
            0.48008420387903844
          ],
          [
            0.6123272371461808,
            0.48008420387903844
          ],
          [
            0.6202991681873868,
            0.48344437281290686
          ],
          [
            0.6262781164682917,
            0.4868045417467753
          ],
          [
            0.6262781164682917,
            0.49016471068064366
          ],
          [
            0.6262781164682917,
            0.49240482330322266
          ],
          [
            0.62428513370799,
            0.4935248796145121
          ],
          [
            0.6202991681873868,
            0.49128476699193324
          ],
          [
            0.6202991681873868,
            0.48904465436935424
          ],
          [
            0.6183061854270854,
            0.4868045417467753
          ],
          [
            0.6163132026667837,
            0.4845644291241964
          ],
          [
            0.6163132026667837,
            0.48344437281290686
          ],
          [
            0.6222921509476885,
            0.4845644291241964
          ],
          [
            0.6262781164682917,
            0.4868045417467753
          ],
          [
            0.62428513370799,
            0.48904465436935424
          ],
          [
            0.6222921509476885,
            0.49016471068064366
          ],
          [
            0.6202991681873868,
            0.48904465436935424
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      },
      {
        "dw_body": [
          [
            0.41823264017860234,
            0.28975752626359463
          ],
          [
            0.44733640726562923,
            0.4022072063460946
          ],
          [
            0.2605872351238736,
            0.40970385168492796
          ],
          [
            0.23633409588468457,
            0.5909863662421704
          ],
          [
            0.33092133891752185,
            0.5105678071528673
          ],
          [
            0.6340855794073849,
            0.39471056100726126
          ],
          [
            0.6607640325704928,
            0.560999784886837
          ],
          [
            0.5443489642223853,
            0.46013582941889764
          ],
          [
            0.33092133891752185,
            0.6714049253314733
          ],
          [
            0.21693158449333333,
            0.7790840129256249
          ],
          [
            0.2993922579065761,
            0.9671816596090793
          ],
          [
            0.5613261616898177,
            0.6700418989062309
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.33092133891752185,
            0.9644556067585945
          ],
          [
            0.3721516756241432,
            0.2693121298849583
          ],
          [
            0.4570376629613048,
            0.26249699775874613
          ],
          [
            0.33092133891752185,
            0.27476423558592794
          ],
          [
            0.5225211389071153,
            0.2597709449082613
          ]
        ],
        "dw_hand_1": [
          [
            0.5394983363745476,
            0.46286188226938246
          ],
          [
            0.5128198832114396,
            0.4424164858907461
          ],
          [
            0.4885667439722506,
            0.4192450366616249
          ],
          [
            0.4618882908091426,
            0.4056147724092007
          ],
          [
            0.43035920979819686,
            0.39743661385774615
          ],
          [
            0.505543941439683,
            0.39879964028298853
          ],
          [
            0.47158954650481827,
            0.38789542888104916
          ],
          [
            0.4352098376460347,
            0.38789542888104916
          ],
          [
            0.40853138448292675,
            0.390621481731534
          ],
          [
            0.5079692553636018,
            0.40697779883444307
          ],
          [
            0.46431360473306155,
            0.39743661385774615
          ],
          [
            0.427933895874278,
            0.4015256931334734
          ],
          [
            0.40368075663508896,
            0.4083408252596855
          ],
          [
            0.505543941439683,
            0.4178820102363825
          ],
          [
            0.46431360473306155,
            0.41106687811017034
          ],
          [
            0.4327845237221158,
            0.41651898381114005
          ],
          [
            0.4158073262546835,
            0.42197108951210976
          ],
          [
            0.5006933135918451,
            0.4301492480635643
          ],
          [
            0.4667389186569804,
            0.42606016878783703
          ],
          [
            0.44733640726562923,
            0.4274231952130795
          ],
          [
            0.4352098376460347,
            0.43151227448880675
          ]
        ],
        "dw_hand_2": [
          [
            0.34547322246103523,
            0.5105678071528673
          ],
          [
            0.35759979208062975,
            0.4860333314985037
          ],
          [
            0.3600251060045487,
            0.4614988558441401
          ],
          [
            0.3721516756241432,
            0.44514253874123094
          ],
          [
            0.3867035591676566,
            0.43151227448880675
          ],
          [
            0.3333466528414407,
            0.4465055651664734
          ],
          [
            0.35274916423279196,
            0.435601353764534
          ],
          [
            0.377002303471981,
            0.43151227448880675
          ],
          [
            0.40125544271117003,
            0.4301492480635643
          ],
          [
            0.3284960249936029,
            0.4546837237179279
          ],
          [
            0.3551744781567109,
            0.44377951231598856
          ],
          [
            0.3842782452437377,
            0.44105345946550367
          ],
          [
            0.40853138448292675,
            0.4424164858907461
          ],
          [
            0.3284960249936029,
            0.46695096154510973
          ],
          [
            0.35759979208062975,
            0.4574097765684128
          ],
          [
            0.3867035591676566,
            0.45604675014317037
          ],
          [
            0.4061060705590078,
            0.4574097765684128
          ],
          [
            0.33577196676535964,
            0.480581225797534
          ],
          [
            0.35759979208062975,
            0.47240306724607944
          ],
          [
            0.3794276173958999,
            0.471040040820837
          ],
          [
            0.3939795009394133,
            0.4696770143955946
          ]
        ],
        "dw_face": [
          [
            0.33092133891752185,
            0.2638600241839886
          ],
          [
            0.33577196676535964,
            0.2788533148616552
          ],
          [
            0.34304790853711636,
            0.29248357911407946
          ],
          [
            0.3551744781567109,
            0.3061138433665037
          ],
          [
            0.3648757338523865,
            0.3183810811936855
          ],
          [
            0.3818529313198188,
            0.33064831902086733
          ],
          [
            0.3988301287872511,
            0.34155253042280675
          ],
          [
            0.42065795410252127,
            0.34836766254901885
          ],
          [
            0.4424857794177914,
            0.34836766254901885
          ],
          [
            0.46431360473306155,
            0.34291555684804914
          ],
          [
            0.4837161161244128,
            0.3320113454461098
          ],
          [
            0.4958426857440073,
            0.31974410761892796
          ],
          [
            0.505543941439683,
            0.3061138433665037
          ],
          [
            0.5103945692875207,
            0.2911205526888371
          ],
          [
            0.5128198832114396,
            0.2774902884364128
          ],
          [
            0.5128198832114396,
            0.26249699775874613
          ],
          [
            0.5103945692875207,
            0.2475037070810795
          ],
          [
            0.34062259461319744,
            0.2597709449082613
          ],
          [
            0.35274916423279196,
            0.2570448920577765
          ],
          [
            0.3648757338523865,
            0.2570448920577765
          ],
          [
            0.377002303471981,
            0.2570448920577765
          ],
          [
            0.39155418701549444,
            0.2570448920577765
          ],
          [
            0.427933895874278,
            0.2529558127820492
          ],
          [
            0.4424857794177914,
            0.2502297599315643
          ],
          [
            0.4570376629613048,
            0.2475037070810795
          ],
          [
            0.46916423258089934,
            0.24614068065583705
          ],
          [
            0.4837161161244128,
            0.24614068065583705
          ],
          [
            0.41338201233076455,
            0.26794910345971584
          ],
          [
            0.41338201233076455,
            0.2761272620111704
          ],
          [
            0.4158073262546835,
            0.2843054205626249
          ],
          [
            0.4158073262546835,
            0.2938466055393219
          ],
          [
            0.40125544271117003,
            0.300661737665534
          ],
          [
            0.4109566984068456,
            0.300661737665534
          ],
          [
            0.42065795410252127,
            0.300661737665534
          ],
          [
            0.43035920979819686,
            0.2992987112402916
          ],
          [
            0.4400604654938725,
            0.2979356848150492
          ],
          [
            0.35759979208062975,
            0.27340120916068555
          ],
          [
            0.3673010477763054,
            0.2720381827354431
          ],
          [
            0.3794276173958999,
            0.27067515631020067
          ],
          [
            0.39155418701549444,
            0.2693121298849583
          ],
          [
            0.3794276173958999,
            0.2720381827354431
          ],
          [
            0.3673010477763054,
            0.27340120916068555
          ],
          [
            0.4376351515699536,
            0.265223050609231
          ],
          [
            0.4497617211895481,
            0.265223050609231
          ],
          [
            0.4618882908091426,
            0.2638600241839886
          ],
          [
            0.47401486042873714,
            0.26249699775874613
          ],
          [
            0.4618882908091426,
            0.2638600241839886
          ],
          [
            0.4497617211895481,
            0.265223050609231
          ],
          [
            0.39640481486333223,
            0.31974410761892796
          ],
          [
            0.40368075663508896,
            0.31429200191795825
          ],
          [
            0.4158073262546835,
            0.310202922642231
          ],
          [
            0.4230832680264402,
            0.310202922642231
          ],
          [
            0.43035920979819686,
            0.310202922642231
          ],
          [
            0.4449110933417103,
            0.310202922642231
          ],
          [
            0.45946297688522375,
            0.3156550283432007
          ],
          [
            0.4546123490373859,
            0.3224701604694128
          ],
          [
            0.4424857794177914,
            0.32928529259562495
          ],
          [
            0.43035920979819686,
            0.3333743718713522
          ],
          [
            0.4158073262546835,
            0.3320113454461098
          ],
          [
            0.4061060705590078,
            0.32655923974514006
          ],
          [
            0.3988301287872511,
            0.31974410761892796
          ],
          [
            0.4109566984068456,
            0.3156550283432007
          ],
          [
            0.4230832680264402,
            0.31429200191795825
          ],
          [
            0.4400604654938725,
            0.3129289754927158
          ],
          [
            0.4570376629613048,
            0.3156550283432007
          ],
          [
            0.4449110933417103,
            0.3224701604694128
          ],
          [
            0.427933895874278,
            0.32655923974514006
          ],
          [
            0.41338201233076455,
            0.3251962133198977
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            0.30181757183049496,
            0.9903531088382006
          ],
          [
            0.2557366072760358,
            0.9903531088382006
          ],
          [
            0.3139441414500895,
            0.9753598181605339
          ]
        ]
      }
    ]
  },
  "new_filename": "007901",
  "objects": [
    {
      "box": [
        0.00046728551387786865,
        0.5959575176239014,
        0.4169078469276428,
        0.6444083452224731
      ],
      "name": "notebook",
      "possible_names": [
        "notebook"
      ],
      "deleted": true
    },
    {
      "box": [
        0.315188467502594,
        0.6253325939178467,
        0.490001380443573,
        0.6631259918212891
      ],
      "name": "notebook",
      "possible_names": [
        "notebook"
      ],
      "deleted": false
    },
    {
      "box": [
        0.5173348784446716,
        0.5691900849342346,
        0.584194004535675,
        0.5951847434043884
      ],
      "name": "pencil",
      "possible_names": [
        "pencil"
      ]
    }
  ],
  "mask_file": "./person_labeling/./007901.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A warmly lit indoor setting with wooden furniture and greenery features a musical lesson with sheet music on the table and a recorder being played creating an intimate educational atmosphere",
  "overall_past": "Before the current scene, the individual playing the recorder likely set up the learning environment by arranging the sheet music on the table, ensuring the recorder was properly assembled and tuned, and perhaps explaining the basics of the piece they were about to play. They may have also engaged the learner in a brief conversation about musical notation or breathing techniques, preparing them mentally and physically for the lesson. This preparation created a calm, focused atmosphere conducive to learning, setting the stage for the current moment of active demonstration and attentive observation.",
  "overall_past_clean": "The individual established a structured and intentional learning space by organizing the necessary materials, calibrating the instrument for optimal performance, and initiating a preparatory dialogue centered on foundational musical concepts and physical readiness, thereby cultivating a mindset of concentration and readiness for instruction.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual playing the recorder is likely to pause and offer feedback or guidance to the learner, perhaps pointing out a specific note or technique that needs improvement. The learner may then attempt to replicate the correct sound, practicing with renewed focus, while the instructor continues to support and correct their form, reinforcing the learning process in a collaborative and nurturing environment.",
  "overall_future_clean": "The learner adjusts their approach based on the feedback, refining their execution with deliberate precision, while the instructor maintains steady guidance, ensuring each correction strengthens the developing skill through consistent, focused practice.",
  "future_scene_ok": true
}