{
  "image_path": "./ref_datasets/hico_det/images/train/train_00018567.jpg",
  "image_id": "train_00018567",
  "width": 480,
  "height": 640,
  "split": "train",
  "source": "zhimeng/hico_det",
  "dataset_index": 18567,
  "annotations": {
    "objects": "[{'id': 377, 'bbox_human': [94, 427, 1, 437], 'bbox_object': [186, 347, 281, 334], 'connection': 1, 'invis': 0}, {'id': 378, 'bbox_human': [90, 431, 8, 445], 'bbox_object': [178, 353, 275, 339], 'connection': 1, 'invis': 0}, {'id': 381, 'bbox_human': [94, 427, 4, 438], 'bbox_object': [185, 349, 279, 337], 'connection': 1, 'invis': 0}]",
    "positive_captions": "[('knife', 'cut_with'), ('knife', 'hold'), ('knife', 'wield')]",
    "negative_captions": "[('knife', 'wash'), ('knife', 'lick'), ('knife', 'no_interaction')]",
    "ambiguous_captions": "[('knife', 'stick')]",
    "positive_objects": "[376, 377, 380]",
    "negative_objects": "[379, 381, 382]",
    "ambiguous_objects": "[378]",
    "size": "[480, 640, 3]"
  },
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": true,
        "age": "adult",
        "gender": "male",
        "emotion": "unknown",
        "clothing_description": "The person is wearing a red shirt and a white apron. They are also wearing glasses.",
        "clothing": [
          {
            "possible_names": [
              "glasses"
            ],
            "name": "glasses",
            "type": "accessory",
            "color": [
              "clear",
              "black"
            ]
          },
          {
            "possible_names": [
              "shirt"
            ],
            "name": "shirt",
            "type": "top",
            "color": [
              "red"
            ]
          },
          {
            "possible_names": [
              "apron"
            ],
            "name": "apron",
            "type": "other",
            "color": [
              "white"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "knife"
            ],
            "name": "knife",
            "position": "hand"
          },
          {
            "standalone": false,
            "possible_names": [
              "turkey"
            ],
            "name": "turkey",
            "position": "body"
          }
        ],
        "description": "The person is an adult male in the background. He is wearing glasses, a red shirt, and a white apron. His emotion appears to be neutral. He is holding a knife in one hand and has a turkey on the counter in front of him.",
        "blurry": true,
        "face_seen": false,
        "emotion_description": "The person's face is blurred, making it impossible to determine their emotional state.",
        "meaningful": true,
        "story": "A man appears to be preparing a turkey for cooking, possibly for a special meal or holiday dinner. He is focused on the task at hand, using a large knife to cut the bird. The setting suggests a home kitchen environment.",
        "race": "unknown",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is focused on preparing a whole chicken for cooking, using a large knife to cut through it while standing at a kitchen counter. Wearing an apron over a red shirt suggests they are engaged in a culinary task, possibly preparing a meal for family or friends. The presence of a wine bottle nearby indicates that this could be part of a festive or special occasion dinner preparation. Their concentration on the task shows a level of seriousness and care in ensuring the chicken is properly prepared, which might be driven by a desire to create a delicious and well-cooked dish.",
        "intention": "The intention is to meticulously prepare a whole chicken with care and precision to ensure a delicious and impressive meal for a special occasion",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.6970570919769151,
            0.03105168087141854
          ],
          [
            0.6754033751430966,
            0.04529916388647897
          ],
          [
            0.6569356123606364,
            0.07766607488904681
          ],
          [
            0.6388270125502632,
            0.10627732617514474
          ],
          [
            0.6260497020468826,
            0.13112639359065464
          ],
          [
            0.6212738398994718,
            0.16683511734008788
          ],
          [
            0.6188043090559188,
            0.19454054832458495
          ],
          [
            0.6270076745677563,
            0.22447261129106794
          ],
          [
            0.6529683395155839,
            0.24154178074428012
          ],
          [
            0.6845248477799551,
            0.25739103044782363
          ],
          [
            0.7181542768364861,
            0.2572165284837995
          ],
          [
            0.7415997329921951,
            0.25142555236816405
          ],
          [
            0.7619894681941894,
            0.24355639048985073
          ],
          [
            0.7850702250287647,
            0.22767697743007115
          ],
          [
            0.8051738991623834,
            0.2094207899911063
          ],
          [
            0.8298558761676152,
            0.20322358948843816
          ],
          [
            0.8674575804244905,
            0.1901940209524972
          ],
          [
            0.7103848886631784,
            0.09608710833958219
          ],
          [
            0.7226336619683674,
            0.1065669127873012
          ],
          [
            0.7376733689790681,
            0.12388115950993131
          ],
          [
            0.7478517932551247,
            0.13618008409227644
          ],
          [
            0.7606199031074842,
            0.14754046031406948
          ],
          [
            0.793907465679305,
            0.1728645597185407
          ],
          [
            0.8108345030319123,
            0.1785938603537423
          ],
          [
            0.8249366274901799,
            0.1901482445853097
          ],
          [
            0.8338762721845082,
            0.19495553970336915
          ],
          [
            0.8386727636768704,
            0.20088860648018975
          ],
          [
            0.7637653718392055,
            0.1721402508871896
          ],
          [
            0.7501309522560665,
            0.1822117056165423
          ],
          [
            0.7356244410787309,
            0.19263625144958496
          ],
          [
            0.7234598178239097,
            0.205794586454119
          ],
          [
            0.6932297684607052,
            0.18144621849060058
          ],
          [
            0.7018632444597426,
            0.19386111668178013
          ],
          [
            0.7143226322673616,
            0.20444714682442805
          ],
          [
            0.7283730882264319,
            0.21061451094491143
          ],
          [
            0.7397068294740858,
            0.21237855638776507
          ],
          [
            0.7035941330449922,
            0.1146627800805228
          ],
          [
            0.7063701272010803,
            0.12300933429173062
          ],
          [
            0.7282548362300509,
            0.14156683853694368
          ],
          [
            0.7373344732182366,
            0.14740145547049385
          ],
          [
            0.7217845505192166,
            0.1412142072405134
          ],
          [
            0.7081740440357298,
            0.12724659102303643
          ],
          [
            0.7848617587770735,
            0.18200221742902484
          ],
          [
            0.7903253864674341,
            0.18976909773690362
          ],
          [
            0.8036735362949826,
            0.19996931893484932
          ],
          [
            0.8046258374339058,
            0.20455678531101773
          ],
          [
            0.7999319709482647,
            0.20188943317958286
          ],
          [
            0.7904509179648899,
            0.18918003354753768
          ],
          [
            0.6623727858776137,
            0.19701263563973564
          ],
          [
            0.675619808336099,
            0.20164734976632256
          ],
          [
            0.6936110891046978,
            0.20665101323808943
          ],
          [
            0.7023094422760464,
            0.21501408985682896
          ],
          [
            0.7055937493840854,
            0.21614499092102052
          ],
          [
            0.7185934283903668,
            0.22436088834490095
          ],
          [
            0.7185087504841032,
            0.23565303938729426
          ],
          [
            0.7005582619281043,
            0.2321636949266706
          ],
          [
            0.6859346526719274,
            0.2272711617606027
          ],
          [
            0.6820103018766358,
            0.22269272804260254
          ],
          [
            0.674794745019504,
            0.2121360642569406
          ],
          [
            0.6678016978360357,
            0.20611042295183454
          ],
          [
            0.6674647232251508,
            0.19676546369280135
          ],
          [
            0.6778176407019297,
            0.20948771749223982
          ],
          [
            0.6974705627276784,
            0.214508547101702
          ],
          [
            0.707897202031953,
            0.2244405473981585
          ],
          [
            0.7161920277845293,
            0.23567398616245816
          ],
          [
            0.7008764485518137,
            0.22334612437656948
          ],
          [
            0.6930236468712488,
            0.21618847846984862
          ],
          [
            0.6763557131091754,
            0.2055694035121373
          ]
        ],
        "visibility": [
          0.9999885559082031,
          0.19387584924697876,
          0.9851526021957397,
          3.108169277510342e-10,
          0.03928985074162483,
          0.9999737739562988,
          3.939837805365344e-15,
          2.7210369374364163e-11,
          0.6240604519844055,
          1.528344364487566e-05,
          8.576334948884323e-06,
          0.7708868384361267,
          0.9942740797996521,
          1.5294495824491605e-05,
          0.9784731864929199,
          2.3554573402861934e-08,
          0.9947336912155151,
          0.9999969005584717,
          1.4503733297374123e-14,
          0.38184964656829834,
          1.6618581956421707e-19,
          2.5577720497160783e-11,
          1.9016414398720372e-07,
          0.4720388948917389,
          0.07000095397233963,
          0.9997628331184387,
          0.654109537601471,
          0.9999924898147583,
          8.99993974599056e-05
        ],
        "headpose": {
          "pitch": -38.18977672517028,
          "yaw": 15.95079519327736,
          "roll": 35.59068484030533
        },
        "attributes": {
          "5 oClock Shadow": 0.030477816238999367,
          "Arched Eyebrows": 0.002729206345975399,
          "Attractive": 0.029337799176573753,
          "Bags Under Eyes": 0.03875581920146942,
          "Bald": 0.0005135336541570723,
          "Bangs": 0.0020412702579051256,
          "Big Lips": 0.02614240162074566,
          "Big Nose": 0.12661884725093842,
          "Black Hair": 0.05703375115990639,
          "Blond Hair": 0.006807886064052582,
          "Blurry": 0.3104856014251709,
          "Brown Hair": 0.03127116337418556,
          "Bushy Eyebrows": 0.004365033470094204,
          "Chubby": 0.011731822974979877,
          "Double Chin": 0.0006601457134820521,
          "Eyeglasses": 0.02818235754966736,
          "Goatee": 0.0036354062613099813,
          "Gray Hair": 0.004271277226507664,
          "Heavy Makeup": 0.0009572478593327105,
          "High Cheekbones": 0.015114875510334969,
          "Male": 0.7723302841186523,
          "Mouth Slightly Open": 0.0021217786706984043,
          "Mustache": 0.010163645260035992,
          "Narrow Eyes": 0.16597573459148407,
          "No Beard": 0.741190493106842,
          "Oval Face": 0.019584523513913155,
          "Pale Skin": 0.0002839740482158959,
          "Pointy Nose": 0.09158248454332352,
          "Receding Hairline": 0.08898568153381348,
          "Rosy Cheeks": 7.418071618303657e-05,
          "Sideburns": 0.015618923120200634,
          "Smiling": 0.0019284436712041497,
          "Straight Hair": 0.43744537234306335,
          "Wavy Hair": 0.009561181999742985,
          "Wearing Earrings": 0.016194771975278854,
          "Wearing Hat": 0.0010331764351576567,
          "Wearing Lipstick": 0.000877662212587893,
          "Wearing Necklace": 0.0278797410428524,
          "Wearing Necktie": 0.0011788186384364963,
          "Young": 0.7246848344802856
        },
        "age": [
          0.001539125805720687,
          0.005237931851297617,
          0.28206443786621094,
          0.24064937233924866,
          0.9675602316856384,
          0.27482685446739197,
          0.04179022088646889,
          0.0007919574272818863
        ],
        "race": [
          0.14921239018440247,
          0.6584556698799133,
          0.9412004351615906,
          0.1549166589975357,
          0.38537538051605225
        ],
        "gender": [
          0.3123978078365326,
          0.6951989531517029
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 6.139634922146797,
          "disgust": 1.2784954606104293e-05,
          "fear": 16.438637673854828,
          "happy": 0.3169216215610504,
          "sad": 20.88339626789093,
          "surprise": 0.11320989578962326,
          "neutral": 56.10818266868591
        },
        "dominant_emotion": "neutral",
        "region": {
          "x": 0,
          "y": 0,
          "w": 172,
          "h": 191,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 30,
        "gender": {
          "Woman": 23.611772060394287,
          "Man": 76.38823390007019
        },
        "dominant_gender": "Man",
        "race": {
          "asian": 30.74134886264801,
          "indian": 9.873025864362717,
          "black": 8.285922557115555,
          "white": 17.8744837641716,
          "middle eastern": 12.727545201778412,
          "latino hispanic": 20.497673749923706
        },
        "dominant_race": "asian"
      },
      "hoi": [
        {
          "relationship": {
            "action": [
              [
                "hand",
                "cut with"
              ],
              [
                "hand",
                "hold"
              ],
              [
                "hand",
                "wield"
              ]
            ],
            "negative_action": [
              "wash",
              "lick",
              "no interaction"
            ],
            "position": "hand"
          },
          "object": 0
        }
      ]
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.19756704568862915,
        0.0013661384582519531,
        0.8922744393348694,
        0.6863480806350708
      ]
    ],
    "face_boxes": [
      [
        0.633745551109314,
        0.03864474222064018,
        0.8750690221786499,
        0.248135045170784
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            0.6247888760434257,
            0.2035250275499291
          ],
          [
            0.44932162441589213,
            0.15222316160798072
          ],
          [
            0.2396531288270597,
            0.3328949503600597
          ],
          [
            0.4314774971317362,
            0.42211558678083944
          ],
          [
            0.8002561276709592,
            0.2548268934918775
          ],
          [
            0.7660548837096604,
            0.4488817777070733
          ],
          [
            0.6946783745730365,
            0.5180277709331776
          ],
          [
            0.4180944016686193,
            0.6250925346381135
          ],
          [
            0.38538016831433336,
            0.7700760688218806
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.6307369184714776,
            0.6317840823696721
          ],
          [
            0.6753472366818675,
            0.7700760688218806
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.7318536397483615,
            0.15556893547375994
          ],
          [
            0.7943080852429072,
            0.1801046104894744
          ],
          [
            0.6575031093977117,
            0.08084665247135688
          ],
          [
            0.8329703610252451,
            0.16895203093687697
          ]
        ],
        "dw_hand_1": [
          [
            0.6931913639660235,
            0.5157972550226583
          ],
          [
            0.6842693003239456,
            0.5191430288884373
          ],
          [
            0.6708862048608286,
            0.5180277709331776
          ],
          [
            0.6604771306117375,
            0.525834576619996
          ],
          [
            0.6545290881836856,
            0.5314108663962949
          ],
          [
            0.6961653851800494,
            0.529180350485775
          ],
          [
            0.6991394063940756,
            0.5414481879936326
          ],
          [
            0.6931913639660235,
            0.5369871561725934
          ],
          [
            0.6827822897169324,
            0.5325261243515544
          ],
          [
            0.6961653851800494,
            0.5414481879936326
          ],
          [
            0.6946783745730365,
            0.5548312834567495
          ],
          [
            0.6827822897169324,
            0.5537160255014897
          ],
          [
            0.6693991942538154,
            0.5492549936804505
          ],
          [
            0.6946783745730365,
            0.5492549936804505
          ],
          [
            0.6917043533590106,
            0.5592923152777882
          ],
          [
            0.6753472366818675,
            0.5581770573225285
          ],
          [
            0.6679121836468025,
            0.5570617993672689
          ],
          [
            0.6917043533590106,
            0.5559465414120092
          ],
          [
            0.6827822897169324,
            0.561522831188308
          ],
          [
            0.6768342472888804,
            0.5637533470988274
          ],
          [
            0.6708862048608286,
            0.5637533470988274
          ]
        ],
        "dw_hand_2": [
          [
            0.4389125501668012,
            0.4210003288255799
          ],
          [
            0.48054884716316504,
            0.42992239246765773
          ],
          [
            0.526646175980568,
            0.43772919815447586
          ],
          [
            0.5459773138717369,
            0.45557332543863194
          ],
          [
            0.5548993775138149,
            0.48010900045434635
          ],
          [
            0.5400292714436848,
            0.4366139401992162
          ],
          [
            0.5593604093348539,
            0.4578038413491513
          ],
          [
            0.5608474199418668,
            0.4823395163648658
          ],
          [
            0.5548993775138149,
            0.49906838569376194
          ],
          [
            0.5147500911244639,
            0.4455360038412942
          ],
          [
            0.5281331865875809,
            0.47787848454382675
          ],
          [
            0.529620197194594,
            0.4934920959174634
          ],
          [
            0.525159165373555,
            0.5001836436490218
          ],
          [
            0.48798390019822996,
            0.4544580674833722
          ],
          [
            0.50285400626836,
            0.48457003227538537
          ],
          [
            0.5043410168753729,
            0.4946073538727231
          ],
          [
            0.5013669956613469,
            0.4946073538727231
          ],
          [
            0.46270471987900913,
            0.46338013112545023
          ],
          [
            0.477574825949139,
            0.48457003227538537
          ],
          [
            0.4820358577701781,
            0.491261580006944
          ],
          [
            0.48352286837719105,
            0.4923768379622035
          ]
        ],
        "dw_face": [
          [
            0.6679121836468025,
            0.09980603771077261
          ],
          [
            0.6545290881836856,
            0.11318913317388954
          ],
          [
            0.6426330033275816,
            0.12880274454752608
          ],
          [
            0.6307369184714776,
            0.1444163559211625
          ],
          [
            0.6262758866504387,
            0.16226048320531844
          ],
          [
            0.6247888760434257,
            0.1801046104894744
          ],
          [
            0.6307369184714776,
            0.19794873777363042
          ],
          [
            0.6381719715065427,
            0.21467760710252656
          ],
          [
            0.6500680563626465,
            0.2291759605209033
          ],
          [
            0.6679121836468025,
            0.24144379802876043
          ],
          [
            0.6917043533590106,
            0.24367431393927994
          ],
          [
            0.7110354912501795,
            0.234752250297202
          ],
          [
            0.7318536397483615,
            0.225830186655124
          ],
          [
            0.7526717882465433,
            0.216908123013046
          ],
          [
            0.7734899367447253,
            0.20687080141570827
          ],
          [
            0.7913340640288813,
            0.19348770595259132
          ],
          [
            0.8076911807060242,
            0.1801046104894744
          ],
          [
            0.7154965230712184,
            0.13437903432382478
          ],
          [
            0.7303666291413483,
            0.1388400661448638
          ],
          [
            0.7437497246044652,
            0.14553161387642222
          ],
          [
            0.7556458094605693,
            0.15222316160798072
          ],
          [
            0.7660548837096604,
            0.16002996729479896
          ],
          [
            0.7868730322078422,
            0.17006728889213668
          ],
          [
            0.7943080852429072,
            0.17118254684739637
          ],
          [
            0.8017431382779722,
            0.17341306275791588
          ],
          [
            0.8106652019200501,
            0.17452832071317567
          ],
          [
            0.8151262337410892,
            0.1767588366236951
          ],
          [
            0.7690289049236863,
            0.17452832071317567
          ],
          [
            0.7615938518886213,
            0.1856809002657731
          ],
          [
            0.7526717882465433,
            0.19571822186311083
          ],
          [
            0.7452367352114784,
            0.20687080141570827
          ],
          [
            0.7140095124642054,
            0.19794873777363042
          ],
          [
            0.7214445654992704,
            0.20352502754992904
          ],
          [
            0.7288796185343354,
            0.20910131732622786
          ],
          [
            0.7378016821764135,
            0.21244709119200705
          ],
          [
            0.7467237458184913,
            0.21244709119200705
          ],
          [
            0.7169835336782313,
            0.14887738774220152
          ],
          [
            0.7259055973203095,
            0.15445367751850023
          ],
          [
            0.7363146715694003,
            0.15779945138427953
          ],
          [
            0.7452367352114784,
            0.16337574116057815
          ],
          [
            0.7333406503553744,
            0.16002996729479896
          ],
          [
            0.7244185867132965,
            0.15556893547375994
          ],
          [
            0.7794379791727774,
            0.17787409457895498
          ],
          [
            0.7868730322078422,
            0.1801046104894744
          ],
          [
            0.7928210746358942,
            0.18233512639999389
          ],
          [
            0.7972821064569331,
            0.1845656423105134
          ],
          [
            0.7913340640288813,
            0.1834503843552536
          ],
          [
            0.7853860216008293,
            0.1812198684447341
          ],
          [
            0.6827822897169324,
            0.20240976959466933
          ],
          [
            0.6991394063940756,
            0.20798605937096815
          ],
          [
            0.7140095124642054,
            0.21467760710252656
          ],
          [
            0.7184705442852445,
            0.216908123013046
          ],
          [
            0.7229315761062833,
            0.21802338096830587
          ],
          [
            0.7259055973203095,
            0.22136915483408498
          ],
          [
            0.7259055973203095,
            0.2235996707446045
          ],
          [
            0.7199575548922574,
            0.225830186655124
          ],
          [
            0.7125225018571925,
            0.2269454446103837
          ],
          [
            0.7050874488221275,
            0.2269454446103837
          ],
          [
            0.6946783745730365,
            0.2202538968788253
          ],
          [
            0.6872433215379715,
            0.21133183323674726
          ],
          [
            0.6842693003239456,
            0.20352502754992904
          ],
          [
            0.6991394063940756,
            0.21133183323674726
          ],
          [
            0.7140095124642054,
            0.21913863892356558
          ],
          [
            0.7184705442852445,
            0.22136915483408498
          ],
          [
            0.7244185867132965,
            0.2235996707446045
          ],
          [
            0.7184705442852445,
            0.22248441278934478
          ],
          [
            0.7125225018571925,
            0.2202538968788253
          ],
          [
            0.6976523957870626,
            0.21244709119200705
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "objects": [
    {
      "name": "knife",
      "possible_names": [
        "knife"
      ],
      "box": [
        0.3875,
        0.4390625,
        0.7229166666666667,
        0.521875
      ]
    },
    {
      "name": "knife",
      "possible_names": [
        "knife"
      ],
      "box": [
        0.37083333333333335,
        0.4296875,
        0.7354166666666667,
        0.5296875
      ]
    }
  ],
  "scene": "A kitchen scene with wooden cabinets and countertops features a large uncooked turkey being prepared on a cutting board alongside a bottle of wine and various kitchen tools suggesting a home cooking environment for a festive meal preparation",
  "overall_past": "Before the current scene, the individual likely selected and brought the whole chicken from the refrigerator, possibly after thawing it if it was frozen, and then placed it on the cutting board to begin preparation. They may have already gathered the necessary tools—such as the large knife, a cutting board, and kitchen utensils—while also opening the bottle of wine, perhaps to enjoy a small sip while cooking or to use in the recipe. The presence of wooden cabinets and countertops suggests a familiar, well-used kitchen, indicating this preparation is part of a routine or tradition, possibly for a holiday or family gathering. The focused expression and apron imply that the cooking process had already begun with intention and care, setting the stage for a special meal.",
  "overall_past_clean": "The individual had retrieved the chicken from the refrigerator, carefully handling it with deliberate intent, then proceeded to prepare the cooking space by arranging tools and opening a bottle of wine, all done with the quiet precision of a practiced ritual.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to season the chicken thoroughly, possibly using herbs, salt, and pepper, before placing it in the oven to roast. The presence of the wine bottle nearby suggests it may be used to baste the bird during cooking or to deglaze the pan later, enhancing the flavor. With focused attention and care, the next step would involve preparing the oven and setting a timer, ensuring the turkey is cooked to perfection for the festive meal.",
  "overall_future_clean": "The oven door slams shut with a decisive click, the dial spinning to the set temperature as the timer begins its steady countdown, the air already humming with the promise of golden skin and rich, savory aroma.",
  "future_scene_ok": true
}