{
  "image_path": "./ref_datasets/hico_det/images/test/test_00002288.jpg",
  "image_id": "test_00002288",
  "width": 640,
  "height": 428,
  "split": "test",
  "source": "zhimeng/hico_det",
  "dataset_index": 2288,
  "annotations": {
    "objects": "[{'id': 135, 'bbox_human': [369, 520, 233, 427], 'bbox_object': [2, 373, 94, 423], 'connection': 1, 'invis': 0}, {'id': 138, 'bbox_human': [370, 522, 233, 424], 'bbox_object': [1, 372, 87, 421], 'connection': 1, 'invis': 0}]",
    "positive_captions": "[('horse', 'kiss'), ('horse', 'pet')]",
    "negative_captions": "[('horse', 'feed'), ('horse', 'groom'), ('horse', 'hold'), ('horse', 'hug'), ('horse', 'jump'), ('horse', 'load'), ('horse', 'hop_on'), ('horse', 'race'), ('horse', 'ride'), ('horse', 'run'), ('horse', 'straddle'), ('horse', 'train'), ('horse', 'walk'), ('horse', 'wash'), ('horse', 'no_interaction')]",
    "ambiguous_captions": "[]",
    "positive_objects": "[134, 137]",
    "negative_objects": "[129, 130, 131, 132, 133, 135, 136, 138, 139, 140, 141, 142, 143, 144, 145]",
    "ambiguous_objects": "[]",
    "size": "[640, 428, 3]"
  },
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": 0,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "female",
        "emotion": "neutral",
        "clothing_description": "The person is wearing a gray hoodie.",
        "clothing": [
          {
            "possible_names": [
              "hoodie",
              "sweatshirt"
            ],
            "name": "hoodie",
            "type": "top",
            "color": [
              "gray"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "horse"
            ],
            "name": "horse",
            "position": "other"
          }
        ],
        "description": "The person is in the foreground, and appears to be an adult female. She is happy and wearing a gray hoodie. She is making physical contact with and appears to be interacting closely with a horse beside her, showing affection by bringing her face near the horse.",
        "blurry": false,
        "face_seen": true,
        "emotion_description": "The person appears to be calmly interacting with the horse, showing a gentle and composed demeanor.",
        "meaningful": true,
        "story": "A woman is enjoying a peaceful moment outdoors with two horses. She seems to have a close bond with the animals, as she is comfortably close to them, suggesting familiarity and trust. The setting implies a rural or farm environment where such interactions are common.",
        "race": "white",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is standing close to two horses, showing a gentle interaction as one horse nuzzles her face affectionately. Her body language suggests comfort and trust with the animals, indicating a likely bond or familiarity. She appears calm and content, possibly enjoying the moment of connection with the horse, which could be motivated by a love for animals or a desire for companionship. The setting seems peaceful, enhancing the serene atmosphere of this interaction.",
        "intention": "The intention is to connect with animals through gentle interaction fostering a sense of peace and mutual trust",
        "intention_ok": true
      },
      "facex_detailing": {
        "landmarks": [
          [
            0.5874262640518801,
            0.6035216379865945
          ],
          [
            0.5865874430962971,
            0.615134794339637
          ],
          [
            0.58329995402268,
            0.6337099005287894
          ],
          [
            0.5797802226884025,
            0.6498763971876239
          ],
          [
            0.577415699219065,
            0.6644985774489685
          ],
          [
            0.576630031264254,
            0.6838702276965803
          ],
          [
            0.5768362828397324,
            0.698899150690504
          ],
          [
            0.5770291763756956,
            0.7119482878212616
          ],
          [
            0.5825989018593516,
            0.7273431352684113
          ],
          [
            0.5933914339968136,
            0.7376178377301734
          ],
          [
            0.6046241670846939,
            0.7356117004068576
          ],
          [
            0.619373447660889,
            0.7340181984793201
          ],
          [
            0.6318961364882333,
            0.725877914632433
          ],
          [
            0.648769440821239,
            0.7127798154293615
          ],
          [
            0.6590441309979984,
            0.6946227655550826
          ],
          [
            0.6655384295753071,
            0.670744899754849
          ],
          [
            0.6744142615369388,
            0.6495547173656672
          ],
          [
            0.5918550415230649,
            0.6011972058121766
          ],
          [
            0.5938193229692323,
            0.5862355187674549
          ],
          [
            0.594962138948696,
            0.5913096645645528
          ],
          [
            0.5990556537040642,
            0.5891506738751848
          ],
          [
            0.6009769075683186,
            0.585469662904421
          ],
          [
            0.6114476554095745,
            0.5825675883503241
          ],
          [
            0.6176321246794292,
            0.5800437035961686
          ],
          [
            0.6204462626150675,
            0.581069904271369
          ],
          [
            0.6265898026525974,
            0.5811493476337998
          ],
          [
            0.6336494601198605,
            0.5940754092105718
          ],
          [
            0.6006675307239805,
            0.598818018216794
          ],
          [
            0.5948514660554273,
            0.61018268956998
          ],
          [
            0.5879872913339308,
            0.6175165227322139
          ],
          [
            0.5830942285912377,
            0.6246691978821289
          ],
          [
            0.586229565526758,
            0.6524451679795066
          ],
          [
            0.5872639294181552,
            0.6529290781161178
          ],
          [
            0.5890522462981088,
            0.6529446042905026
          ],
          [
            0.5932607385729041,
            0.6502369834838786
          ],
          [
            0.598621587987457,
            0.6518925983851679
          ],
          [
            0.5927966172673872,
            0.6113406144410809
          ],
          [
            0.5938211826341493,
            0.6101260223439603
          ],
          [
            0.597416022845677,
            0.6076015954978953
          ],
          [
            0.5974240094423294,
            0.6097841899449103
          ],
          [
            0.5962435373238155,
            0.608398967177591
          ],
          [
            0.5933970794081688,
            0.6106177948823123
          ],
          [
            0.6131839929946832,
            0.6119312628884819
          ],
          [
            0.6139005202267851,
            0.6030438439709163
          ],
          [
            0.6209809619401183,
            0.6067881596900115
          ],
          [
            0.6242766991257668,
            0.6088401058487326
          ],
          [
            0.6205135550882135,
            0.6085884427833304
          ],
          [
            0.6142397264284747,
            0.6082910784732833
          ],
          [
            0.5820448524717774,
            0.6764126486071599
          ],
          [
            0.5829579251153129,
            0.6775839312850076
          ],
          [
            0.5842491365436997,
            0.668864080839068
          ],
          [
            0.5852436400949955,
            0.666023386813929
          ],
          [
            0.5869588094630411,
            0.6652926138150836
          ],
          [
            0.5954163766333035,
            0.6696003989001936
          ],
          [
            0.6016349964908192,
            0.6816157377928058
          ],
          [
            0.5958564447505134,
            0.6823022165031076
          ],
          [
            0.5910289704799652,
            0.6860953039416325
          ],
          [
            0.5850812743284872,
            0.6874392780665561
          ],
          [
            0.5844586497970989,
            0.6851655707976846
          ],
          [
            0.5844431000096457,
            0.6790788635233534
          ],
          [
            0.5830411056854895,
            0.6792450498675153
          ],
          [
            0.5843610547482967,
            0.6763395862044576
          ],
          [
            0.5858189760042088,
            0.6763171411165408
          ],
          [
            0.5945940851100853,
            0.673590096039511
          ],
          [
            0.6019105880388191,
            0.6802530097706774
          ],
          [
            0.5937063275703361,
            0.680461553769691
          ],
          [
            0.5864593441465071,
            0.6812808822407742
          ],
          [
            0.5838068476212877,
            0.6769728488692931
          ]
        ],
        "visibility": [
          0.9999971389770508,
          0.9999998807907104,
          0.9999406337738037,
          0.0014214172260835767,
          0.9999996423721313,
          0.9998438358306885,
          6.062838009412985e-10,
          3.182988734806713e-07,
          0.14384734630584717,
          6.962203315197257e-06,
          0.9990001320838928,
          0.0018336749635636806,
          5.131715941075754e-09,
          0.07065299153327942,
          1.0708569447848149e-10,
          0.005450646858662367,
          0.016299143433570862,
          0.00024359884264413267,
          2.1777043002657592e-05,
          1.0267977874206524e-12,
          1.6796298950794153e-05,
          8.71196795260154e-11,
          0.9780381917953491,
          7.342018059329231e-16,
          9.367189132919538e-15,
          4.775576809001869e-11,
          9.93033722807013e-07,
          8.1691114246496e-06,
          5.515504497566326e-08
        ],
        "headpose": {
          "pitch": 39.20140970351921,
          "yaw": 58.490768919700244,
          "roll": 38.19222193289315
        },
        "attributes": {
          "5 oClock Shadow": 0.0010905737290158868,
          "Arched Eyebrows": 0.001563261728733778,
          "Attractive": 0.2302575558423996,
          "Bags Under Eyes": 0.003364181611686945,
          "Bald": 2.556332390213356e-08,
          "Bangs": 0.5007513761520386,
          "Big Lips": 0.04205621778964996,
          "Big Nose": 0.0012918519787490368,
          "Black Hair": 0.0027006431482732296,
          "Blond Hair": 0.055537428706884384,
          "Blurry": 0.08562703430652618,
          "Brown Hair": 0.44050824642181396,
          "Bushy Eyebrows": 0.0018106548814103007,
          "Chubby": 0.00044294263352639973,
          "Double Chin": 4.9364283768227324e-05,
          "Eyeglasses": 0.000640926300548017,
          "Goatee": 5.295768642099574e-05,
          "Gray Hair": 0.0012706503039225936,
          "Heavy Makeup": 0.010625668801367283,
          "High Cheekbones": 0.015111100859940052,
          "Male": 0.4444902241230011,
          "Mouth Slightly Open": 0.07576825469732285,
          "Mustache": 8.417724529863335e-06,
          "Narrow Eyes": 0.12509047985076904,
          "No Beard": 0.9979598522186279,
          "Oval Face": 0.08957576006650925,
          "Pale Skin": 0.11024142801761627,
          "Pointy Nose": 0.18904271721839905,
          "Receding Hairline": 1.907046498672571e-05,
          "Rosy Cheeks": 6.70437584631145e-05,
          "Sideburns": 3.593925430322997e-05,
          "Smiling": 0.021584415808320045,
          "Straight Hair": 0.05750954896211624,
          "Wavy Hair": 0.43290963768959045,
          "Wearing Earrings": 0.11384301632642746,
          "Wearing Hat": 0.0008642210741527379,
          "Wearing Lipstick": 0.015440571121871471,
          "Wearing Necklace": 0.025237616151571274,
          "Wearing Necktie": 0.0014105888549238443,
          "Young": 0.9220901131629944
        },
        "age": [
          0.9216180443763733,
          0.9846429824829102,
          0.5146937966346741,
          0.043372586369514465,
          0.053766652941703796,
          0.00033266484388150275,
          8.881265239324421e-05,
          1.1830672974610934e-06
        ],
        "race": [
          0.9985332489013672,
          4.99016787216533e-05,
          0.7325725555419922,
          0.18729601800441742,
          0.29054394364356995
        ],
        "gender": [
          0.21096527576446533,
          0.8040143847465515
        ]
      },
      "deepface_detailing": {
        "emotion": {
          "angry": 0.051806174451485276,
          "disgust": 5.799550564181827e-12,
          "fear": 0.04398823366500437,
          "happy": 4.569293077585912e-11,
          "sad": 99.64602589607239,
          "surprise": 1.2171612459241365e-10,
          "neutral": 0.2581800566986203
        },
        "dominant_emotion": "sad",
        "region": {
          "x": 0,
          "y": 0,
          "w": 77,
          "h": 103,
          "left_eye": null,
          "right_eye": null
        },
        "face_confidence": 0.0,
        "age": 29,
        "gender": {
          "Woman": 95.26278972625732,
          "Man": 4.737204313278198
        },
        "dominant_gender": "Woman",
        "race": {
          "asian": 4.187328368425369,
          "indian": 0.4826047923415899,
          "black": 0.1317038433626294,
          "white": 78.01759839057922,
          "middle eastern": 9.255483746528625,
          "latino hispanic": 7.925283908843994
        },
        "dominant_race": "white"
      },
      "hoi": [
        {
          "relationship": {
            "action": [
              [
                "mouth",
                "kiss"
              ],
              [
                "mouth",
                "pet"
              ]
            ],
            "negative_action": [
              "feed",
              "groom",
              "hold",
              "hug",
              "jump",
              "load",
              "hop on",
              "race",
              "ride",
              "run",
              "straddle",
              "train",
              "walk",
              "wash",
              "no interaction"
            ],
            "position": "mouth"
          },
          "object": 0
        }
      ]
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.5802348256111145,
        0.5490980744361877,
        0.8085366487503052,
        0.992128312587738
      ]
    ],
    "face_boxes": [
      [
        0.5825300812721252,
        0.5674910545349121,
        0.6638357639312744,
        0.7294736504554749
      ]
    ],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.7828938666110238,
            0.8635632464447497
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.6791337261286875,
            0.8686622485657719
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.6153188040480018,
            0.9451472803811046
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.6065503414720297,
            0.6311944355010244
          ],
          [
            0.6177544880968828,
            0.6377502953709101
          ],
          [
            0.6659810322647294,
            0.6996667496976081
          ],
          [
            0.663058211406072,
            0.6982098919487445
          ]
        ],
        "dw_hand_1": [
          [
            0.6153188040480018,
            0.926936558520311
          ],
          [
            0.6226258561946452,
            0.918923840901562
          ],
          [
            0.6323685923901696,
            0.9007131190407685
          ],
          [
            0.635291413248827,
            0.8977994035430416
          ],
          [
            0.6348042764390509,
            0.8956141169197464
          ],
          [
            0.6240872666239738,
            0.8977994035430416
          ],
          [
            0.6323685923901696,
            0.8380682358396387
          ],
          [
            0.635291413248827,
            0.8293270893464578
          ],
          [
            0.6367528236781557,
            0.8293270893464578
          ],
          [
            0.6206773089555402,
            0.9167385542782668
          ],
          [
            0.6294457715315123,
            0.8329692337186165
          ],
          [
            0.6328557291999459,
            0.8329692337186165
          ],
          [
            0.6338300028194983,
            0.8322408048441848
          ],
          [
            0.6182416249066591,
            0.9254797007714477
          ],
          [
            0.6265229506728549,
            0.8409819513373658
          ],
          [
            0.6299329083412886,
            0.8395250935885022
          ],
          [
            0.6318814555803935,
            0.8380682358396387
          ],
          [
            0.6167802144773304,
            0.9349492761390604
          ],
          [
            0.6226258561946452,
            0.8621063886958862
          ],
          [
            0.6294457715315123,
            0.8606495309470228
          ],
          [
            0.6274972242924075,
            0.8489946689561149
          ]
        ],
        "dw_hand_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_face": [
          [
            0.607037478281806,
            0.6282807200032974
          ],
          [
            0.6021661101840436,
            0.6399355819942053
          ],
          [
            0.5968076052765052,
            0.6530473017339765
          ],
          [
            0.5919362371787429,
            0.6661590214737478
          ],
          [
            0.5875520058907568,
            0.6792707412135192
          ],
          [
            0.5856034586516519,
            0.6938393187021541
          ],
          [
            0.5831677746027708,
            0.7084078961907889
          ],
          [
            0.5865777322712045,
            0.7200627581816967
          ],
          [
            0.5958333316569526,
            0.7266186180515825
          ],
          [
            0.6060632046622534,
            0.7288039046748777
          ],
          [
            0.6167802144773304,
            0.7295323335493092
          ],
          [
            0.6270100874826312,
            0.7266186180515825
          ],
          [
            0.6362656868683796,
            0.7222480448049919
          ],
          [
            0.6440598758247991,
            0.7120500405629475
          ],
          [
            0.6508797911616664,
            0.7003951785720397
          ],
          [
            0.656725432878981,
            0.6880118877067001
          ],
          [
            0.6625710745962957,
            0.6756285968413607
          ],
          [
            0.6104474359502394,
            0.6180827157612531
          ],
          [
            0.6104474359502394,
            0.6180827157612531
          ],
          [
            0.6104474359502394,
            0.6188111446356848
          ],
          [
            0.6104474359502394,
            0.6188111446356848
          ],
          [
            0.6109345727600157,
            0.6188111446356848
          ],
          [
            0.6143445304284494,
            0.6180827157612531
          ],
          [
            0.6187287617164354,
            0.6195395735101165
          ],
          [
            0.6221387193848689,
            0.6217248601334118
          ],
          [
            0.6250615402435262,
            0.6253670045055704
          ],
          [
            0.6279843611021836,
            0.6304660066265926
          ],
          [
            0.6075246150915821,
            0.6304660066265926
          ],
          [
            0.6011918365644913,
            0.6362934376220465
          ],
          [
            0.5948590580374002,
            0.6406640108686371
          ],
          [
            0.5885262795103092,
            0.6457630129896592
          ],
          [
            0.5875520058907568,
            0.6530473017339765
          ],
          [
            0.5899876899396379,
            0.6581463038549988
          ],
          [
            0.5933976476080716,
            0.6617884482271574
          ],
          [
            0.5963204684667289,
            0.6639737348504526
          ],
          [
            0.5992432893253863,
            0.6639737348504526
          ],
          [
            0.6065503414720297,
            0.6304660066265926
          ],
          [
            0.607037478281806,
            0.6311944355010244
          ],
          [
            0.607037478281806,
            0.6311944355010244
          ],
          [
            0.607037478281806,
            0.6304660066265926
          ],
          [
            0.6065503414720297,
            0.6311944355010244
          ],
          [
            0.6065503414720297,
            0.6311944355010244
          ],
          [
            0.6143445304284494,
            0.6362934376220465
          ],
          [
            0.6172673512871067,
            0.6355650087476149
          ],
          [
            0.6197030353359878,
            0.6377502953709101
          ],
          [
            0.6226258561946452,
            0.6413924397430687
          ],
          [
            0.6192158985262115,
            0.6413924397430687
          ],
          [
            0.6158059408577781,
            0.6406640108686371
          ],
          [
            0.5885262795103092,
            0.6799991700879511
          ],
          [
            0.5880391427005331,
            0.6763570257157923
          ],
          [
            0.5890134163200855,
            0.6727148813436336
          ],
          [
            0.5890134163200855,
            0.6727148813436336
          ],
          [
            0.5904748267494142,
            0.6727148813436336
          ],
          [
            0.594371921227624,
            0.6778138834646559
          ],
          [
            0.5982690157058339,
            0.6850981722089732
          ],
          [
            0.594371921227624,
            0.6858266010834049
          ],
          [
            0.5904748267494142,
            0.6865550299578368
          ],
          [
            0.5865777322712045,
            0.6865550299578368
          ],
          [
            0.5865777322712045,
            0.6843697433345415
          ],
          [
            0.5880391427005331,
            0.6821844567112463
          ],
          [
            0.5885262795103092,
            0.6799991700879511
          ],
          [
            0.5890134163200855,
            0.6799991700879511
          ],
          [
            0.5895005531298618,
            0.6785423123390875
          ],
          [
            0.5933976476080716,
            0.6807275989623828
          ],
          [
            0.5972947420862813,
            0.6843697433345415
          ],
          [
            0.5933976476080716,
            0.6821844567112463
          ],
          [
            0.5895005531298618,
            0.6799991700879511
          ],
          [
            0.5895005531298618,
            0.6799991700879511
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "objects": [
    {
      "name": "horse",
      "possible_names": [
        "horse"
      ],
      "box": [
        0.003125,
        0.21962616822429906,
        0.5828125,
        0.9883177570093458
      ]
    }
  ],
  "scene": "A serene outdoor setting features two brown horses with bridles interacting closely amidst greenery and a wire fence under an overcast sky",
  "overall_past": "Before the current scene, the individual likely spent time gradually building trust with the two horses, perhaps by spending quiet moments near them, offering gentle gestures or treats, and allowing the animals to become accustomed to their presence. The calm, overcast sky and serene setting suggest a slow, deliberate approach, possibly over several visits or a longer period, fostering a sense of safety and familiarity. This prior interaction would explain the horses’ relaxed posture and the affectionate nuzzle, indicating that the bond had developed through consistent, patient, and respectful engagement.",
  "overall_past_clean": "The individual approached the horses with steady, unhurried movements, maintaining a low, soothing presence that invited curiosity without intrusion, gradually earning their trust through repeated, consistent displays of calm and non-threatening behavior over multiple encounters.",
  "past_scene_ok": true,
  "overall_future": "The horse continues to nuzzle gently against the person’s shoulder, as if seeking reassurance or affection, and the person softly strokes its neck in response, their quiet laughter blending with the soft rustle of leaves in the breeze. The moment deepens into a shared stillness, as both animal and human seem to exist in a peaceful harmony, the overcast sky gradually parting to allow a single beam of sunlight to break through and illuminate the wire fence and the greenery around them—suggesting a quiet, hopeful continuation of connection and calm.",
  "overall_future_clean": "The horse lifts its head slightly, nostrils flaring as the sunlight warms its coat, and with a slow, deliberate step, it turns toward the open path ahead, the person following closely, their presence a quiet promise of movement forward into the light.",
  "future_scene_ok": true
}