{
  "video_path": "./ref_datasets/part2/6613678001.mp4",
  "start_time": 0.0,
  "end_time": 1.2,
  "image_path": "./021010.jpg",
  "represents_multiple_types": false,
  "cross_video_duplicate": false,
  "original_detections": [
    {
      "video_path": "./ref_datasets/part2/6613678001.mp4",
      "start_time": 0.0,
      "end_time": 1.2,
      "image_path": "./ref_datasets/extracted_frames/person_5538306784096213114_1_6613678001.mp4_0.00_1.20.jpg",
      "type": "person"
    }
  ],
  "types": [
    "person"
  ],
  "persons": [
    {
      "body_box": 0,
      "skeleton": 0,
      "face_box": null,
      "qwen_detailing": {
        "background": false,
        "age": "adult",
        "gender": "unknown",
        "emotion": "neutral",
        "clothing_description": "The person is dressed in a casual outfit consisting of a light beige sweater with ribbed cuffs and a pair of white pants. The sweater appears comfortable and suitable for a relaxed setting. There are no visible accessories or footwear in the image.",
        "clothing": [
          {
            "possible_names": [
              "sweater",
              "jumper",
              "pullover"
            ],
            "name": "sweater",
            "type": "top",
            "color": [
              "light beige"
            ]
          },
          {
            "possible_names": [
              "pants",
              "trousers"
            ],
            "name": "pants",
            "type": "bottom",
            "color": [
              "white"
            ]
          }
        ],
        "objects": [
          {
            "standalone": false,
            "possible_names": [
              "smartphone",
              "mobile phone"
            ],
            "name": "smartphone",
            "position": "hand"
          },
          {
            "standalone": false,
            "possible_names": [
              "credit card",
              "bank card"
            ],
            "name": "credit card",
            "position": "hand"
          }
        ],
        "description": "An adult is seated in a relaxed position with their feet up on a desk, suggesting a casual or leisurely moment. They are holding a smartphone in one hand, which displays an image of food, possibly indicating they are browsing recipes or a menu. In their other hand, they hold a credit card, which might imply they are considering making an online purchase. Their attire consists of a light beige sweater and white pants, both of which contribute to the overall laid-back atmosphere. The setting includes a wooden desk with a laptop and notebook, against a backdrop of a white brick wall.",
        "blurry": false,
        "face_seen": false,
        "emotion_description": "The person appears to be relaxed and focused on their phone, suggesting a neutral emotional state.",
        "meaningful": true,
        "story": "The person is sitting comfortably in a chair with their feet up on a desk, holding a smartphone displaying food options and a credit card. They seem to be browsing or ordering food online, indicating a casual and leisurely moment.",
        "race": "unknown",
        "text": "no_text",
        "text_relationship": "no_text",
        "behaviour": "The person is seated comfortably in a wicker chair with their feet propped up on a wooden desk, suggesting a relaxed and casual posture. They are holding a smartphone in one hand, displaying an image of food, which indicates they might be browsing recipes or meal options online. The other hand rests on their leg with a credit card, possibly preparing to make an online purchase or payment related to the food they are viewing. The overall setting, with a laptop and notebook on the desk, implies a home office environment where the individual is taking a break from work to engage in leisurely activities such as online shopping or planning meals.",
        "intention": "The individual is taking a break from work to browse and potentially purchase food online using a smartphone and credit card while relaxing in a home office setting",
        "intention_ok": true
      },
      "hoi": [
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "left hand",
            "action": [
              [
                "left hand",
                "holding"
              ],
              [
                "left hand",
                "looking at"
              ]
            ]
          },
          "object": 0
        },
        {
          "relevant": true,
          "relationship": {
            "standalone": false,
            "position": "right hand",
            "action": [
              [
                "right hand",
                "holding"
              ]
            ]
          },
          "object": 1
        }
      ]
    }
  ],
  "detect_results": {
    "body_boxes": [
      [
        0.0006594267324544489,
        0.19292230904102325,
        0.9033316373825073,
        0.9948762655258179
      ]
    ],
    "face_boxes": [],
    "skeletons": [
      {
        "dw_body": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.23303453756821113,
            0.8025776299834252
          ],
          [
            0.6673372257434601,
            0.8792513820528984
          ],
          [
            0.7014447666996314,
            0.6683985638618469
          ],
          [
            0.02611545576743808,
            0.6952343770861625
          ],
          [
            0.00792476725748001,
            0.6198385208845139
          ],
          [
            0.1852839802295712,
            0.4792699754238129
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.7355523076558028,
            0.43837730765342714
          ],
          [
            0.7582906682932504,
            0.33870142996311187
          ],
          [
            -1.0,
            -1.0
          ],
          [
            0.3785600456478757,
            0.46010153740644455
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_hand_1": [
          [
            0.21484384905825307,
            0.4754362878203392
          ],
          [
            0.21711768512199783,
            0.4422109952569008
          ],
          [
            0.22166535724948733,
            0.40898570269346235
          ],
          [
            0.2466775539506797,
            0.38981726467609407
          ],
          [
            0.27623742277936153,
            0.37831620186567305
          ],
          [
            0.262594406396893,
            0.3962067440152168
          ],
          [
            0.2853327670343406,
            0.38214988946914674
          ],
          [
            0.32171414405425675,
            0.37831620186567305
          ],
          [
            0.35354784894668334,
            0.375760410130024
          ],
          [
            0.2853327670343406,
            0.40770780682563784
          ],
          [
            0.31489263586302246,
            0.3936509522795677
          ],
          [
            0.35354784894668334,
            0.3885393688082695
          ],
          [
            0.38083388171162047,
            0.3885393688082695
          ],
          [
            0.3012496194805539,
            0.42048676550388336
          ],
          [
            0.328535652245491,
            0.4102635985612869
          ],
          [
            0.35354784894668334,
            0.40770780682563784
          ],
          [
            0.37628620958413095,
            0.40770780682563784
          ],
          [
            0.31034496373553294,
            0.4370994117856026
          ],
          [
            0.33080948830923573,
            0.42943203657865525
          ],
          [
            0.34672634075544906,
            0.4268762448430061
          ],
          [
            0.3603693571379176,
            0.42943203657865525
          ]
        ],
        "dw_hand_2": [
          [
            0.6923494224446524,
            0.670954355597496
          ],
          [
            0.6468727011697573,
            0.6428406465053559
          ],
          [
            0.5991221438311173,
            0.6121711456775665
          ],
          [
            0.592300635639883,
            0.5840574365854263
          ],
          [
            0.5877529635123935,
            0.564888998568058
          ],
          [
            0.6741587339346944,
            0.5815016448497772
          ],
          [
            0.6878017503171628,
            0.5508321440219879
          ],
          [
            0.6946232585083971,
            0.5316637060046197
          ],
          [
            0.6991709306358866,
            0.5150510597229004
          ],
          [
            0.7173616191458447,
            0.5866132283210754
          ],
          [
            0.7378261437195476,
            0.5572216233611107
          ],
          [
            0.7491953240382714,
            0.5354973936080932
          ],
          [
            0.7560168322295057,
            0.5214405390620231
          ],
          [
            0.7514691601020161,
            0.5981142911314964
          ],
          [
            0.7742075207394638,
            0.5751121655106545
          ],
          [
            0.7855767010581876,
            0.5572216233611107
          ],
          [
            0.7901243731856771,
            0.541886872947216
          ],
          [
            0.7787551928669533,
            0.613449041545391
          ],
          [
            0.7969458813769114,
            0.599392186999321
          ],
          [
            0.8060412256318904,
            0.5878911241889
          ],
          [
            0.8105888977593798,
            0.576390061378479
          ]
        ],
        "dw_face": [
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_1": [
          [
            -1.0,
            -1.0
          ],
          [
            0.846970274779296,
            0.39492884814739226
          ],
          [
            -1.0,
            -1.0
          ]
        ],
        "dw_foot_2": [
          [
            0.846970274779296,
            0.2096339473128319
          ],
          [
            0.8401487665880617,
            0.22752448946237563
          ],
          [
            -1.0,
            -1.0
          ]
        ]
      }
    ]
  },
  "new_filename": "021010",
  "objects": [
    {
      "box": [
        0.26333728432655334,
        0.29977354407310486,
        0.39852234721183777,
        0.44682595133781433
      ],
      "name": "smartphone",
      "possible_names": [
        "smartphone"
      ]
    },
    {
      "box": [
        0.627515435218811,
        0.5033835172653198,
        0.7355910539627075,
        0.5768107175827026
      ],
      "name": "credit card",
      "possible_names": [
        "credit card"
      ]
    }
  ],
  "mask_file": "./person_labeling/./021010.jpg_masks.pkl",
  "hoi_processed": true,
  "scene": "A cozy indoor setting with a white brick wall, wooden desk, and chair, featuring a laptop, notebook, smartphone, and credit card, all bathed in soft natural light, creating a minimalist and modern atmosphere",
  "overall_past": "Before the current scene, the individual likely finished a work session at their desk, closing the laptop or saving their progress, and then shifted into a more relaxed state by moving into the wicker chair. They may have been researching recipes or meal ideas for dinner, possibly after feeling hungry or inspired by a recent culinary show or social media post. The credit card resting on their leg suggests they had already decided on a dish or meal plan and were preparing to make a purchase—perhaps ordering ingredients online or booking a meal delivery—indicating a transition from focused work to leisurely decision-making.",
  "overall_past_clean": "After concluding a period of concentrated work, the individual closed their device, saved their progress, and deliberately transitioned into a more relaxed mindset by shifting their posture and focus toward leisurely planning, having already made a decision to act on a culinary idea by preparing to make a purchase.",
  "past_scene_ok": true,
  "overall_future": "After the current scene, the individual is likely to proceed with placing an online order for the meal they are viewing on their smartphone. The combination of the credit card resting on their leg, the focused gaze on the food image, and the presence of a laptop and notebook—suggesting a functional home workspace—indicates a seamless transition from browsing to purchasing. With the digital tools readily available and the relaxed posture signaling a moment of personal indulgence, it is plausible that they will complete the transaction, possibly adding the meal to a delivery app or e-commerce platform, and then set the phone down to continue their break or return to work.",
  "overall_future_clean": "The screen lights up with a confirmation message as the order is placed, followed by a soft chime signaling the transaction’s success, then the device is set down, momentarily still, before the user leans back, exhaling softly, already turning their attention to the next task.",
  "future_scene_ok": true
}