{
  "nbformat": 4,
  "nbformat_minor": 0,
  "metadata": {
    "colab": {
      "provenance": []
    },
    "kernelspec": {
      "name": "python3",
      "display_name": "Python 3"
    },
    "language_info": {
      "name": "python"
    },
    "widgets": {
      "application/vnd.jupyter.widget-state+json": {
        "6d69c7fe088c4cdabb7b6506dc7813da": {
          "model_module": "anywidget",
          "model_name": "AnyModel",
          "model_module_version": "~0.9.*",
          "state": {
            "_anywidget_id": "rerun_notebook.Viewer",
            "_css": "/* src/js/widget.css */\n.rerun_notebook canvas {\n  width: 100%;\n  height: 100%;\n  min-width: 200px;\n  min-height: 400px;\n  max-width: 960px;\n  max-height: 720px;\n}\n.rerun_notebook {\n  margin: 0;\n  padding: 0;\n  width: 100%;\n  height: 100%;\n  background: transparent !important;\n}\ndiv.cell-output-ipywidget-background {\n  margin: 0;\n  padding: 0;\n  background: transparent !important;\n}\n",
            "_dom_classes": [],
            "_esm": "https://app.rerun.io/version/0.23.2/widget.js",
            "_height": 600,
            "_model_module": "anywidget",
            "_model_module_version": "~0.9.*",
            "_model_name": "AnyModel",
            "_panel_states": {},
            "_recording_id": "",
            "_time_ctrl": null,
            "_url": null,
            "_view_count": null,
            "_view_module": "anywidget",
            "_view_module_version": "~0.9.*",
            "_view_name": "AnyView",
            "_width": 640,
            "layout": "IPY_MODEL_2e93afa71152452f9e0d6a13b043d1ec"
          }
        },
        "2e93afa71152452f9e0d6a13b043d1ec": {
          "model_module": "@jupyter-widgets/base",
          "model_name": "LayoutModel",
          "model_module_version": "1.2.0",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "5ed03eb0229346af9b6c8253c484a713": {
          "model_module": "@jupyter-widgets/base",
          "model_name": "LayoutModel",
          "model_module_version": "1.2.0",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        }
      }
    }
  },
  "cells": [
    {
      "cell_type": "markdown",
      "source": [
        "# 🔍 IndEgo Dataset Explorer\n",
        "\n",
        "Welcome to **IndEgo**, a multimodal dataset capturing real-world **industrial scenarios** from both **egocentric** (wearable smart glasses) and **exocentric** (external camera) perspectives.\n",
        "\n",
        "This Colab notebook helps you:\n",
        "- 🎥 Load and play example videos from [Hugging Face 🤗](https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo)\n",
        "- 🔎 Visualize sample frames from egocentric workflows (e.g., drilling, clamping, assembly)\n",
        "- 📊 Lay the foundation for mistake detection, VQA, task understanding, and more.\n",
        "\n",
        "> 🚀 This notebook is beginner-friendly and requires no setup. Ideal for researchers, engineers, and students exploring AI for industrial applications.\n",
        "\n",
        "---\n",
        "\n",
        "📁 **Dataset Access**  \n",
        "👉 [IndEgo_Demo on Hugging Face](https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo)\n",
        "\n",
        "---\n",
        "\n",
        "🔗 **Project Repository**  \n",
        "👉 [IndEgo on GitHub](https://github.com/Vivek9Chavan/IndEgo)\n",
        "\n",
        "---"
      ],
      "metadata": {
        "id": "R2OaGD6T-Tv7"
      }
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "GxH3XAfW-PjZ",
        "outputId": "0569a64c-1945-4da5-f61f-cebe780350c7",
        "cellView": "form"
      },
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Requirement already satisfied: datasets in /usr/local/lib/python3.11/dist-packages (2.14.4)\n",
            "Requirement already satisfied: opencv-python in /usr/local/lib/python3.11/dist-packages (4.11.0.86)\n",
            "Requirement already satisfied: matplotlib in /usr/local/lib/python3.11/dist-packages (3.10.0)\n",
            "Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.11/dist-packages (from datasets) (2.0.2)\n",
            "Requirement already satisfied: pyarrow>=8.0.0 in /usr/local/lib/python3.11/dist-packages (from datasets) (18.1.0)\n",
            "Requirement already satisfied: dill<0.3.8,>=0.3.0 in /usr/local/lib/python3.11/dist-packages (from datasets) (0.3.7)\n",
            "Requirement already satisfied: pandas in /usr/local/lib/python3.11/dist-packages (from datasets) (2.2.2)\n",
            "Requirement already satisfied: requests>=2.19.0 in /usr/local/lib/python3.11/dist-packages (from datasets) (2.32.3)\n",
            "Requirement already satisfied: tqdm>=4.62.1 in /usr/local/lib/python3.11/dist-packages (from datasets) (4.67.1)\n",
            "Requirement already satisfied: xxhash in /usr/local/lib/python3.11/dist-packages (from datasets) (3.5.0)\n",
            "Requirement already satisfied: multiprocess in /usr/local/lib/python3.11/dist-packages (from datasets) (0.70.15)\n",
            "Requirement already satisfied: fsspec>=2021.11.1 in /usr/local/lib/python3.11/dist-packages (from fsspec[http]>=2021.11.1->datasets) (2025.3.2)\n",
            "Requirement already satisfied: aiohttp in /usr/local/lib/python3.11/dist-packages (from datasets) (3.11.15)\n",
            "Requirement already satisfied: huggingface-hub<1.0.0,>=0.14.0 in /usr/local/lib/python3.11/dist-packages (from datasets) (0.31.2)\n",
            "Requirement already satisfied: packaging in /usr/local/lib/python3.11/dist-packages (from datasets) (24.2)\n",
            "Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.11/dist-packages (from datasets) (6.0.2)\n",
            "Requirement already satisfied: contourpy>=1.0.1 in /usr/local/lib/python3.11/dist-packages (from matplotlib) (1.3.2)\n",
            "Requirement already satisfied: cycler>=0.10 in /usr/local/lib/python3.11/dist-packages (from matplotlib) (0.12.1)\n",
            "Requirement already satisfied: fonttools>=4.22.0 in /usr/local/lib/python3.11/dist-packages (from matplotlib) (4.58.0)\n",
            "Requirement already satisfied: kiwisolver>=1.3.1 in /usr/local/lib/python3.11/dist-packages (from matplotlib) (1.4.8)\n",
            "Requirement already satisfied: pillow>=8 in /usr/local/lib/python3.11/dist-packages (from matplotlib) (11.2.1)\n",
            "Requirement already satisfied: pyparsing>=2.3.1 in /usr/local/lib/python3.11/dist-packages (from matplotlib) (3.2.3)\n",
            "Requirement already satisfied: python-dateutil>=2.7 in /usr/local/lib/python3.11/dist-packages (from matplotlib) (2.9.0.post0)\n",
            "Requirement already satisfied: aiohappyeyeballs>=2.3.0 in /usr/local/lib/python3.11/dist-packages (from aiohttp->datasets) (2.6.1)\n",
            "Requirement already satisfied: aiosignal>=1.1.2 in /usr/local/lib/python3.11/dist-packages (from aiohttp->datasets) (1.3.2)\n",
            "Requirement already satisfied: attrs>=17.3.0 in /usr/local/lib/python3.11/dist-packages (from aiohttp->datasets) (25.3.0)\n",
            "Requirement already satisfied: frozenlist>=1.1.1 in /usr/local/lib/python3.11/dist-packages (from aiohttp->datasets) (1.6.0)\n",
            "Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.11/dist-packages (from aiohttp->datasets) (6.4.3)\n",
            "Requirement already satisfied: propcache>=0.2.0 in /usr/local/lib/python3.11/dist-packages (from aiohttp->datasets) (0.3.1)\n",
            "Requirement already satisfied: yarl<2.0,>=1.17.0 in /usr/local/lib/python3.11/dist-packages (from aiohttp->datasets) (1.20.0)\n",
            "Requirement already satisfied: filelock in /usr/local/lib/python3.11/dist-packages (from huggingface-hub<1.0.0,>=0.14.0->datasets) (3.18.0)\n",
            "Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.11/dist-packages (from huggingface-hub<1.0.0,>=0.14.0->datasets) (4.13.2)\n",
            "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.11/dist-packages (from python-dateutil>=2.7->matplotlib) (1.17.0)\n",
            "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.11/dist-packages (from requests>=2.19.0->datasets) (3.4.2)\n",
            "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.11/dist-packages (from requests>=2.19.0->datasets) (3.10)\n",
            "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.11/dist-packages (from requests>=2.19.0->datasets) (2.4.0)\n",
            "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.11/dist-packages (from requests>=2.19.0->datasets) (2025.4.26)\n",
            "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.11/dist-packages (from pandas->datasets) (2025.2)\n",
            "Requirement already satisfied: tzdata>=2022.7 in /usr/local/lib/python3.11/dist-packages (from pandas->datasets) (2025.2)\n"
          ]
        }
      ],
      "source": [
        "# @title\n",
        "!pip install datasets opencv-python matplotlib\n",
        "\n",
        "from datasets import load_dataset\n",
        "from IPython.display import Video, display\n",
        "import matplotlib.pyplot as plt\n",
        "import cv2\n",
        "import os\n",
        "import requests"
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "## 📂 Dataset Structure Overview\n",
        "\n",
        "In this section, we query the [IndEgo_Demo](https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo) dataset directly from Hugging Face and display its **hierarchical folder layout**.\n",
        "\n",
        "This gives a quick overview of how the dataset is organized — including major categories like `Assembly`, `Inspection_Repair`, `Woodworking`, and more — without needing to download the dataset.\n",
        "\n",
        "> The tree-like structure helps you navigate categories and subfolders that contain egocentric and exocentric videos, annotations, SLAM, gaze, and more."
      ],
      "metadata": {
        "id": "loCTPQYAaUHx"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "# @title\n",
        "## Display Dataset Structure\n",
        "\n",
        "!pip install -q huggingface_hub\n",
        "\n",
        "from huggingface_hub import list_repo_files\n",
        "\n",
        "repo_id = \"vivek9chavan/IndEgo_Demo\"\n",
        "files = list_repo_files(repo_id, repo_type=\"dataset\")\n",
        "\n",
        "# Collect folder structure only (no files)\n",
        "folders = set()\n",
        "for f in files:\n",
        "    parts = f.split('/')\n",
        "    for i in range(1, len(parts)):  # skip top level files\n",
        "        folders.add('/'.join(parts[:i]))\n",
        "\n",
        "# Format as tree-like output\n",
        "print(f\"📁 Folder structure of {repo_id}:\\n\")\n",
        "for folder in sorted(folders):\n",
        "    depth = folder.count('/')\n",
        "    indent = '│   ' * depth + '├── '\n",
        "    print(f\"{indent}{folder.split('/')[-1]}/\")"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "1eqsagxD-TXU",
        "outputId": "78282718-5c36-426b-ce04-18de0ec6c52d",
        "cellView": "form"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/usr/local/lib/python3.11/dist-packages/huggingface_hub/utils/_auth.py:94: UserWarning: \n",
            "The secret `HF_TOKEN` does not exist in your Colab secrets.\n",
            "To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.\n",
            "You will be able to reuse this secret in all of your notebooks.\n",
            "Please note that authentication is recommended but still optional to access public models or datasets.\n",
            "  warnings.warn(\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "📁 Folder structure of vivek9chavan/IndEgo_Demo:\n",
            "\n",
            "├── 1_Assembly/\n",
            "│   ├── 01_ECU/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 02_IKEA_Lamp/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 03_Mechanical_Desk/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 04_IKEA_Desk/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 05_Trolley_Prototype/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 06_Workstation_Computer/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 07_Inspection_Assembly/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 08_Camera_Mount_Subassembly/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 09_ITEM_Prototype/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 10_Circular_Desk/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "├── 1_Disassembly/\n",
            "│   ├── 01_ECU/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 02_IKEA_Lamp/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 03_Mechanical_Desk/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 04_IKEA_Desk/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 05_Trolley_Prototype/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 06_Workstation_Computer/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 07_Inspection_Assembly/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 08_Camera_Mount_Subassembly/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 09_ITEM_Prototype/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 10_Circular_Desk/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "├── 2_Inspection_Repair/\n",
            "│   ├── annotations/\n",
            "│   ├── mp4/\n",
            "│   ├── mp4_480/\n",
            "│   ├── mp4_exo/\n",
            "│   ├── mps/\n",
            "│   ├── vrs/\n",
            "├── 3_Logistics_Organization/\n",
            "│   ├── annotations/\n",
            "│   ├── mp4_480/\n",
            "│   ├── mps/\n",
            "│   ├── vrs/\n",
            "├── 4_Woodworking/\n",
            "│   ├── annotations/\n",
            "│   ├── mp4_480/\n",
            "├── 5_Miscellaneous/\n",
            "├── 6_Tools_Objects_in_Context/\n",
            "├── 7_Tools_Objects_demo/\n",
            "├── 8_Singular_Actions/\n",
            "│   ├── 10_Sealing_a_cardboard_box_with_tape/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_14_Short_10_vrs/\n",
            "│   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── slam/\n",
            "│   │   │   ├── mps_User_15_Short_10_vrs/\n",
            "│   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── slam/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 11_Loading_a_trolley__yellow_one__with_different_objects/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_14_412_Short_11_vrs/\n",
            "│   │   │   ├── mps_User_14_Short_11_vrs/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 11_Loading_a_trolley_yellow_one_with_different_objects/\n",
            "│   ├── 12_Pushing_a_trolley_from_one_side_to_the_other/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_14_Short_12_vrs/\n",
            "│   │   │   ├── mps_User_15_Short_12_vrs/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 13_Unloading_a_trolley/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_15_Short_13_vrs/\n",
            "│   │   │   ├── mps_User_16_Short_13_vrs/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 14_Carrying_461_toolbox_from_one_floor_to_the_other/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_14_Short_14_vrs/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 15_Sorting_tools_of_461_toolbox/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_14_Short_15_vrs/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 16_Plugging_in_a_cable__of_drill_machine/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_11_Short_16_vrs/\n",
            "│   │   │   ├── mps_User_14_Short_16_vrs/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 16_Plugging_in_a_cable_of_drill_machine/\n",
            "│   ├── 17_Unplugging_a_cable__of_drill_machine/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_11_Short_17_vrs/\n",
            "│   │   │   ├── mps_User_14_Short_17_vrs/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 17_Unplugging_a_cable_of_drill_machine/\n",
            "│   ├── 18_Putting_on_working_gloves/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_14_Short_18_vrs/\n",
            "│   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── slam/\n",
            "│   │   │   ├── mps_User_15_Short_18_vrs/\n",
            "│   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── slam/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 19_Sawing_Wood/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_11_Short_19_vrs/\n",
            "│   │   │   ├── mps_User_14_Short_19_vrs/\n",
            "│   │   │   │   ├── hand_tracking/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 1_Screwing_screw_with_allen_wrench/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_15_Short_1_vrs/\n",
            "│   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── slam/\n",
            "│   │   │   ├── mps_User_16_Short_1_vrs/\n",
            "│   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── slam/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 20_Inspecting_wooden_block_from_all_sides/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_11_Short_20_vrs/\n",
            "│   │   │   ├── mps_User_14_Short_20_vrs/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 21_Open_a_drawer_and_search_for_a_tool/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_11_Short_21_vrs/\n",
            "│   │   │   ├── mps_User_14_Short_21_vrs/\n",
            "│   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── slam/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 22_Carrying_toolbox_from_one_room_to_another/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_14_Short_22_vrs/\n",
            "│   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── slam/\n",
            "│   │   │   ├── mps_User_15_Short_22_vrs/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 23_Closing_Door/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_14_Short_23_vrs/\n",
            "│   │   │   ├── mps_User_15_Short_23_vrs/\n",
            "│   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── slam/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 24_Shaking__opening_and_using_an_oil_can/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_14_410_Short_24_vrs/\n",
            "│   │   │   ├── mps_User_14_412_Short_24_vrs/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 24_Shaking_opening_and_using_an_oil_can/\n",
            "│   ├── 25_Opening_a_toolbox/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_11_Short_25_vrs/\n",
            "│   │   │   ├── mps_User_14_Short_25_vrs/\n",
            "│   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── slam/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 26_Rasping_a_wooden_block/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_11_Short_26_vrs/\n",
            "│   │   │   ├── mps_User_14_Short_26_vrs/\n",
            "│   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── slam/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 27_Opening_a_manual_and_skim_through_the_pages/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_11_Short_27_vrs/\n",
            "│   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── slam/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 28_Adjusting_and_stepping_on_a_ladder/\n",
            "│   ├── 29_Stepping_down_from_a_ladder/\n",
            "│   ├── 2_Unscrewing_with_allen_wrench/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_15_Short_2_vrs/\n",
            "│   │   │   ├── mps_User_16_Short_2_vrs/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 30_Binding_steel_rods/\n",
            "│   ├── 31_Taking_pieces_from_a_workstation_and_placing_them_in_box/\n",
            "│   ├── 32_Lifting_up_with_trolley/\n",
            "│   ├── 33_Setting_up_a_camera_onto_a_tripod/\n",
            "│   ├── 34_Weighing_an_object/\n",
            "│   ├── 35_Scratching_a_metal_plate/\n",
            "│   ├── 36_Adjusting_height_of_a_table_higher/\n",
            "│   ├── 37_Adjusting_height_of_a_table_lower/\n",
            "│   ├── 38_Release_trolley_brake/\n",
            "│   ├── 39_Adjust_rollstoppers_of_rolling_assembly/\n",
            "│   ├── 3_Clamping_a_wooden_block_on_a_table_with_a_clamp/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_14_Short_3_vrs/\n",
            "│   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── slam/\n",
            "│   │   │   ├── mps_User_17_Short_3_vrs/\n",
            "│   │   │   │   ├── slam/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 40_Rolling_the_assembly_around_the_room/\n",
            "│   ├── 41_Marking_drilling_hole_with_hammer_and_hole_puncher/\n",
            "│   ├── 42_Taking_box_out_of_a_shelf/\n",
            "│   ├── 43_Using_hammer_to_put_in_a_nail/\n",
            "│   ├── 44_Pumping_a_bike_tire/\n",
            "│   ├── 45_Putting_on_safety_shoes/\n",
            "│   ├── 46_Taking_off_safety_shoes/\n",
            "│   ├── 47_Cutting_zip_ties_with_a_cutter_knife/\n",
            "│   ├── 48_Wrapping_a_box_or_something_else_with_transparent_foil/\n",
            "│   ├── 49_Closing_a_toolbox/\n",
            "│   ├── 4_Drilling_a_hole_into_a_wooden_block/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_16_Short_4_vrs/\n",
            "│   │   │   ├── mps_User_17_Short_4_vrs/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 50_Taking_out_small_table/\n",
            "│   ├── 51_Putting_away_small_table/\n",
            "│   ├── 52_Switching_out_camera_lenses/\n",
            "│   ├── 53_Replacing_batteries_of_electric_caliper/\n",
            "│   ├── 54_Marking_a_cutting_line_on_wood_with_pencil/\n",
            "│   ├── 55_Measuring_angles_with_a_protractor/\n",
            "│   ├── 56_Testing_something_with_a_multimeter_e.g._a_battery/\n",
            "│   ├── 57_Clamping_clamp_onto_table/\n",
            "│   ├── 58_Putting_in_battery_and_SD_card_into_a_camera/\n",
            "│   ├── 59_Sticking_two_pieces_of_wood_together_with_double_sided_tape/\n",
            "│   ├── 5_Cleaning_workplace_from_wood_chips/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_14_Short_5_vrs/\n",
            "│   │   │   ├── mps_User_16_Short_5_vrs/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 60_Cleaning_robot_arm_with_cloth/\n",
            "│   ├── 61_Stripping_a_wire_from_outer_layer/\n",
            "│   ├── 62_Clamping_together_two_pieces_of_wood/\n",
            "│   ├── 63_Detaching_a_fire_extinguisher/\n",
            "│   ├── 64_Attaching_a_fire_extinguisher/\n",
            "│   ├── 65_Taking_out_some_needed_tools_from_a_toolbox/\n",
            "│   ├── 66_Detaching_camera_from_tripod/\n",
            "│   ├── 67_Marking_drill_holes_on_a_piece_of_wood_with_pencil/\n",
            "│   ├── 68_Opening_door/\n",
            "│   ├── 69_Getting_SD_card_and_battery_out_of_the_DSLR_Camera/\n",
            "│   ├── 6_Measuring_the_length_of_a_table/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_16_Short_6_vrs/\n",
            "│   │   │   ├── mps_User_17_Short_6_vrs/\n",
            "│   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── slam/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 70_Assembling_a_drill_machine_bit/\n",
            "│   ├── 71_Sanding_wood_surfaces_with_sandpaper/\n",
            "│   ├── 72_Attaching_zip_ties_to_secure_cables/\n",
            "│   ├── 73_Disassembling_drill_machine/\n",
            "│   ├── 74_Replacing_an_old_blade_in_a_box_cutter/\n",
            "│   ├── 75_Replacing_drilling_machine_battery/\n",
            "│   ├── 76_Tightening_a_screw_of_PC_monitor_with_screwdriver/\n",
            "│   ├── 77_Untightening_a_screw_of_PC_monitor_with_screwdriver/\n",
            "│   ├── 78_Setting_up_a_tripod/\n",
            "│   ├── 79_Dismantling_a_tripod/\n",
            "│   ├── 7_Measuring_a_screw_with_a_caliper/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_16_Short_7_vrs/\n",
            "│   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── slam/\n",
            "│   │   │   ├── mps_User_17_Short_7_vrs/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 80_Checking_level_of_a_table_with_a_spirit_level/\n",
            "│   ├── 81_Pulling_out_a_nail_with_pliers/\n",
            "│   ├── 82_Greasing_drill_attachment_with_a_grease_gun/\n",
            "│   ├── 83_Wrapping_an_object_in_bubble_wrap/\n",
            "│   ├── 84_Bring_out_trash_bag_from_room_and_place_it_in_front_of_door/\n",
            "│   ├── 85_Coiling_an_extension_cord_after_use/\n",
            "│   ├── 86_Uncoiling_an_extension_cord_before_use/\n",
            "│   ├── 87_Opening_hatch_of_big_wooden_trolley/\n",
            "│   ├── 88_Closing_hatch_of_big_wooden_trolley/\n",
            "│   ├── 89_Unbinding_bars/\n",
            "│   ├── 8_Placing_box_in_shelf/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_14_Short_8_vrs/\n",
            "│   │   │   ├── mps_User_15_Short_8_vrs/\n",
            "│   │   ├── vrs/\n",
            "│   ├── 90_Loading_big_wooden_trolley_with_bars/\n",
            "│   ├── 91_Unloading_big_wooden_trolley_from_bars/\n",
            "│   ├── 92_Laying_down_the_carpet/\n",
            "│   ├── 93_Putting_on_a_safety_vest/\n",
            "│   ├── 94_Putting_on_safety_goggles/\n",
            "│   ├── 9_Opening_a_cardboard_box_with_scissors_cutter_knife/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps_User_15_Short_9_vrs/\n",
            "│   │   │   ├── mps_User_16_Short_9_vrs/\n",
            "│   │   ├── vrs/\n",
            "├── Mistake_Detection/\n",
            "│   ├── Task_1/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_10/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   │   ├── mps/\n",
            "│   │   │   │   ├── mps_User_14_2111_10c_1_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   │   ├── slam/\n",
            "│   │   │   │   ├── mps_User_14_2111_10c_3_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   │   ├── slam/\n",
            "│   │   │   │   ├── mps_User_14_411_2111_10m_1_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_14_411_2111_10m_3_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_14_412_2111_10c_2_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   │   ├── slam/\n",
            "│   │   │   │   ├── mps_User_14_412_2111_10m_1_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_14_412_2111_10m_2_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_14_412_2111_10m_3_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_14_412_2111_10m_4_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_14_412_211_10c_1_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_15_412_0511_10c_3_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   │   ├── slam/\n",
            "│   │   │   │   ├── mps_User_15_412_0511_10m_1_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   │   ├── slam/\n",
            "│   │   │   │   ├── mps_User_15_412_0511_10m_2_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   │   ├── slam/\n",
            "│   │   │   │   ├── mps_User_15_412_0511_10m_4_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_16_0611_10c_1_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_16_0611_10m_1_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_16_0611_10m_2_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_17_412_0511_10c_1_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_17_412_0511_10c_2_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_17_412_0511_10m_1_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_17_412_0511_10m_3_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_17_412_0511_10m_4_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_17_412_0511_10m_5_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_17_412_0511_10m_6_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   │   ├── slam/\n",
            "│   │   │   │   ├── mps_User_2_0611_10c_1_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   │   ├── slam/\n",
            "│   │   │   │   ├── mps_User_2_0611_10c_3_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   │   ├── slam/\n",
            "│   │   │   │   ├── mps_User_2_0611_10m_2_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   ├── mps_User_2_0611_10m_3_vrs/\n",
            "│   │   │   │   │   ├── eye_gaze/\n",
            "│   │   │   │   │   ├── hand_tracking/\n",
            "│   │   │   │   │   ├── slam/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_11/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_12/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_13/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_14/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_15/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_16/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_17/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_18/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_19/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_2/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_20/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_21/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_22/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_23/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_24/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_25/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_3/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_4/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_5/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_6/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_7/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_8/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n",
            "│   ├── Task_9/\n",
            "│   │   ├── annotations/\n",
            "│   │   ├── mp4/\n",
            "│   │   ├── mp4_480/\n",
            "│   │   ├── mp4_exo/\n",
            "│   │   ├── mps/\n",
            "│   │   ├── vrs/\n"
          ]
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "## 📘 Overview\n",
        "\n",
        "Below, we present a **small subset of examples** from the IndEgo dataset, chosen to illustrate:\n",
        "\n",
        "- 🧠 The range of **use cases**: from mistake detection to collaborative task understanding  \n",
        "- 🏷️ Rich **annotations** for steps, mistakes, narrations, and more  \n",
        "- 🎥 Multimodal **data streams**: egocentric video, gaze, hand tracking, motion, SLAM  \n",
        "- 📦 How to **access and explore** the dataset directly via Hugging Face and Colab\n"
      ],
      "metadata": {
        "id": "iloYI69tb30k"
      }
    },
    {
      "cell_type": "markdown",
      "source": [
        "## 🎥 Egocentric View: Assembly Task – Embedded Control Unit\n",
        "\n",
        "The following video shows an **egocentric recording** of a user performing an assembly task involving an **Embedded Control Unit (ECU)**."
      ],
      "metadata": {
        "id": "m-zFBWrVaxET"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "# @title\n",
        "from IPython.display import HTML\n",
        "\n",
        "# Assembly scenario video URL (direct access via Hugging Face CDN)\n",
        "video_url = \"https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo/resolve/main/1_Assembly/01_ECU/mp4_480/User_16_410_2110_2_480.mp4\"\n",
        "\n",
        "print(\"🎥 Assembly Scenario: Embedded Control Unit\")\n",
        "HTML(f\"\"\"\n",
        "<video width=\"480\" controls>\n",
        "  <source src=\"{video_url}\" type=\"video/mp4\">\n",
        "  Your browser does not support the video tag.\n",
        "</video>\n",
        "\"\"\")"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 519
        },
        "id": "4nF8sMGqAunU",
        "outputId": "19db3d53-9466-4aaa-abad-5011ef261618",
        "cellView": "form"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "🎥 Assembly Scenario: Embedded Control Unit\n"
          ]
        },
        {
          "output_type": "execute_result",
          "data": {
            "text/plain": [
              "<IPython.core.display.HTML object>"
            ],
            "text/html": [
              "\n",
              "<video width=\"480\" controls>\n",
              "  <source src=\"https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo/resolve/main/1_Assembly/01_ECU/mp4_480/User_16_410_2110_2_480.mp4\" type=\"video/mp4\">\n",
              "  Your browser does not support the video tag.\n",
              "</video>\n"
            ]
          },
          "metadata": {},
          "execution_count": 3
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "## 🤝 Collaborative Work: Dual Egocentric Views\n",
        "\n",
        "This example demonstrates a **collaborative disassembly task** involving two users working on a mechanical desk. Each user wears an egocentric device (smart glasses), capturing their perspective during the task.\n",
        "\n",
        "In the videos below, you can:\n",
        "\n",
        "- 👀 Observe how both users coordinate their actions from different viewpoints  \n",
        "- 🔧 Analyze handovers, object interactions, and tool usage across perspectives  \n",
        "- 🎯 Lay the groundwork for research in collaboration-aware AI, action alignment, and task graph construction\n",
        "\n",
        "> Each view is recorded independently and aligned by shared timestamps and task context."
      ],
      "metadata": {
        "id": "NoH15wXxaKSP"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "# @title\n",
        "from IPython.display import HTML\n",
        "\n",
        "# Collaborative Disassembly Scenario: Two Users working on the same task\n",
        "user1_video = \"https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo/resolve/main/1_Disassembly/03_Mechanical_Desk/mp4_480/User_1_User_15_411_2910_1_480.mp4\"\n",
        "user2_video = \"https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo/resolve/main/1_Disassembly/03_Mechanical_Desk/mp4_480/User_15_User_1_411_2910_1_480.mp4\"\n",
        "\n",
        "print(\"🤝 Collaborative Scenario: Mechanical Desk Disassembly\")\n",
        "\n",
        "HTML(f\"\"\"\n",
        "<table style=\"width: 100%; table-layout: fixed;\">\n",
        "  <tr>\n",
        "    <td style=\"text-align: center;\"><b>User 1 View</b></td>\n",
        "    <td style=\"text-align: center;\"><b>User 15 View</b></td>\n",
        "  </tr>\n",
        "  <tr>\n",
        "    <td>\n",
        "      <video width=\"480\" controls>\n",
        "        <source src=\"{user1_video}\" type=\"video/mp4\">\n",
        "        Your browser does not support the video tag.\n",
        "      </video>\n",
        "    </td>\n",
        "    <td>\n",
        "      <video width=\"480\" controls>\n",
        "        <source src=\"{user2_video}\" type=\"video/mp4\">\n",
        "        Your browser does not support the video tag.\n",
        "      </video>\n",
        "    </td>\n",
        "  </tr>\n",
        "</table>\n",
        "\"\"\")"
      ],
      "metadata": {
        "id": "TQu8pIEFBk6_",
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 546
        },
        "outputId": "c6d49ab6-ed7b-40e8-c967-07f5e8cce410"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "🤝 Collaborative Scenario: Mechanical Desk Disassembly\n"
          ]
        },
        {
          "output_type": "execute_result",
          "data": {
            "text/plain": [
              "<IPython.core.display.HTML object>"
            ],
            "text/html": [
              "\n",
              "<table style=\"width: 100%; table-layout: fixed;\">\n",
              "  <tr>\n",
              "    <td style=\"text-align: center;\"><b>User 1 View</b></td>\n",
              "    <td style=\"text-align: center;\"><b>User 15 View</b></td>\n",
              "  </tr>\n",
              "  <tr>\n",
              "    <td>\n",
              "      <video width=\"480\" controls>\n",
              "        <source src=\"https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo/resolve/main/1_Disassembly/03_Mechanical_Desk/mp4_480/User_1_User_15_411_2910_1_480.mp4\" type=\"video/mp4\">\n",
              "        Your browser does not support the video tag.\n",
              "      </video>\n",
              "    </td>\n",
              "    <td>\n",
              "      <video width=\"480\" controls>\n",
              "        <source src=\"https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo/resolve/main/1_Disassembly/03_Mechanical_Desk/mp4_480/User_15_User_1_411_2910_1_480.mp4\" type=\"video/mp4\">\n",
              "        Your browser does not support the video tag.\n",
              "      </video>\n",
              "    </td>\n",
              "  </tr>\n",
              "</table>\n"
            ]
          },
          "metadata": {},
          "execution_count": 3
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "## 🧠 Fine-Grained Temporal Annotations\n",
        "\n",
        "This section loads the fine-grained **temporal action annotations** for one of the collaborative disassembly tasks. Each row represents a time segment labeled with a high-level action (e.g., *\"Remove Tabletop Screws\"*, *\"Find Tools\"*, *\"Help Worker 2\"*).\n",
        "\n",
        "These annotations are useful for:\n",
        "- ⏱️ Action recognition and temporal localization\n",
        "- ❌ Mistake detection or sequence validation\n",
        "- 🤖 Task graph learning and robotic imitation\n",
        "\n",
        "> The annotations were created using the [VGG VIA](http://www.robots.ox.ac.uk/~vgg/software/via/) tool and are structured as temporal segments in JSON format."
      ],
      "metadata": {
        "id": "TX7IcqGxb0MO"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "# @title\n",
        "import json\n",
        "import pandas as pd\n",
        "import requests\n",
        "\n",
        "# Load the annotation JSON from Hugging Face\n",
        "annotation_url = \"https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo/resolve/main/1_Disassembly/03_Mechanical_Desk/annotations/A_User_1_User_15_411_2910_1.json\"\n",
        "data = requests.get(annotation_url).json()\n",
        "\n",
        "# Ask user for the starting time (in seconds)\n",
        "start_time_input = float(input(\"Enter a time in seconds (e.g., 200): \"))\n",
        "\n",
        "# Parse the temporal segments\n",
        "segments = []\n",
        "for meta in data[\"metadata\"].values():\n",
        "    if \"z\" in meta and \"av\" in meta:\n",
        "        start = meta[\"z\"][0]\n",
        "        end = meta[\"z\"][1] if len(meta[\"z\"]) > 1 else None\n",
        "        if start >= start_time_input:\n",
        "            label = list(meta[\"av\"].values())[0]\n",
        "            duration = round(end - start, 2) if end else \"N/A\"\n",
        "            segments.append({\n",
        "                \"Action Label\": label,\n",
        "                \"Start Time (s)\": round(start, 2),\n",
        "                \"End Time (s)\": round(end, 2) if end else \"—\",\n",
        "                \"Duration (s)\": duration\n",
        "            })\n",
        "\n",
        "# Display results\n",
        "if segments:\n",
        "    df = pd.DataFrame(segments)\n",
        "    df.sort_values(\"Start Time (s)\", inplace=True)\n",
        "    df.reset_index(drop=True, inplace=True)\n",
        "    display(df.head(10))\n",
        "else:\n",
        "    print(f\"No annotations found starting at or after {start_time_input} seconds.\")"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 380
        },
        "id": "uJney6TsYYGu",
        "outputId": "dda7667b-1210-4cb6-ea63-75798351e216",
        "cellView": "form"
      },
      "execution_count": null,
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Enter a time in seconds (e.g., 200): 200\n"
          ]
        },
        {
          "output_type": "display_data",
          "data": {
            "text/plain": [
              "                        Action Label  Start Time (s) End Time (s) Duration (s)\n",
              "0                      Help Worker 2          205.64       218.39        12.75\n",
              "1                         Find Tools          220.89       262.76        41.88\n",
              "2           Prepare Drilling Machine          262.76       335.51        72.75\n",
              "3             Carry Table to the Lab          299.13            —          N/A\n",
              "4             Remove Tabletop Screws          335.51       350.39        14.87\n",
              "5  Hand Drilling Machine to Coworker          350.39       354.89          4.5\n",
              "6             Remove Tabletop Screws          354.89       442.89         88.0\n",
              "7                           Planning          442.89       458.39         15.5\n",
              "8                      Adjust Height          458.39       483.51        25.12\n",
              "9             Remove Tabletop Screws          483.51       518.26        34.75"
            ],
            "text/html": [
              "\n",
              "  <div id=\"df-72eb44ff-7ab0-438b-9ce4-0204feb3aee5\" class=\"colab-df-container\">\n",
              "    <div>\n",
              "<style scoped>\n",
              "    .dataframe tbody tr th:only-of-type {\n",
              "        vertical-align: middle;\n",
              "    }\n",
              "\n",
              "    .dataframe tbody tr th {\n",
              "        vertical-align: top;\n",
              "    }\n",
              "\n",
              "    .dataframe thead th {\n",
              "        text-align: right;\n",
              "    }\n",
              "</style>\n",
              "<table border=\"1\" class=\"dataframe\">\n",
              "  <thead>\n",
              "    <tr style=\"text-align: right;\">\n",
              "      <th></th>\n",
              "      <th>Action Label</th>\n",
              "      <th>Start Time (s)</th>\n",
              "      <th>End Time (s)</th>\n",
              "      <th>Duration (s)</th>\n",
              "    </tr>\n",
              "  </thead>\n",
              "  <tbody>\n",
              "    <tr>\n",
              "      <th>0</th>\n",
              "      <td>Help Worker 2</td>\n",
              "      <td>205.64</td>\n",
              "      <td>218.39</td>\n",
              "      <td>12.75</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>1</th>\n",
              "      <td>Find Tools</td>\n",
              "      <td>220.89</td>\n",
              "      <td>262.76</td>\n",
              "      <td>41.88</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>2</th>\n",
              "      <td>Prepare Drilling Machine</td>\n",
              "      <td>262.76</td>\n",
              "      <td>335.51</td>\n",
              "      <td>72.75</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>3</th>\n",
              "      <td>Carry Table to the Lab</td>\n",
              "      <td>299.13</td>\n",
              "      <td>—</td>\n",
              "      <td>N/A</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>4</th>\n",
              "      <td>Remove Tabletop Screws</td>\n",
              "      <td>335.51</td>\n",
              "      <td>350.39</td>\n",
              "      <td>14.87</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>5</th>\n",
              "      <td>Hand Drilling Machine to Coworker</td>\n",
              "      <td>350.39</td>\n",
              "      <td>354.89</td>\n",
              "      <td>4.5</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>6</th>\n",
              "      <td>Remove Tabletop Screws</td>\n",
              "      <td>354.89</td>\n",
              "      <td>442.89</td>\n",
              "      <td>88.0</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>7</th>\n",
              "      <td>Planning</td>\n",
              "      <td>442.89</td>\n",
              "      <td>458.39</td>\n",
              "      <td>15.5</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>8</th>\n",
              "      <td>Adjust Height</td>\n",
              "      <td>458.39</td>\n",
              "      <td>483.51</td>\n",
              "      <td>25.12</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th>9</th>\n",
              "      <td>Remove Tabletop Screws</td>\n",
              "      <td>483.51</td>\n",
              "      <td>518.26</td>\n",
              "      <td>34.75</td>\n",
              "    </tr>\n",
              "  </tbody>\n",
              "</table>\n",
              "</div>\n",
              "    <div class=\"colab-df-buttons\">\n",
              "\n",
              "  <div class=\"colab-df-container\">\n",
              "    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-72eb44ff-7ab0-438b-9ce4-0204feb3aee5')\"\n",
              "            title=\"Convert this dataframe to an interactive table.\"\n",
              "            style=\"display:none;\">\n",
              "\n",
              "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\" viewBox=\"0 -960 960 960\">\n",
              "    <path d=\"M120-120v-720h720v720H120Zm60-500h600v-160H180v160Zm220 220h160v-160H400v160Zm0 220h160v-160H400v160ZM180-400h160v-160H180v160Zm440 0h160v-160H620v160ZM180-180h160v-160H180v160Zm440 0h160v-160H620v160Z\"/>\n",
              "  </svg>\n",
              "    </button>\n",
              "\n",
              "  <style>\n",
              "    .colab-df-container {\n",
              "      display:flex;\n",
              "      gap: 12px;\n",
              "    }\n",
              "\n",
              "    .colab-df-convert {\n",
              "      background-color: #E8F0FE;\n",
              "      border: none;\n",
              "      border-radius: 50%;\n",
              "      cursor: pointer;\n",
              "      display: none;\n",
              "      fill: #1967D2;\n",
              "      height: 32px;\n",
              "      padding: 0 0 0 0;\n",
              "      width: 32px;\n",
              "    }\n",
              "\n",
              "    .colab-df-convert:hover {\n",
              "      background-color: #E2EBFA;\n",
              "      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
              "      fill: #174EA6;\n",
              "    }\n",
              "\n",
              "    .colab-df-buttons div {\n",
              "      margin-bottom: 4px;\n",
              "    }\n",
              "\n",
              "    [theme=dark] .colab-df-convert {\n",
              "      background-color: #3B4455;\n",
              "      fill: #D2E3FC;\n",
              "    }\n",
              "\n",
              "    [theme=dark] .colab-df-convert:hover {\n",
              "      background-color: #434B5C;\n",
              "      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
              "      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
              "      fill: #FFFFFF;\n",
              "    }\n",
              "  </style>\n",
              "\n",
              "    <script>\n",
              "      const buttonEl =\n",
              "        document.querySelector('#df-72eb44ff-7ab0-438b-9ce4-0204feb3aee5 button.colab-df-convert');\n",
              "      buttonEl.style.display =\n",
              "        google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
              "\n",
              "      async function convertToInteractive(key) {\n",
              "        const element = document.querySelector('#df-72eb44ff-7ab0-438b-9ce4-0204feb3aee5');\n",
              "        const dataTable =\n",
              "          await google.colab.kernel.invokeFunction('convertToInteractive',\n",
              "                                                    [key], {});\n",
              "        if (!dataTable) return;\n",
              "\n",
              "        const docLinkHtml = 'Like what you see? Visit the ' +\n",
              "          '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
              "          + ' to learn more about interactive tables.';\n",
              "        element.innerHTML = '';\n",
              "        dataTable['output_type'] = 'display_data';\n",
              "        await google.colab.output.renderOutput(dataTable, element);\n",
              "        const docLink = document.createElement('div');\n",
              "        docLink.innerHTML = docLinkHtml;\n",
              "        element.appendChild(docLink);\n",
              "      }\n",
              "    </script>\n",
              "  </div>\n",
              "\n",
              "\n",
              "    <div id=\"df-d6a9ec57-72d6-4f37-b9c2-5990abe6f02d\">\n",
              "      <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-d6a9ec57-72d6-4f37-b9c2-5990abe6f02d')\"\n",
              "                title=\"Suggest charts\"\n",
              "                style=\"display:none;\">\n",
              "\n",
              "<svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
              "     width=\"24px\">\n",
              "    <g>\n",
              "        <path d=\"M19 3H5c-1.1 0-2 .9-2 2v14c0 1.1.9 2 2 2h14c1.1 0 2-.9 2-2V5c0-1.1-.9-2-2-2zM9 17H7v-7h2v7zm4 0h-2V7h2v10zm4 0h-2v-4h2v4z\"/>\n",
              "    </g>\n",
              "</svg>\n",
              "      </button>\n",
              "\n",
              "<style>\n",
              "  .colab-df-quickchart {\n",
              "      --bg-color: #E8F0FE;\n",
              "      --fill-color: #1967D2;\n",
              "      --hover-bg-color: #E2EBFA;\n",
              "      --hover-fill-color: #174EA6;\n",
              "      --disabled-fill-color: #AAA;\n",
              "      --disabled-bg-color: #DDD;\n",
              "  }\n",
              "\n",
              "  [theme=dark] .colab-df-quickchart {\n",
              "      --bg-color: #3B4455;\n",
              "      --fill-color: #D2E3FC;\n",
              "      --hover-bg-color: #434B5C;\n",
              "      --hover-fill-color: #FFFFFF;\n",
              "      --disabled-bg-color: #3B4455;\n",
              "      --disabled-fill-color: #666;\n",
              "  }\n",
              "\n",
              "  .colab-df-quickchart {\n",
              "    background-color: var(--bg-color);\n",
              "    border: none;\n",
              "    border-radius: 50%;\n",
              "    cursor: pointer;\n",
              "    display: none;\n",
              "    fill: var(--fill-color);\n",
              "    height: 32px;\n",
              "    padding: 0;\n",
              "    width: 32px;\n",
              "  }\n",
              "\n",
              "  .colab-df-quickchart:hover {\n",
              "    background-color: var(--hover-bg-color);\n",
              "    box-shadow: 0 1px 2px rgba(60, 64, 67, 0.3), 0 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
              "    fill: var(--button-hover-fill-color);\n",
              "  }\n",
              "\n",
              "  .colab-df-quickchart-complete:disabled,\n",
              "  .colab-df-quickchart-complete:disabled:hover {\n",
              "    background-color: var(--disabled-bg-color);\n",
              "    fill: var(--disabled-fill-color);\n",
              "    box-shadow: none;\n",
              "  }\n",
              "\n",
              "  .colab-df-spinner {\n",
              "    border: 2px solid var(--fill-color);\n",
              "    border-color: transparent;\n",
              "    border-bottom-color: var(--fill-color);\n",
              "    animation:\n",
              "      spin 1s steps(1) infinite;\n",
              "  }\n",
              "\n",
              "  @keyframes spin {\n",
              "    0% {\n",
              "      border-color: transparent;\n",
              "      border-bottom-color: var(--fill-color);\n",
              "      border-left-color: var(--fill-color);\n",
              "    }\n",
              "    20% {\n",
              "      border-color: transparent;\n",
              "      border-left-color: var(--fill-color);\n",
              "      border-top-color: var(--fill-color);\n",
              "    }\n",
              "    30% {\n",
              "      border-color: transparent;\n",
              "      border-left-color: var(--fill-color);\n",
              "      border-top-color: var(--fill-color);\n",
              "      border-right-color: var(--fill-color);\n",
              "    }\n",
              "    40% {\n",
              "      border-color: transparent;\n",
              "      border-right-color: var(--fill-color);\n",
              "      border-top-color: var(--fill-color);\n",
              "    }\n",
              "    60% {\n",
              "      border-color: transparent;\n",
              "      border-right-color: var(--fill-color);\n",
              "    }\n",
              "    80% {\n",
              "      border-color: transparent;\n",
              "      border-right-color: var(--fill-color);\n",
              "      border-bottom-color: var(--fill-color);\n",
              "    }\n",
              "    90% {\n",
              "      border-color: transparent;\n",
              "      border-bottom-color: var(--fill-color);\n",
              "    }\n",
              "  }\n",
              "</style>\n",
              "\n",
              "      <script>\n",
              "        async function quickchart(key) {\n",
              "          const quickchartButtonEl =\n",
              "            document.querySelector('#' + key + ' button');\n",
              "          quickchartButtonEl.disabled = true;  // To prevent multiple clicks.\n",
              "          quickchartButtonEl.classList.add('colab-df-spinner');\n",
              "          try {\n",
              "            const charts = await google.colab.kernel.invokeFunction(\n",
              "                'suggestCharts', [key], {});\n",
              "          } catch (error) {\n",
              "            console.error('Error during call to suggestCharts:', error);\n",
              "          }\n",
              "          quickchartButtonEl.classList.remove('colab-df-spinner');\n",
              "          quickchartButtonEl.classList.add('colab-df-quickchart-complete');\n",
              "        }\n",
              "        (() => {\n",
              "          let quickchartButtonEl =\n",
              "            document.querySelector('#df-d6a9ec57-72d6-4f37-b9c2-5990abe6f02d button');\n",
              "          quickchartButtonEl.style.display =\n",
              "            google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
              "        })();\n",
              "      </script>\n",
              "    </div>\n",
              "\n",
              "    </div>\n",
              "  </div>\n"
            ],
            "application/vnd.google.colaboratory.intrinsic+json": {
              "type": "dataframe",
              "summary": "{\n  \"name\": \"    print(f\\\"No annotations found starting at or after {start_time_input} seconds\",\n  \"rows\": 10,\n  \"fields\": [\n    {\n      \"column\": \"Action Label\",\n      \"properties\": {\n        \"dtype\": \"string\",\n        \"num_unique_values\": 8,\n        \"samples\": [\n          \"Find Tools\",\n          \"Hand Drilling Machine to Coworker\",\n          \"Help Worker 2\"\n        ],\n        \"semantic_type\": \"\",\n        \"description\": \"\"\n      }\n    },\n    {\n      \"column\": \"Start Time (s)\",\n      \"properties\": {\n        \"dtype\": \"number\",\n        \"std\": 97.41324619030685,\n        \"min\": 205.64,\n        \"max\": 483.51,\n        \"num_unique_values\": 10,\n        \"samples\": [\n          458.39,\n          220.89,\n          350.39\n        ],\n        \"semantic_type\": \"\",\n        \"description\": \"\"\n      }\n    },\n    {\n      \"column\": \"End Time (s)\",\n      \"properties\": {\n        \"dtype\": \"string\",\n        \"num_unique_values\": 10,\n        \"samples\": [\n          483.51,\n          262.76,\n          354.89\n        ],\n        \"semantic_type\": \"\",\n        \"description\": \"\"\n      }\n    },\n    {\n      \"column\": \"Duration (s)\",\n      \"properties\": {\n        \"dtype\": \"string\",\n        \"num_unique_values\": 10,\n        \"samples\": [\n          25.12,\n          41.88,\n          4.5\n        ],\n        \"semantic_type\": \"\",\n        \"description\": \"\"\n      }\n    }\n  ]\n}"
            }
          },
          "metadata": {}
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "## 🗣️ Verbal Narration Transcript\n",
        "\n",
        "Our dataset includes user narration for several scenarios.\n",
        "\n",
        "Below is the automatically aligned **narration transcript** for the selected egocentric video (`User_1_User_15_411_2910_1`).\n",
        "\n",
        "These transcripts contain the user’s spoken thoughts and intentions during task execution, offering valuable context for:\n",
        "\n",
        "- 🧠 Understanding reasoning and decision-making  \n",
        "- 🔎 Interpreting ambiguous actions  \n",
        "- 🤝 Linking visual actions with collaborative intent\n"
      ],
      "metadata": {
        "id": "rOfg6xx4rTJ5"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "# @title\n",
        "import requests\n",
        "import json\n",
        "from IPython.display import display, HTML\n",
        "\n",
        "# URL to narration transcripts\n",
        "narration_url = \"https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo/resolve/main/1_Disassembly/narration_transcript_disassembly.json\"\n",
        "\n",
        "# Load the JSON file\n",
        "data = requests.get(narration_url).json()\n",
        "\n",
        "# Target video name\n",
        "target_name = \"User_1_User_15_411_2910_1_480.mp4\"\n",
        "\n",
        "# Search for the matching transcript\n",
        "transcript_text = None\n",
        "for entry in data:\n",
        "    if entry.get(\"name\") == target_name:\n",
        "        transcript_text = entry.get(\"transcript\")\n",
        "        break\n",
        "\n",
        "# Display result in scrollable box with larger font\n",
        "if transcript_text:\n",
        "    display(HTML(f\"\"\"\n",
        "    <h4>🗣️ Narration for <code>{target_name}</code></h4>\n",
        "    <div style=\"border:1px solid #ccc; padding:10px; max-height:400px; overflow-y:auto; white-space:pre-wrap; font-size:16px; line-height:1.5;\">\n",
        "    {transcript_text}\n",
        "    </div>\n",
        "    \"\"\"))\n",
        "else:\n",
        "    print(f\"No transcript found for video name '{target_name}'.\")"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 479
        },
        "cellView": "form",
        "id": "G34FjkEcuHRG",
        "outputId": "1716c6fe-08ff-4015-91ba-9c9e4319b278"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "display_data",
          "data": {
            "text/plain": [
              "<IPython.core.display.HTML object>"
            ],
            "text/html": [
              "\n",
              "    <h4>🗣️ Narration for <code>User_1_User_15_411_2910_1_480.mp4</code></h4>\n",
              "    <div style=\"border:1px solid #ccc; padding:10px; max-height:400px; overflow-y:auto; white-space:pre-wrap; font-size:16px; line-height:1.5;\">\n",
              "     so let's first we get some tools so you can empty that trolley and bring it to the other room and I can go here  Any other tools there?  Let me see if this dual fits. It's too large. Hello. Oh, sorry.  You can carry this to the other room.  Can maybe place this here and take the trolley back. No, I mean just here. It's out of the way. And position this here.  So we need a couple of different tools for this. Firstly, of course, the crosshead screwdrivers for the upper wooden table. And then we can first we can take this off and then we can disassemble the lower frame. So.  uh we could also flip it but the problem is that these things are stuck so we cannot flip it at the moment and also prepare the drilling machine too  So it is attached using the screws. So there's two on this side here and there's one somewhere in the middle. So if you come in the front, you should be able to see.  You can also use this if you want. I think there's a screw somewhere on the inside here. Yeah, but this side is not moving. And I cannot reach it without going in here and somehow reaching for the tool.  Let me check. OK. And the problem is that the height of the table is just too low. Can you pass me that too? Thanks.  Let's just do a temporary solution. Maybe we can put the trolley, put this under trolley and raise the height slightly. We cannot move it because if you check the wooden desk is in the way or maybe we can move the desk and then you can raise it. I think that's a slightly easier solution.  yeah i think that should be sufficient so let's check again okay now it is much easier to reach it  so now we can maybe remove this and place it here it would be at a risk of sliding i'm guessing so  okay so let's flip this then okay so then the instructions are need to have some gloves first of all  I think the other pair of gloves are in the other room where the safety kit is. You can go pick them up.  Let's use this if you want  i think we have another bit here and you need this bit so i'm guessing but you could do like the big screws okay let's do that  Or perhaps it's a bad idea to try this because some of them are too tight. So we have to start with the first loosen. We have to first loosen them, I think.  I think they are quite small anyway, so we don't need the drilling machine  Did you remove the lower ones already? Okay. Just place it here.  so i think these have the same size i think this was placed here to guide the crank so i think we can unscrew first the outer ones and then the inner ones you can find a drill bit  This should work.  Okay.  This end seems to be extremely tightly fixed. You have to go the other direction. Like this way. Am I screwing it accidentally? You're tightening it.  I can take the longer one.  I can separate them.  so all the parts have been separated and yeah then we can just put the tools back and finish the process  And the other drilling machine is here.  Can you put this in? And I'll take the trolley out.  Okay, the process is complete.\n",
              "    </div>\n",
              "    "
            ]
          },
          "metadata": {}
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "## 🪵 Visualizing Egocentric Interaction: Rasping a Wooden Block (User 14)\n",
        "\n",
        "This example demonstrates how to visualize a lightweight egocentric scenario using **Project Aria's MPS data** rendered in the **Rerun SDK**.\n",
        "\n",
        "We load and display:\n",
        "- 🎥 Egocentric video from **User 14**\n",
        "- 👁️ Eye gaze vectors\n",
        "- ✋ Hand pose trajectories (wrist & palm)\n",
        "- 🧭 SLAM trajectory from closed-loop mapping\n",
        "- 🌍 3D global point cloud\n",
        "\n",
        "This takes a few minutes to load, due to the large file sizes and their processing.\n",
        "\n",
        "> ⚡ Tip: You can interact with the scene using zoom, pan, or object selection directly in the viewer below.\n"
      ],
      "metadata": {
        "id": "C-2Gnj7KaJRc"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "# @title\n",
        "# Install rerun SDK with notebook support and projectaria_tools\n",
        "!pip install -q \"rerun-sdk[notebook]\" projectaria-tools[all]"
      ],
      "metadata": {
        "id": "Kj8gJobvuxi3",
        "cellView": "form"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "# @title\n",
        "# ⚡ Lightweight sample: Singular Action 26 (Rasping a Wooden Block, User-14)\n",
        "\n",
        "import pathlib, requests, shutil, rerun as rr, tqdm\n",
        "\n",
        "# --------------------------------------------------------------------\n",
        "# 1.  Download required files (few MB each, so ~ seconds to fetch)\n",
        "# --------------------------------------------------------------------\n",
        "base = \"https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo/resolve/main/8_Singular_Actions/26_Rasping_a_wooden_block\"\n",
        "urls = {\n",
        "    \"vrs\"       : f\"{base}/vrs/User_14_Short_26.vrs\",\n",
        "    \"trajectory\": f\"{base}/mps/mps_User_14_Short_26_vrs/slam/closed_loop_trajectory.csv\",\n",
        "    \"points\"    : f\"{base}/mps/mps_User_14_Short_26_vrs/slam/semidense_points.csv.gz\",\n",
        "    \"gaze\"      : f\"{base}/mps/mps_User_14_Short_26_vrs/eye_gaze/general_eye_gaze.csv\",\n",
        "    \"hands\"     : f\"{base}/mps/mps_User_14_Short_26_vrs/hand_tracking/wrist_and_palm_poses.csv\",\n",
        "}\n",
        "\n",
        "dl_dir = pathlib.Path(\"mps_sample26\"); dl_dir.mkdir(exist_ok=True)\n",
        "def fetch(url, dst):\n",
        "    if dst.exists():\n",
        "        return\n",
        "    print(\"↓\", dst.name)\n",
        "    with requests.get(url, stream=True) as r, open(dst, \"wb\") as f, tqdm.tqdm(\n",
        "        total=int(r.headers.get(\"content-length\", 0)), unit=\"B\", unit_scale=True\n",
        "    ) as bar:\n",
        "        for chunk in r.iter_content(chunk_size=1 << 20):\n",
        "            f.write(chunk); bar.update(len(chunk))\n",
        "\n",
        "for tag, url in urls.items():\n",
        "    fetch(url, dl_dir / pathlib.Path(url).name)\n",
        "\n",
        "# --------------------------------------------------------------------\n",
        "# 2.  Visualize with Rerun (inline; downsample for speed)\n",
        "# --------------------------------------------------------------------\n",
        "from projectaria_tools.utils.rerun_viewer_mps import log_mps_to_rerun\n",
        "\n",
        "rr.init(\"IndEgo_MPS_Viewer_Sample26\", spawn=False)\n",
        "\n",
        "log_mps_to_rerun(\n",
        "    vrs_path                  = str(dl_dir / \"User_14_Short_26.vrs\"),\n",
        "    trajectory_files          = [str(dl_dir / \"closed_loop_trajectory.csv\")],\n",
        "    points_files              = [str(dl_dir / \"semidense_points.csv.gz\")],\n",
        "    eye_gaze_file             =  str(dl_dir / \"general_eye_gaze.csv\"),\n",
        "    wrist_and_palm_poses_file =  str(dl_dir / \"wrist_and_palm_poses.csv\"),\n",
        "    hand_tracking_results_file= None,\n",
        "    down_sampling_factor      = 8,     # <- larger factor = faster\n",
        "    should_rectify_image      = True,\n",
        "    should_rotate_image       = True,\n",
        ")\n",
        "\n",
        "iframe = rr.notebook_show(height=600)\n",
        "if iframe is None:                      # fallback to web viewer if inline fails\n",
        "    url = rr.serve_web(port=7000)\n",
        "    from IPython.display import IFrame, HTML\n",
        "    display(HTML(f\"<p>Inline viewer disabled – open in browser:<br><a href='{url}' target='_blank'>{url}</a></p>\"))\n",
        "    display(IFrame(url, width=\"100%\", height=600))\n"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 830,
          "referenced_widgets": [
            "6d69c7fe088c4cdabb7b6506dc7813da",
            "2e93afa71152452f9e0d6a13b043d1ec",
            "5ed03eb0229346af9b6c8253c484a713"
          ]
        },
        "id": "RN0RlqE-uzrg",
        "outputId": "2b7eec62-b854-4983-eea9-35eb9e105d4f",
        "cellView": "form"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "↓ closed_loop_trajectory.csv\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "100%|██████████| 6.70M/6.70M [00:00<00:00, 41.6MB/s]\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "↓ semidense_points.csv.gz\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "100%|██████████| 2.35M/2.35M [00:00<00:00, 6.77MB/s]\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "↓ general_eye_gaze.csv\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "100%|██████████| 60.9k/60.9k [00:00<00:00, 7.28MB/s]\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Loading and logging trajectory(ies)...\n",
            "Loading: mps_sample26/closed_loop_trajectory.csv\n",
            "Showing: mps_sample26/closed_loop_trajectory.csv as world/device_trajectory\n",
            "Loading and logging point cloud(s)...\n",
            "Showing: mps_sample26/semidense_points.csv.gz as world/points\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "100%|██████████| 221/221 [04:57<00:00,  1.35s/it]\n"
          ]
        },
        {
          "output_type": "display_data",
          "data": {
            "text/plain": [
              "Viewer()"
            ],
            "application/vnd.jupyter.widget-view+json": {
              "version_major": 2,
              "version_minor": 0,
              "model_id": "6d69c7fe088c4cdabb7b6506dc7813da"
            }
          },
          "metadata": {
            "application/vnd.jupyter.widget-view+json": {
              "colab": {
                "custom_widget_manager": {
                  "url": "https://ssl.gstatic.com/colaboratory-static/widgets/colab-cdn-widget-manager/2b70e893a8ba7c0f/manager.min.js"
                }
              }
            }
          }
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "## 🔭 Vision: Egocentric AI for the Future of Industrial Work\n",
        "\n",
        "As industries grow more complex and collaborative, traditional automation alone cannot address the dynamic, high-context nature of real-world tasks. We believe **Egocentric AI**—AI grounded in first-person multimodal perception—is the next frontier for intelligent industrial systems.\n",
        "\n",
        "By combining real-time video, eye gaze, audio, hand tracking, and spatial mapping from wearable devices, **Egocentric AI enables machines to understand what workers see, do, and intend**. This opens the door to next-generation AI assistants that are:\n",
        "\n",
        "👀 **Context-aware** — understanding the workflow from the user’s visual perspective  \n",
        "🛠️ **Task-aware** — grounding perception in structured tasks like assembly, inspection, or repair  \n",
        "🧠 **Mistake-aware** — detecting errors, omissions, or suboptimal sequences early  \n",
        "🤝 **Collaboration-aware** — supporting coordination between humans and machines\n",
        "\n",
        "---\n",
        "\n",
        "## 🧪 IndEgo Benchmarks: Advancing Egocentric Industrial Intelligence\n",
        "\n",
        "To accelerate progress in this domain, we introduce **five research benchmarks** built on real-world industrial scenarios captured via wearable devices:\n",
        "\n",
        "**❌ Mistake Detection**  \n",
        "  Detect skipped, reversed, or incorrectly executed steps in procedural workflows.\n",
        "\n",
        "**🧠 Video QA with Reasoning**  \n",
        "  Answer task-specific and commonsense questions from egocentric video using vision-language models.\n",
        "\n",
        "**📝 Video Summarization**  \n",
        "  Generate coherent, structured summaries of industrial tasks from raw video.\n",
        "\n",
        "**🤝 Task Understanding from a Collaborative Perspective**  \n",
        "  Model shared task graphs and coordination across multiple egocentric views.\n",
        "\n",
        "**🎬 Action Recognition**  \n",
        "  Identify fine-grained user actions and human-object interactions in first-person video.\n",
        "\n",
        "Each benchmark captures a unique challenge for building perceptive, adaptive, and helpful AI systems in realistic industrial environments."
      ],
      "metadata": {
        "id": "R3waWyc7aFyC"
      }
    },
    {
      "cell_type": "markdown",
      "source": [
        "## 🧪 Mistake Detection\n",
        "\n",
        "In this example, two workers perform the same task: **Loading a trolley into a hatch**. One performs it correctly; the other makes a mistake.\n",
        "\n",
        "### ✅ Expected Steps:\n",
        "1. Open hatch  \n",
        "2. Put on gloves  \n",
        "3. Load trolley securely  \n",
        "4. Close hatch  \n",
        "5. Check if loaded securely\n",
        "\n",
        "Watch both videos side by side and consider:\n",
        "- Which worker made a mistake?\n",
        "- What step(s) did they skip or do incorrectly?"
      ],
      "metadata": {
        "id": "XTZU8eV2jh3q"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "# @title\n",
        "from IPython.display import HTML, display\n",
        "\n",
        "# Correct and mistake video URLs\n",
        "correct_url = \"https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo/resolve/main/Mistake_Detection/Task_10/mp4_480/User_1_H_10c_3_480.mp4\"\n",
        "mistake_url = \"https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo/resolve/main/Mistake_Detection/Task_10/mp4_480/User_16_0611_10m_3_480.mp4\"\n",
        "\n",
        "# Display side-by-side videos\n",
        "display(HTML(f\"\"\"\n",
        "<table>\n",
        "<tr>\n",
        "  <th style=\"text-align:center\">Example 1</th>\n",
        "  <th style=\"text-align:center\">Example 2</th>\n",
        "</tr>\n",
        "<tr>\n",
        "<td>\n",
        "  <video width=\"480\" controls>\n",
        "    <source src=\"{correct_url}\" type=\"video/mp4\">\n",
        "    Your browser does not support the video tag.\n",
        "  </video>\n",
        "</td>\n",
        "<td>\n",
        "  <video width=\"480\" controls>\n",
        "    <source src=\"{mistake_url}\" type=\"video/mp4\">\n",
        "    Your browser does not support the video tag.\n",
        "  </video>\n",
        "</td>\n",
        "</tr>\n",
        "</table>\n",
        "\n",
        "<p><strong>🤔 Can you identify which step was skipped or done incorrectly in the second video?</strong></p>\n",
        "\"\"\"))\n"
      ],
      "metadata": {
        "id": "1MdkLnSKzBTk",
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 558
        },
        "outputId": "e5e7a2d5-7005-4bdf-9ee8-44be605affae"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "display_data",
          "data": {
            "text/plain": [
              "<IPython.core.display.HTML object>"
            ],
            "text/html": [
              "\n",
              "<table>\n",
              "<tr>\n",
              "  <th style=\"text-align:center\">Example 1</th>\n",
              "  <th style=\"text-align:center\">Example 2</th>\n",
              "</tr>\n",
              "<tr>\n",
              "<td>\n",
              "  <video width=\"480\" controls>\n",
              "    <source src=\"https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo/resolve/main/Mistake_Detection/Task_10/mp4_480/User_1_H_10c_3_480.mp4\" type=\"video/mp4\">\n",
              "    Your browser does not support the video tag.\n",
              "  </video>\n",
              "</td>\n",
              "<td>\n",
              "  <video width=\"480\" controls>\n",
              "    <source src=\"https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo/resolve/main/Mistake_Detection/Task_10/mp4_480/User_16_0611_10m_3_480.mp4\" type=\"video/mp4\">\n",
              "    Your browser does not support the video tag.\n",
              "  </video>\n",
              "</td>\n",
              "</tr>\n",
              "</table>\n",
              "\n",
              "<p><strong>🤔 Can you identify which step was skipped or done incorrectly in the second video?</strong></p>\n"
            ]
          },
          "metadata": {}
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "### ✅ Ground Truth: Mistake Detection Annotations\n",
        "\n",
        "The table below shows the **step-by-step mistake analysis** for the two videos.  \n",
        "Each step is marked as correct (✅) or mistaken (❌), along with a short explanation where applicable."
      ],
      "metadata": {
        "id": "qlK0b9_hl5Tq"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "# @title\n",
        "import requests\n",
        "import json\n",
        "import pandas as pd\n",
        "from IPython.display import display, HTML\n",
        "\n",
        "# Annotation file URL\n",
        "annotation_url = \"https://huggingface.co/datasets/vivek9chavan/IndEgo_Demo/resolve/main/Mistake_Detection/Task_10/annotations/A_Task_10.json\"\n",
        "\n",
        "# Load the JSON\n",
        "annotations = requests.get(annotation_url).json()\n",
        "\n",
        "# Define expected steps\n",
        "steps = [\n",
        "    \"Open hatch\",\n",
        "    \"Put on gloves\",\n",
        "    \"Load trolley securely\",\n",
        "    \"Close hatch\",\n",
        "    \"Check if loaded securely\"\n",
        "]\n",
        "\n",
        "# Video keys (strip file extensions)\n",
        "correct_key = \"User_1_H_10c_3\"\n",
        "mistake_key = \"User_16_0611_10m_3\"\n",
        "\n",
        "# Helper to format results\n",
        "def parse_entry(entry):\n",
        "    return [\n",
        "        {\n",
        "            \"mistake\": \"✅\" if m == 0 else \"❌\",\n",
        "            \"description\": d if d else \"\"\n",
        "        }\n",
        "        for m, d in zip(entry[\"mistakes\"], entry[\"description\"])\n",
        "    ]\n",
        "\n",
        "correct_result = parse_entry(annotations.get(correct_key, {}))\n",
        "mistake_result = parse_entry(annotations.get(mistake_key, {}))\n",
        "\n",
        "# Create comparison DataFrame\n",
        "df = pd.DataFrame({\n",
        "    \"Step\": steps,\n",
        "    \"Correct\": [e[\"mistake\"] for e in correct_result],\n",
        "    \"Mistake\": [e[\"mistake\"] for e in mistake_result],\n",
        "    \"Mistake Description\": [e[\"description\"] for e in mistake_result]\n",
        "})\n",
        "\n",
        "# Display as styled table without using hide_index (compatible with older pandas)\n",
        "def render_table(df):\n",
        "    styled = df.style \\\n",
        "        .set_table_attributes('style=\"width:100%; border:1px solid #ccc;\"') \\\n",
        "        .set_properties(**{'text-align': 'left'}) \\\n",
        "        .set_caption(\"🔍 Step-by-Step Mistake Detection Results\")\n",
        "\n",
        "    return HTML(styled.to_html())\n",
        "\n",
        "display(render_table(df))\n"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 167
        },
        "cellView": "form",
        "id": "0bSgiRqdl8QA",
        "outputId": "20656c24-c817-41ec-8a57-24ae023e8a79"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "display_data",
          "data": {
            "text/plain": [
              "<IPython.core.display.HTML object>"
            ],
            "text/html": [
              "<style type=\"text/css\">\n",
              "#T_4ba27_row0_col0, #T_4ba27_row0_col1, #T_4ba27_row0_col2, #T_4ba27_row0_col3, #T_4ba27_row1_col0, #T_4ba27_row1_col1, #T_4ba27_row1_col2, #T_4ba27_row1_col3, #T_4ba27_row2_col0, #T_4ba27_row2_col1, #T_4ba27_row2_col2, #T_4ba27_row2_col3, #T_4ba27_row3_col0, #T_4ba27_row3_col1, #T_4ba27_row3_col2, #T_4ba27_row3_col3, #T_4ba27_row4_col0, #T_4ba27_row4_col1, #T_4ba27_row4_col2, #T_4ba27_row4_col3 {\n",
              "  text-align: left;\n",
              "}\n",
              "</style>\n",
              "<table id=\"T_4ba27\" style=\"width:100%; border:1px solid #ccc;\">\n",
              "  <caption>🔍 Step-by-Step Mistake Detection Results</caption>\n",
              "  <thead>\n",
              "    <tr>\n",
              "      <th class=\"blank level0\" >&nbsp;</th>\n",
              "      <th id=\"T_4ba27_level0_col0\" class=\"col_heading level0 col0\" >Step</th>\n",
              "      <th id=\"T_4ba27_level0_col1\" class=\"col_heading level0 col1\" >Correct</th>\n",
              "      <th id=\"T_4ba27_level0_col2\" class=\"col_heading level0 col2\" >Mistake</th>\n",
              "      <th id=\"T_4ba27_level0_col3\" class=\"col_heading level0 col3\" >Mistake Description</th>\n",
              "    </tr>\n",
              "  </thead>\n",
              "  <tbody>\n",
              "    <tr>\n",
              "      <th id=\"T_4ba27_level0_row0\" class=\"row_heading level0 row0\" >0</th>\n",
              "      <td id=\"T_4ba27_row0_col0\" class=\"data row0 col0\" >Open hatch</td>\n",
              "      <td id=\"T_4ba27_row0_col1\" class=\"data row0 col1\" >✅</td>\n",
              "      <td id=\"T_4ba27_row0_col2\" class=\"data row0 col2\" >✅</td>\n",
              "      <td id=\"T_4ba27_row0_col3\" class=\"data row0 col3\" ></td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th id=\"T_4ba27_level0_row1\" class=\"row_heading level0 row1\" >1</th>\n",
              "      <td id=\"T_4ba27_row1_col0\" class=\"data row1 col0\" >Put on gloves</td>\n",
              "      <td id=\"T_4ba27_row1_col1\" class=\"data row1 col1\" >✅</td>\n",
              "      <td id=\"T_4ba27_row1_col2\" class=\"data row1 col2\" >✅</td>\n",
              "      <td id=\"T_4ba27_row1_col3\" class=\"data row1 col3\" ></td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th id=\"T_4ba27_level0_row2\" class=\"row_heading level0 row2\" >2</th>\n",
              "      <td id=\"T_4ba27_row2_col0\" class=\"data row2 col0\" >Load trolley securely</td>\n",
              "      <td id=\"T_4ba27_row2_col1\" class=\"data row2 col1\" >✅</td>\n",
              "      <td id=\"T_4ba27_row2_col2\" class=\"data row2 col2\" >✅</td>\n",
              "      <td id=\"T_4ba27_row2_col3\" class=\"data row2 col3\" ></td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th id=\"T_4ba27_level0_row3\" class=\"row_heading level0 row3\" >3</th>\n",
              "      <td id=\"T_4ba27_row3_col0\" class=\"data row3 col0\" >Close hatch</td>\n",
              "      <td id=\"T_4ba27_row3_col1\" class=\"data row3 col1\" >✅</td>\n",
              "      <td id=\"T_4ba27_row3_col2\" class=\"data row3 col2\" >❌</td>\n",
              "      <td id=\"T_4ba27_row3_col3\" class=\"data row3 col3\" >only closed one</td>\n",
              "    </tr>\n",
              "    <tr>\n",
              "      <th id=\"T_4ba27_level0_row4\" class=\"row_heading level0 row4\" >4</th>\n",
              "      <td id=\"T_4ba27_row4_col0\" class=\"data row4 col0\" >Check if loaded securely</td>\n",
              "      <td id=\"T_4ba27_row4_col1\" class=\"data row4 col1\" >✅</td>\n",
              "      <td id=\"T_4ba27_row4_col2\" class=\"data row4 col2\" >✅</td>\n",
              "      <td id=\"T_4ba27_row4_col3\" class=\"data row4 col3\" ></td>\n",
              "    </tr>\n",
              "  </tbody>\n",
              "</table>\n"
            ]
          },
          "metadata": {}
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [],
      "metadata": {
        "id": "_lga-7gSjrGN"
      },
      "execution_count": null,
      "outputs": []
    }
  ]
}