{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n",
      "HERE!\n"
     ]
    }
   ],
   "source": [
    "import json\n",
    "import os\n",
    "import numpy as np\n",
    "from PIL import Image\n",
    "\n",
    "def load_labels(label_file_path):\n",
    "    labels = {}\n",
    "    with open(label_file_path, 'r') as file:\n",
    "        for line in file:\n",
    "            index, label = line.strip().split(': ')\n",
    "            labels[int(index)] = label\n",
    "    return labels\n",
    "\n",
    "def match_indices_to_labels(unique_indices, labels):\n",
    "    matched_labels = {index: labels.get(index, 'Unknown') for index in unique_indices}\n",
    "    return matched_labels\n",
    "\n",
    "def add_object_set_to_images(merged_json_path, labels_txt_path, images_directory, output_json_path):\n",
    "    # Load the class labels from 'labels.txt'\n",
    "    labels = load_labels(labels_txt_path)\n",
    "\n",
    "    # Load the merged images data from the json file\n",
    "    with open(merged_json_path, 'r') as file:\n",
    "        images_data = json.load(file)\n",
    "\n",
    "    for image in images_data:\n",
    "        # Extract the filename without the extension and construct the path to the .png file\n",
    "        if image['data_source']!='COCO':\n",
    "            continue\n",
    "        filename_without_ext = os.path.splitext(image['filename'])[0]\n",
    "        image_file_path = os.path.join(images_directory, filename_without_ext + '.png')\n",
    "\n",
    "        # If the .png file exists, read it and extract label indices\n",
    "        if os.path.exists(image_file_path):\n",
    "            print(\"HERE!\")\n",
    "            with Image.open(image_file_path) as img:\n",
    "                img_data = np.array(img)\n",
    "            unique_classes = np.unique(img_data)\n",
    "            # Filter out the 'unlabeled' class index 255\n",
    "            adjusted_classes = unique_classes + 1\n",
    "            adjusted_classes = adjusted_classes[(adjusted_classes != 255) & (adjusted_classes != 0)]\n",
    "            # Match the indices to their labels\n",
    "            label_names = [labels.get(index) for index in adjusted_classes if index in labels]\n",
    "            # Update the 'object_set' in the image data\n",
    "            image['object_set'].extend(label_names)\n",
    "            # Remove duplicates\n",
    "            image['object_set'] = list(set(image['object_set']))\n",
    "\n",
    "    # Write the updated images data to the new json file\n",
    "    with open(output_json_path, 'w') as file:\n",
    "        json.dump(images_data, file, indent=4)\n",
    "\n",
    "# Usage example\n",
    "merged_json_path = ''\n",
    "labels_txt_path = ''  # Path to the labels.txt file\n",
    "images_directory = ''  # Directory where the .png files are located\n",
    "output_json_path = ''  # Path for the new updated JSON file\n",
    "\n",
    "# Run the function to update the merged_data.json with new object classes\n",
    "add_object_set_to_images(merged_json_path, labels_txt_path, images_directory, output_json_path)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "\n",
    "def add_data_source_attribute(input_json_path, output_json_path):\n",
    "    # Load the original data from the json file\n",
    "    with open(input_json_path, 'r') as file:\n",
    "        data = json.load(file)\n",
    "\n",
    "    # Add 'data_source': 'COCO' to each image entry\n",
    "    for image_entry in data:\n",
    "        image_entry['data_source'] = 'COCO'\n",
    "\n",
    "    # Save the modified data to a new json file\n",
    "    with open(output_json_path, 'w') as file:\n",
    "        json.dump(data, file, indent=4)\n",
    "\n",
    "# Specify the path to your original merged_data.json file\n",
    "input_json_path = 'merged_data_text_new_panoptic.json'\n",
    "# Specify the path where you want to save the new json file with the added 'data_source' attribute\n",
    "output_json_path = 'merged_data_text_new_panoptic.json'\n",
    "\n",
    "# Run the function\n",
    "add_data_source_attribute(input_json_path, output_json_path)\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "detectai",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.14"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
