{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "There are 1538 JSON files in the directory 'same_objects_0.01'.\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "\n",
    "def count_json_files(directory):\n",
    "    \"\"\"Return how many entries of ``directory`` have a name ending in ``.json``.\n",
    "\n",
    "    Only the immediate contents of ``directory`` are listed (no recursion),\n",
    "    and the suffix comparison is case-sensitive.\n",
    "    \"\"\"\n",
    "    return sum(1 for entry in os.listdir(directory) if entry.endswith(\".json\"))\n",
    "\n",
    "# Count the JSON files stored directly inside the chosen directory.\n",
    "directory_path = 'same_objects_0.01'\n",
    "number_of_json_files = count_json_files(directory=directory_path)\n",
    "print(f\"There are {number_of_json_files} JSON files in the directory '{directory_path}'.\")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The number of images in the dataset is: 660\n"
     ]
    }
   ],
   "source": [
    "import json\n",
    "\n",
    "def count_images_in_json(file_path):\n",
    "    \"\"\"Return the number of top-level entries in the JSON file at ``file_path``.\n",
    "\n",
    "    The file is parsed with ``json.load`` and ``len`` of the decoded value is\n",
    "    returned, so a top-level array yields its element count.\n",
    "    Presumably each element describes one image -- confirm against the dataset schema.\n",
    "\n",
    "    The file is decoded explicitly as UTF-8 so the result does not depend on\n",
    "    the platform's default text encoding.\n",
    "\n",
    "    Raises:\n",
    "        OSError: if ``file_path`` cannot be opened.\n",
    "        json.JSONDecodeError: if the file does not contain valid JSON.\n",
    "    \"\"\"\n",
    "    with open(file_path, 'r', encoding='utf-8') as file:\n",
    "        data = json.load(file)\n",
    "\n",
    "    return len(data)\n",
    "\n",
    "# Example usage\n",
    "# NOTE: file_path is an unset placeholder; point it at the dataset JSON file to inspect.\n",
    "file_path = ''\n",
    "if file_path:\n",
    "    image_count = count_images_in_json(file_path)\n",
    "    print(f\"The number of images in the dataset is: {image_count}\")\n",
    "else:\n",
    "    # open('') raises FileNotFoundError, so skip the count instead of crashing the cell.\n",
    "    print(\"file_path is empty; set it to a dataset JSON file to count its images.\")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import json\n",
    "\n",
    "def merge_json_files(source_directory, output_file):\n",
    "    \"\"\"Merge every ``.json`` file in ``source_directory`` into one JSON array.\n",
    "\n",
    "    The decoded content of each file becomes one element of the array that\n",
    "    is written to ``output_file`` (indented by 4 spaces).\n",
    "\n",
    "    Files are processed in sorted name order so the merged result is\n",
    "    reproducible; ``os.listdir`` returns entries in arbitrary order. If\n",
    "    ``output_file`` itself lives inside ``source_directory`` it is skipped,\n",
    "    so re-running the merge never folds a previous result into the new one.\n",
    "\n",
    "    Raises:\n",
    "        OSError: if the directory or one of the files cannot be accessed.\n",
    "        json.JSONDecodeError: if a source file does not contain valid JSON.\n",
    "    \"\"\"\n",
    "    output_abspath = os.path.abspath(output_file)\n",
    "    merged_data = []\n",
    "\n",
    "    for name in sorted(os.listdir(source_directory)):\n",
    "        if not name.endswith(\".json\"):\n",
    "            continue\n",
    "        file_path = os.path.join(source_directory, name)\n",
    "        # Never ingest the merge target itself (possible on a re-run).\n",
    "        if os.path.abspath(file_path) == output_abspath:\n",
    "            continue\n",
    "        with open(file_path, 'r', encoding='utf-8') as json_file:\n",
    "            merged_data.append(json.load(json_file))\n",
    "\n",
    "    with open(output_file, 'w', encoding='utf-8') as outfile:\n",
    "        json.dump(merged_data, outfile, indent=4)\n",
    "\n",
    "# Merge every JSON file from the selected directory into a single dataset file.\n",
    "source_directory = 'different_objects_0.01_selected'\n",
    "output_file = 'merged_dataset_heterogenous.json'\n",
    "merge_json_files(source_directory=source_directory, output_file=output_file)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "\n",
    "def add_data_source_attribute(input_json_path, output_json_path, data_source='COCO'):\n",
    "    \"\"\"Tag every entry of a JSON array with a ``data_source`` key.\n",
    "\n",
    "    The input file is read completely before the output file is opened, so\n",
    "    both paths may refer to the same file (it is then overwritten).\n",
    "\n",
    "    Args:\n",
    "        input_json_path: path of the JSON file to read; its top-level value\n",
    "            is iterated and each element must support item assignment.\n",
    "        output_json_path: path the modified data is written to (4-space indent).\n",
    "        data_source: value stored under ``'data_source'`` on each entry;\n",
    "            defaults to ``'COCO'``.\n",
    "\n",
    "    Raises:\n",
    "        OSError: if either file cannot be opened.\n",
    "        json.JSONDecodeError: if the input file does not contain valid JSON.\n",
    "    \"\"\"\n",
    "    # Load the original data from the json file\n",
    "    with open(input_json_path, 'r', encoding='utf-8') as file:\n",
    "        data = json.load(file)\n",
    "\n",
    "    # An existing 'data_source' value on an entry is replaced.\n",
    "    for image_entry in data:\n",
    "        image_entry['data_source'] = data_source\n",
    "\n",
    "    # Save the modified data\n",
    "    with open(output_json_path, 'w', encoding='utf-8') as file:\n",
    "        json.dump(data, file, indent=4)\n",
    "\n",
    "# Tag the merged dataset in place: the input and output paths name the same\n",
    "# file, so that file is overwritten with the annotated version.\n",
    "input_json_path = 'merged_dataset_homogenous.json'\n",
    "output_json_path = 'merged_dataset_homogenous.json'\n",
    "\n",
    "add_data_source_attribute(input_json_path=input_json_path, output_json_path=output_json_path)\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "mind_wandering",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.14"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
