{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "\n",
    "# Function to count the frequency of each object class in the annotations\n",
    "def count_object_classes(json_file_path):\n",
    "    # Open the JSON file and load its content\n",
    "    with open(json_file_path, 'r') as file:\n",
    "        data = json.load(file)\n",
    "\n",
    "    # Dictionary to hold the count of each object class\n",
    "    object_class_count = {}\n",
    "\n",
    "    # Get the list of all categories\n",
    "    categories = {category['id']: category['name'] for category in data['categories']}\n",
    "\n",
    "    # Count each occurrence of each object class in the annotations\n",
    "    for annotation in data['annotations']:\n",
    "        category_id = annotation['category_id']\n",
    "        category_name = categories.get(category_id)\n",
    "        if category_name:\n",
    "            object_class_count[category_name] = object_class_count.get(category_name, 0) + 1\n",
    "\n",
    "    return object_class_count\n",
    "\n",
    "# Path to the JSON file\n",
    "json_file_path = 'annotations/instances_train2017.json'  # Update this path\n",
    "\n",
    "# Call the function and get the count\n",
    "object_class_count = count_object_classes(json_file_path)\n",
    "\n",
    "# Sort the object classes by frequency\n",
    "sorted_object_classes = sorted(object_class_count.items(), key=lambda item: item[1], reverse=True)\n",
    "\n",
    "# Save the counts to a file\n",
    "output_file = 'object_class_counts_train.txt'\n",
    "with open(output_file, 'w') as f:\n",
    "    for class_name, count in sorted_object_classes:\n",
    "        f.write(f\"{class_name}: {count}\\n\")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Object counts saved to total_frequency.txt\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "import json\n",
    "from collections import Counter\n",
    "from joblib import Parallel, delayed\n",
    "\n",
    "def count_objects_in_file(file_path):\n",
    "    class_counts = Counter()\n",
    "    with open(file_path, 'r', encoding='utf-8') as file:\n",
    "        data = json.load(file)\n",
    "        for obj in data['objects']:\n",
    "            class_counts[obj['name']] += 1\n",
    "    return class_counts\n",
    "\n",
    "def parallel_count_objects(json_folder):\n",
    "    file_paths = [os.path.join(json_folder, f) for f in os.listdir(json_folder) if f.endswith('.json')]\n",
    "    results = Parallel(n_jobs=-1)(delayed(count_objects_in_file)(file_path) for file_path in file_paths)\n",
    "    total_counts = Counter()\n",
    "    for result in results:\n",
    "        total_counts.update(result)\n",
    "    return total_counts\n",
    "\n",
    "json_folder = 'data_json'\n",
    "\n",
    "object_class_counts = parallel_count_objects(json_folder)\n",
    "\n",
    "output_file = 'total_frequency.txt'\n",
    "with open(output_file, 'w') as file:\n",
    "    for class_name, count in object_class_counts.items():\n",
    "        file.write(f\"Class '{class_name}': {count} times\\n\")\n",
    "\n",
    "print(f\"Object counts saved to {output_file}\")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "from collections import Counter\n",
    "\n",
    "def count_object_classes(merged_json_path, output_txt_path):\n",
    "    with open(merged_json_path, 'r') as file:\n",
    "        images_data = json.load(file)\n",
    "\n",
    "    name_counter = Counter()\n",
    "    for image in images_data:\n",
    "        for obj in image['objects']:\n",
    "            name_counter[obj['name']] += 1\n",
    "\n",
    "    with open(output_txt_path, 'w') as file:\n",
    "        total_classes = len(name_counter)\n",
    "        file.write(f\"Total different classes: {total_classes}\\n\")\n",
    "        for name, count in name_counter.items():\n",
    "            file.write(f\"{name}: {count}\\n\")\n",
    "\n",
    "merged_json_path = 'merged_data_text_new.json' \n",
    "output_txt_path = 'output_counts.txt' \n",
    "count_object_classes(merged_json_path, output_txt_path)\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "detectai",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.14"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
