{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "from Utils import *\n",
    "from Variables import *\n",
    "\n",
    "from pathlib import Path"
   ]
  },
  {
   "attachments": {},
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Compute the annotation times for different datasets"
   ]
  },
  {
   "attachments": {},
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Classification"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Total annotation time for Classification virus dataset: [10.56302134] h\n",
      "Total annotation time for Classification virus dataset: [38026.8768084] s\n"
     ]
    }
   ],
   "source": [
    "paths_img = glob.glob(HERPES_TRAIN_DATA_PATH+\"/*\")\n",
    "paths = []\n",
    "for path in paths_img: \n",
    "    paths.extend(glob.glob(path+\"/*.pkl\"))\n",
    "\n",
    "virus_count, virus_timings = read_pickle(CLASSIFICATION_TIMINGS)\n",
    "virus_count = np.array(virus_count)\n",
    "time_binary = 0\n",
    "for i in range(10): \n",
    "    data_paths = [p for p in paths if (Path(p).stem).startswith(str(i)+\"_\") ]\n",
    "    if(i < len(virus_timings)):\n",
    "        if(np.sum(virus_count==i)>0):\n",
    "            time_binary += virus_timings[virus_count == i]*len(data_paths)\n",
    "    else: \n",
    "        # approximate time for patches with larger virus\n",
    "        if(len(data_paths)>0):\n",
    "            time_binary += i*np.mean(virus_timings)*len(data_paths)\n",
    "            print(\"Estimate time for # particles = \"+str(i))\n",
    "\n",
    "print(\"Total annotation time for Classification virus dataset: \" +str(time_binary/60/60)+\" h\")\n",
    "print(\"Total annotation time for Classification virus dataset: \" +str(time_binary)+\" s\")\n"
   ]
  },
  {
   "attachments": {},
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Location"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Total annotation time for Location virus dataset: [16.97611186] h\n",
      "Total annotation time for Location virus dataset: [61114.00268726] s\n"
     ]
    }
   ],
   "source": [
    "paths_img = glob.glob(HERPES_TRAIN_DATA_PATH+\"/*\")\n",
    "paths = []\n",
    "for path in paths_img: \n",
    "    paths.extend(glob.glob(path+\"/*.pkl\"))\n",
    "\n",
    "virus_count, virus_timings = read_pickle(LOCATION_TIMINGS)\n",
    "virus_count = np.array(virus_count)\n",
    "time_binary = 0\n",
    "for i in range(10): \n",
    "    data_paths = [p for p in paths if (Path(p).stem).startswith(str(i)+\"_\") ]\n",
    "    if(i < len(virus_timings)):\n",
    "        if(np.sum(virus_count==i)>0):\n",
    "            time_binary += virus_timings[virus_count == i]*len(data_paths)\n",
    "    else: \n",
    "        # approximate time for patches with larger virus\n",
    "        if(len(data_paths)>0):\n",
    "            time_binary += i*np.mean(virus_timings)*len(data_paths)\n",
    "            print(\"Estimate time for # particles = \"+str(i))\n",
    "\n",
    "print(\"Total annotation time for Location virus dataset: \" +str(time_binary/60/60)+\" h\")\n",
    "print(\"Total annotation time for Location virus dataset: \" +str(time_binary)+\" s\")\n"
   ]
  },
  {
   "attachments": {},
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Bounding Boxes"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Total annotation time for BB virus dataset: [18.80200459] h\n",
      "Total annotation time for BB virus dataset: [67687.21652805] s\n"
     ]
    }
   ],
   "source": [
    "paths_img = glob.glob(HERPES_TRAIN_DATA_PATH+\"/*\")\n",
    "paths = []\n",
    "for path in paths_img: \n",
    "    paths.extend(glob.glob(path+\"/*.pkl\"))\n",
    "\n",
    "virus_count, virus_timings = read_pickle(BOUNDINGBOX_TIMINGS)\n",
    "virus_count = np.array(virus_count)\n",
    "time_binary = 0\n",
    "for i in range(10): \n",
    "    data_paths = [p for p in paths if (Path(p).stem).startswith(str(i)+\"_\") ]\n",
    "    if(i < len(virus_timings)):\n",
    "        if(np.sum(virus_count==i)>0):\n",
    "            time_binary += virus_timings[virus_count == i]*len(data_paths)\n",
    "    else: \n",
    "        # approximate time for patches with larger virus\n",
    "        if(len(data_paths)>0):\n",
    "            time_binary += i*np.mean(virus_timings)*len(data_paths)\n",
    "            print(\"Estimate time for # particles = \"+str(i))\n",
    "\n",
    "print(\"Total annotation time for BB virus dataset: \" +str(time_binary/60/60)+\" h\")\n",
    "print(\"Total annotation time for BB virus dataset: \" +str(time_binary)+\" s\")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "abem_cams",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.5"
  },
  "orig_nbformat": 4,
  "vscode": {
   "interpreter": {
    "hash": "da271c7ed0eaaaf76462cb7ed437e72b55d93fd2cbbde2ef06222f99cc55f15b"
   }
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
