{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# References\n",
    "- Optimization of dataflow pipeline: tf.data.(experimental.)AUTOTUNE, dataset.cache(), and dataset.prefetch(buffer_size=AUTOTUNE)\n",
    "    - https://www.tensorflow.org/tutorials/load_data/images#configure_the_dataset_for_performance\n",
    "    - https://www.tensorflow.org/tutorials/load_data/images#configure_dataset_for_performance\n",
    "\n",
    "- Interested readers can learn more about both methods, as well as how to cache data to disk in the data performance guide:\n",
    "    - https://www.tensorflow.org/guide/data_performance#optimize_performance\n",
    "\n",
    "- tf.data.Dataset methods\n",
    "    - https://www.tensorflow.org/api_docs/python/tf/data/Dataset"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# TL;DR\n",
    "   `ds = tfds.load(...)`\n",
    "\n",
    "-> `ds.map(...)`\n",
    "\n",
    "-> `ds.cache()` \n",
    "\n",
    "-> `ds.shuffle(...)` \n",
    "\n",
    "-> `ds.batch(...)` \n",
    "\n",
    "-> `ds.prefetch(buffer_size=tf.data.experimental.AUTOTUNE)`"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import tensorflow as tf\n",
    "import tensorflow.keras.applications as tka\n",
    "import tensorflow_datasets as tfds\n",
    "\n",
    "def set_gpu_devices(gpu):\n",
    "    physical_devices = tf.config.experimental.list_physical_devices('GPU')\n",
    "    assert len(physical_devices) > 0, \"Not enough GPU hardware devices available\"\n",
    "    tf.config.experimental.set_visible_devices(physical_devices[gpu], 'GPU')\n",
    "    tf.config.experimental.set_memory_growth(physical_devices[gpu], True)\n",
    "    \n",
    "set_gpu_devices(0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "# Pre-defined\n",
    "batch_size = 10\n",
    "preproc = tka.resnet_v2.preprocess_input\n",
    "\n",
    "# Load dataset\n",
    "dstr, dste = tfds.load(\n",
    "    \"patch_camelyon\", \n",
    "    data_dir=\"/data/t-miyagawa/tensorflow_datasets\", \n",
    "    split=[\"train\", \"test\"])\n",
    "    # shuffle_files=False, bathch_size=None here \n",
    "    # because dataset.shuffle and .batch is more customizable.\n",
    "    \n",
    "# Dataset decoration\n",
    "# map -> cache -> shuffle -> batch -> prefetch with AUTOTUNE\n",
    "# Ref: https://www.tensorflow.org/tutorials/load_data/images#configure_the_dataset_for_performance\n",
    "dstr = dstr.map(\n",
    "    lambda x: (tf.cast(x[\"image\"], dtype=tf.float32), x[\"label\"])) # no AUTOTUNE\n",
    "dstr = dstr.map(\n",
    "    lambda x, y: (preproc(x), y)) # no AUTOTUNE\n",
    "dstr = dstr.cache() \n",
    "dstr = dstr.shuffle(buffer_size=10000, reshuffle_each_iteration=True).\\\n",
    "    batch(batch_size=batch_size, drop_remainder=False) # no AUTOTUNE in .batch\n",
    "dstr = dstr.prefetch(buffer_size=tf.data.experimental.AUTOTUNE)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 0\n",
      "0 1000\n",
      "0 2000\n",
      "1 0\n",
      "1 1000\n",
      "1 2000\n",
      "19.719565868377686 sec\n"
     ]
    }
   ],
   "source": [
    "import time\n",
    "tic = time.time()\n",
    "for j in range(2):\n",
    "    for i, feat in enumerate(dstr):\n",
    "        if i % 1000 == 0:\n",
    "            print(j, i)\n",
    "print(time.time() - tic, \"sec\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## without `dstr.cache()`\n",
    "\n",
    "### First run\n",
    "- j = 0: %CPU=430, %MEM=0--1.6\n",
    "- j = 1: %CPU=450, %MEM=1.6\n",
    "- 111 seconds\n",
    "\n",
    "### Second run\n",
    "- j = 0: %CPU=450, %MEM=2.8\n",
    "- j = 1: %CPU=450, %MEM=2.8\n",
    "- 103 seconds\n",
    "\n",
    "\n",
    "## with `dstr.cache()`\n",
    "### First run\n",
    "- j = 0: %CPU=430, %MEM=0--5.8\n",
    "- j = 1: %CPU=150, %MEM=5.8, \n",
    "- 73 seconds\n",
    "\n",
    "### Second run\n",
    "- j = 0: %CPU=150, %MEM=5.8\n",
    "- j = 1: %CPU=150, %MEM=5.8, \n",
    "- 15--24 seconds"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.6.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
