{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "ygcDisv0GMyx"
   },
   "source": [
    "### Setup:"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "Vi6hBDLgF4zj"
   },
   "source": [
    "Load in codebase and gridworlds from GitHub, and install necessary packages:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "R9wd2s469Va6",
    "outputId": "bdcb3c30-9aca-454b-b3cc-9855ed9c813f"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "fatal: destination path 'shutdown_problem' already exists and is not an empty directory.\n",
      "Requirement already satisfied: dill in /Users/alexroman/anaconda3/lib/python3.7/site-packages (0.3.2)\n"
     ]
    }
   ],
   "source": [
    "!git clone https://github.com/alexr314/shutdown_problem.git\n",
    "!pip install dill"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "bG8JMBpaGC9H"
   },
   "source": [
    "Perform lots of imports and tell python where to find the modules we wrote"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {
    "id": "Cmc8mfA_Chsi"
   },
   "outputs": [],
   "source": [
    "import sys\n",
    "import os\n",
    "\n",
    "# Add the IPP directory to the Python path\n",
    "sys.path.append(os.path.abspath('./shutdown_problem/IPP'))\n",
    "\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "from matplotlib import colors\n",
    "import random\n",
    "import itertools\n",
    "import time\n",
    "import dill\n",
    "from tqdm import tqdm as tqdm\n",
    "from copy import copy\n",
    "from IPython.display import clear_output\n",
    "from collections import Counter\n",
    "\n",
    "# My modules\n",
    "from grid_env import GridEnvironment\n",
    "from policy_agent import Policy_Agent\n",
    "from draw_gridworlds import draw_gridworld, draw_policy, draw_full_policy\n",
    "from rl_utils import run_episode, evaluate_agent, get_transition_dict, compute_entropy, get_discount_matrix\n",
    "\n",
    "# This doesn't work in colab for some reason:\n",
    "plt.rcParams[\"font.family\"] = \"Times New Roman\"\n",
    "\n",
    "def load_object(filename):\n",
    "    with open(filename, 'rb') as f:\n",
    "        return dill.load(f)\n",
    "\n",
    "filepath='./shutdown_problem/IPP/gridworlds'"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "x7GUcXpMGPtk"
   },
   "source": [
    "### Load and Display Environment"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 494
    },
    "id": "TApSBQEFBXQR",
    "outputId": "fad3620d-dd29-4914-d533-4d6a93fdae78"
   },
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAcwAAAHBCAYAAADkRYtYAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjMuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8vihELAAAACXBIWXMAABcSAAAXEgFnn9JSAAAXVElEQVR4nO3de3Cd9X3n8Y/kG0jGxjbINubicAshkCACBBZSyIJTZw2BwJBkd5PpbrLJpE232zZp4m6ySXamzSbNbcmlW7ozuXbbbdxwKRBYSkIoCQETwNwLOGAM2MKW7zdsGWn/EEg+sjE/SUfnHHFerxnN6Hf8PEffZyTrPec5es5p6evrCwCwf631HgAAxgPBBIACggkABQQTAAoIJgAUEEwAKCCYAFBAMAGggGACQAHBBIACggkABQQTAAoIJgAUEEwAKDBxNDsvXry4PcnWKs0yXnQkWVPvIWqsGY85ac7jbsZjTprzuJvxmPPFL36xZaT7eoQJAAUEEwAKCCYAFBBMACggmABQQDABoIBgAkABwQSAAoIJAAUEEwAKCCYAFBBMACggmABQQDABoIBgAkABwQSAAoIJAAUEEwAKCCYAFBBMACggmABQQDABoIBgAkABwQSAAoIJAAUEEwAKCCYAFBBMACggmABQQDABoIBgAkABwQSAAoIJAAUEEwAKCCYAFBBMACggmABQQDABoIBgAkABwQSAAoIJAAUEEwAKCCYAFBBMACggmABQQDABoIBgAkABwQSAAoIJAAUEEwAKCCYAFBBMACggmABQQDABoIBgAkABwQSAAoIJAAUEEwAKTBzl/tuTdFRjkPGis7Ozu6WlpamOedWqVd1dXV1Ndcwv6U6T/XynOY85ac7jbsZjHpXRBrMtyZpqDDJetLS0dHR2djbVMff29nZ0dXU11TG/pCNN9vOd5jzmpDmPuxmPOUlaRrqjU7IAUEAwAaCAYAJAAcEEgAKCCQAFBBMACggmABQQTAAoIJgAUEAwAaCAYAJAAcEEgAKCCQAFBBMACggmABQQTAAoIJgAUEAwAaCAYAJAAcEEgAKCCQAFBBMACggmABQQTAAoIJgAUEAwAaCAYAJAAcEEgAKCCQAFBBMACggmABQQTAAoIJgAUEAwAaCAYAJAAcEEgAKCCQAFBBMACggmABQQTAAoIJgAUEAwAaCAYAJAAcEEgAKCCQAFBBMACggmABQQTAAoIJgAUEAwAaCAYAJAAcEEgAKCCQAFBBMACggmABQQTAAoIJgAUEAwAaDAxFHuvz1JRzUGGS+uaT+l+5nNU+fXe45aenzub3Wf39raVN/nJJkzZ053V1dXUx13Mx5zkqxataoZj7s7Tfb7e7RGG8y2JGuqMch4ccgL6+d/ouu4FfWeo5a+MqdrfudhnSvqPUcddMydO7epfr7TnMec3t7ejq6urmY77o402e/vl7SMdEenZAGggGACQAHBBIACggkABQQTAAoIJgAUEEwAKCCYAFBAMAGggGACQAHBBIACggkABQQTAAoIJgAUEMzx4EdfSC5srfz46u/UeyqApiKY48Fd1+992z03Jr29tZ8FoEkJZqPbtDZ5Yunet2/uTh67s/bzADQpwWx0d99Q+Uhy4uTBz++6rvbzADQpwWx0S28Y/PzwE5I3vX1wffcNe28PwJgQzEbWsyu57+bBdeeC/o+XPf1Q8vyKmo8F0IwEs5E9dFuyY8vg+tR3JJ3vqNxm6T7+IAiAqhPMRrZnDCdOTk4+L5l/UjLzsMHbnZYFqAnBbGR7xvCEs5ID2vs/3/O07IM/T3ZsreVUAE1JMBvVykeSricH16fuEck9g9mzM7nvn2o3F0CTEsxGNfS5yT2fu+xckLS07LGty0sAxppgNqo9gzltVnLMqYPr6YcmR58yuP71jUlfX81GA2hGgtmItqxP/uVXg+s3n5+0DvlW7XladuPzyeN312Y2gCYlmI3o1z9Jel8cXO8Zx4Hbhl5e4rQswFgSzEa0dMilIkPjmCQnnpNMaRtcu7wEYEwJZqN5cXdy7/8bXB9+QnLoEXtvN2lyctK5g+snlyXdz475eADNSjAbzcO3J9s2Dq47L3jlbU8dcqrWq/4AjBnBbDT7u5xkqKH/5rQswJgRzEZT8XJ4k/pfDu+VHHlicsjhg+sHfpbs3DFmowE0s4n1HoA9PPd4suqJwfXunuTyaeX779yRLLsleetF1Z8NoMl5hNlIqvEcpMtLAMaEYDaSagTz7p+M/j4A2ItTso1i68bkkV8Mrg8/IfnvhfH75kf6T8UmyfpVyfJ7k2NP3f8+AAyLYDaKe27qvwbzZZ0Lktnzy/Y9/d8MBjPpPy0rmABV5ZRsoxh6Sci+Xg7vlbi8BGDMCWYjePHF5J4bB9cTJla+is+rGXp5yfJ7kvWrqzcfAILZEB69o/8dSl72+jOTtoOGdx+n7PGKQH19HmUCVJlgNoK7h/x17CnnD/8+nJYFGFOC2Qj2ejm8YTx/+bJTLqh8z8xltyQ9O0c3FwADBLPeup5Mnnl0cN02LTn+jOHfz/RDkmP2+MvYF7Yl9/9s9PMBkMRlJfU35+jk+t7q3NfXl1bnfgDYi0eYAFBAMAGggGACQAHBBIACggkABQQTAAoIJgAUEEwAKCCYAFBAMAGggGACQAHBBIACggkABUb7biXbk3RUY5DxovuAmd1fmdM1v95z1NKvVq5bOW/nQ031fU6Sww47rHvu3LlNddwze7/R3ZP58+s9R60dP/O27mU5sam+10m602S/v0drtMFsS7KmGoOMF5dsW9bROa1zRb3nqKV5Ox/qWLZsWVN9n5OktbW1Y+7cuU113D2ZP39O3ydW1HuOWnuq92Pzk6yo8xi11pEm+/39kpaR7uiULAAUEEwAKCCYAFBAMAGggGACQAHBBIACggkABQQTAAoIJgAUEEwAKCCYAFBAMAGggGACQIHRvlsJwD49/Vxyz8PJ06uSbTuStgOTjpnJScclJx+fTJhQ7wlheAQTqJrdu5PvXJV8+2+TBx575e1mHZxc/K+T//z+5JQ3vPr9Pt+d3HFfcsey5Jf39od4V8/gv3/3C8l/ePdop4f9E0ygKh79TfK+j+8/lC9bt7E/rN+5Ktm4NJl+0N7bvLAz+ejn+wO5fGW1p4XhE0xg1JY+kCz8SLJhU+XtHbOSNx6bzJ6VbNySPL4iefKZym36+vZ9ny/sTL5/zVhMCyMjmMCoPNuVXPi7lbE89sjkf/5psvBtez9X+dhTyZV/n1z5o2T7juF/vRnTk4PakpWrRzc3DJe/kgVG5Q/+PFm7fnB97unJfVcli87b9x/2vP51ydcWJ4/fmLz9ra9+//PnJe+/KPlfn0sevDZZ96vkP15atfGhmEeYwIjddHty9S2D63mzk3+4Ipna/ur7zpud3PKdV/73g9qT525LDusY/ZxQDYIJjNiXhwTvMx9NDplRvn/rfs5xTZggljQWp2SBEXlmdfLzpYPrmdOdKuW1TTCBEfnRTUlv7+D6HWcnUybXbx4Ya4IJjMhdD1SuF/yr+swBtSKYwIjc90jl+sRj6jMH1IpgAsO244XkN0NegOC4o+ozC9SKYALDtm5j5Sv0TJ6UzBrGX8fCeCSYwLBt3lq5bjuwPnNALQkmMGybtlSu2w6ozxxQS4IJjFpLS70ngLEnmMCwHTTkpe+2jeBF1GG8EUxg2Ia+f+VI3nUExhvBBIZt5vTK9a6eZP3GuowCNSOYwLC1tyWvO7zytieers8sUCuCCYxI5xsq1w8vr88cUCuCCYzIGSdXrv/pjvrMAbUimMCIvOedlZeT3PzLZOeu+s0DY00wgRF53eHJ2acOrtdvSr57Vf3mgbEmmMCI/fHvVK7/7K+S7g3l+/f2Vr6nJjQywQRG7N0LkoVvG1w/93xy+R8mW7e9+r6r1yTv+NDer0sLjWpivQcAxre//Gxy6mXJxs39658v7V9/fXF/TCdMqNz+qWeTK/8++fbfJlu37/++uzfse5uXv9ae2614bu/tDj4oOXha+bHA/ggmMCqvOzy59lvJhb+bbHnpkeUTT/evO2YlJx2XzJ7V/4Lty1cmj68ov+9P/EXy/Wtefbs/+XL/x1Cf+1jy+d8v/3qwP4IJjNpvnZ7c/jfJ+z6e/MuTg7evWZf8bN3+9/XC7YwXnsMEquLNJyT3X5186zPJG47Z/7azDk4+eGly31V7vy4tNCqPMIGqmTw5+di/7/948pnknoeTZ7qSbdv732S6Y2Zy8vH9H0Of29yX7/2P/g9oBIIJjImjj+j/gNcKp2QBoIBgAkABwQSAAoIJAAUEEwAKCCYAFBBMACggmABQQDABoIBgAkABwQSAAoIJAAVG++Lr25N0VGOQ8aK9vb07TXbMW7dubbpjTpLHHnusu7e3t6mO+6zjHurumvqV+fWeo9amtN62Mjmxqb7XSZry//VojDaYbUnWVGOQ8WLbtm0dabJjnjp1atMdc9L/vV62bFlTHXdr6zs7Ojs7V9R7jlp7fP28jqS5vtfpj2WzHXOSjPgty52SBYACggkABQQTAAoIJgAUEEwAKCCYAFBAMAGggGACQAHBBIACggkABQQTAAoIJgAUEEwAKCCYAFBAMAGggGACQAHBBIACggkABQQTAAoIJgAUEEwAKCCYAFBAMAGggGACQAHBBIACggkABQQTAAoIJgAUEEwAKCCYAFBAMAGggGACQAHBBIACggkABQQTAAoIJgAUEEwAKCCYAFBAMAGggGACQAHBBIACggkABQQTAAoIJgAUEEwAKCCYAFBAMAGggGACQAHBBIACggkABQQTAAoIJgAUEEwAKCCYAFBAMAGggGACQAHBBIACggkABSaOcv/tSTqqMch40d7e3p0mO+YZrWd0n3LcYfPrPUettU/p6N4x+YGm+l4fe+yxTffznSRbt25txuNuxmMeldEGsy3JmmoMMl5s27atI012zNNnTZy/7smTV9R7jlo79PQt82cd2bmi3nPUWNP9fCfJ1KlTm/G4m/GYk6RlpDs6JQsABQQTAAoIJgAUEEwAKCCYAFBAMAGggGACQAHBBIACggkABQQTAAoIJgAUEEwAKCCYAFBAMAGgwGjf3gsq/NlfX5RHn/rlfreZPOnAtB0wPYfOPDLHzOvMGSdfnNfPP7NqM/zk9m/n//zkv1Xcdun5n8xlFyyu2tcAmo9gUnO7enZkV8+ObNzSlSeeXpqb7rgyR8/rzIcv+0aOnPvGUd33hs2r8+OffqlKkwIMckqWhvDkc/fls395QR5aftuo7ueH1386L+zcWqWpAAZ5hMmY+v33/e8ce+TpFbf1P7pck+XP/Dq3Lv1+1m5YmSTp2b0zX//hB/KVj9+VGdPmDvtrPbT857nrwWuSJBNaJ+bF3t2jnh/gZR5hMqamHzQ7h844suJjXsfr88Zj3paLz/ujfOkP78gbjj5nYPsXdm3NVT/98rC/zu7du/K9az+ZpP850nNOfW/VjgEgEUzqbMrktnzwkq9W3Hb3w9elt7d3WPdz/e3fzOru5UmSRW/7WGZNn1e1GQESwaQBHHbocTl0xpED6y3b1qV74zPF+6/dsDLX3vq1JMmMaXNz4bn/peozAggmDeHgaXMq1pu3ri3e9wfXLc6unh1Jkvf+9mdzwOT2qs4GkAgmDaKnZ2fFuqWl7Efz3kdvyr2P3pQkOebwU3NO53uqPhtAIpg0gL6+vqxZv6LitpnTX/2vZHf17MgPrht8MYIPXPiFtLS0VHs8gCSCSQN45Mnbs/2FTQPrQ2ccVXRZyTW3fm3gkpSz3nxZjjvqjDGbEUAwqatNW9fme9f+ScVtC8784Kvut3rt8tzwz99M0n8Zyb9d+LkxmQ/gZV64gDG1acvzA48CX7arZ0c2bF6dR5/8ZX629PvZvK174N9OPPpt+e2zP/qq9/u9f/xkdr+4K8lLl5EcfHh1BwcYQjAZU9/6vx8u2u6AKVOz4MwP5dLzP5WJEybtd9s7H7g6Dy3/eRKXkQC1I5jU3RFzTswlb/94zjjpXWltnbDfbXfs3JK/ueEzA2uXkQC14jlM6u6Zrkfyzb/7UD7+1dPz8G9u3++2P77lS9mweXUSl5EAteURJmPq0x/+x5y4x2vFJv3PYW7Zvj5Pr3owdz5wde64/8fp6+vNmvUr8qXvXJY/+HffzWlvXLTXfa3seiQ33/HXA2uXkQC15BEmNTd50oGZNX1eTn3Dwvzee6/Mf/1P12TypAOTJC/27s5fLfm9rNv4bMU+fX19+d61nxh4B5Kz3nSpy0iAmhJM6u7Eo8/Je97x6YH1jp1bct1t36jY5p/v/bs8tuLOJP3Bfd87P1/LEQEEk8Zw7mnvr/iDnzsfvLri36+/7YqBz88+5fL09fVm7YaVr/ixfcemiv2379hU8e87d20f2wMCXnM8h0lDaDtgWuYcckxWrXk8Sf87lqzdsHLgXUx29bwwsO2td/8gt979g2Hd/013XJmb7rhyYP1H7//hPp8nBXglHmHSMNoPPLhivWnLmvoMArAPgknDGHqadMIEJ0CAxuE3Eg1h9+5d6er+TcVt06YeOvD5FZ+6f1j39+NbvpirfvoXA+tLz/9kLrtg8X72ANg/jzBpCHc9eO3Am0AnyayDD8+s6fPqOBFAJcGk7p567v784Po/rbjtzDe9u07TAOybU7KMqX29W0nP7p3ZvmNTVq19Ivc/fkvufui6gRckSJLpUzty8Xl/XOtRAfZLMBlTpe9W8rKpbTPzqQ/+Q9oPnD5GEwGMjGDSEFpaWnPGSe/KBy7888yYNrfe4wDsRTCpuUkTp+SAKVNzUPusHDH7xBx7xFvy1jdd4o98gIYmmFTVZz5yXb1HSJJcdsFil5EAVeWvZAGggGACQAHBBIACggkABQQTAAoIJgAUEEwAKCCYAFBAMAGggGACQAHBBIACggkABQQTAAqM9t1KtifpqMYg48Vjjz3W3dvb21THvOWZ2d1TD2mdX+85au3Be3tXHrT2+ab6Xnd1dXXPmTOnqY45SZ544onuNNnvsiTNeMyjMtpgtiVZU41Bxott27Z1LFu2rKmOOUlH1mVFvYeog46sa66f7yQdXV1dzXbMSX84mu24m/GYk6RlpDs6JQsABQQTAAoIJgAUEEwAKCCYAFBAMAGggGACQAHBBIACggkABQQTAAoIJgAUEEwAKCCYAFBAMAGgwGjf3gsAhu2iiy7K2WefXXHbkiVLcs8999RpolfnESYANTV37tyceeaZ9R5j2AQTgJq65JJLMmHChHqPMWyCCUDNnH766TnqqKOSJC+++GKdpxkewQSgJtra2rJw4cIkyebNm/PII4/UeaLhEUwAamLhwoVpb29Pktx8883ZtWtXnScaHsEEYMwdccQROe2005Ikzz77bEP/NewrEUwAxlRLS0suueSStLb2J+f6669PX19fnacaPsEEYEydddZZmTdvXpLkgQceyIoVK+o70AgJJgBjZurUqVmwYEGSpKenJzfeeGOdJxo5wQRgzCxatCgHHnhgkuQXv/hFNmzYUOeJRk4wARgTRx99dDo7O5P0X0Zy66231nmi0RFMAKqutbU1F1988cB6PF5GMpRgAlB155xzTmbPnp1k/F5GMpRgAlBV06dPz/nnnz+wvuGGG8blZSRDCSYAVXXRRRdlypQpSfovI3nqqafqPFF1CCYAVXP88cfnpJNOSjL+LyMZSjABqIqJEyfmXe9618B6vF9GMpRgAlAV5513Xg455JAkr43LSIaaWO8BAHhtOPfccwc+v+uuu9Le3j7w7iT7Mnny5Ip1W1tbZsyYMbDevHlzQ71npmACUBWTJk0a+HzBggUDL4lXatGiRVm0aNHA+oorrsjq1aurNt9oOSULAAUEEwAKOCULQFUsXrx4WNtffvnlectb3jKwXrJkSUO/IpBHmABQQDABoIBgAkABwQSAAoIJAAUEEwAKuKwEgLpYsmRJlixZUu8xinmECQAFBBMACggmABQQTAAoIJgAUEAwAaCAYAJAAcEEgAKCCQAFBBMACggmABQQTAAoIJgAUKClr6+v3jMAQMPzCBMACggmABQQTAAoIJgAUEAwAaCAYAJAAcEEgAKCCQAFBBMACggmABQQTAAoIJgAUEAwAaCAYAJAgf8POLCr/D6A/2oAAAAASUVORK5CYII=\n",
      "text/plain": [
       "<Figure size 555x555 with 1 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "filename = '04_one_coin_only'\n",
    "env = load_object(f'{filepath}/{filename}.pkl')\n",
    "env.display(display_values=True, dpi=150)"
   ]
  },
  {
   "cell_type": "raw",
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 494
    },
    "id": "lZ9uwGpjKNR2",
    "outputId": "6d8946f6-340f-45e3-cc74-ee203ab08436"
   },
   "source": [
    "# Say we want to edit one of the coin values:\n",
    "\n",
    "env.inital_shutdown_time = 5\n",
    "env.delays[(4,1)] = 7\n",
    "\n",
    "env.max_steps = env.inital_shutdown_time + sum(env.delays.values())\n",
    "# env.coins[(2,0)] = 10\n",
    "\n",
    "env.reset()\n",
    "env.display(display_values=True, dpi=150)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_transition_dict(env):\n",
    "    \n",
    "    env_state_shape = env.env_shape + (2,)*env.n_flags\n",
    "    \n",
    "    transition_dict = {}\n",
    "    for i in range (np.prod(env_state_shape)):\n",
    "        env.reset()\n",
    "        state=np.unravel_index(i, env_state_shape)\n",
    "        env.steps_until_shutdown=5\n",
    "        \n",
    "        action_results={}\n",
    "        for j in range(4):\n",
    "            env.state=state\n",
    "#                 print(env.state, j)\n",
    "            env.step(j)\n",
    "            v = np.ravel_multi_index(env.state, (env_state_shape))\n",
    "            action_results[j]=v\n",
    "        transition_dict[state]=action_results\n",
    "            \n",
    "        env.current_episode -= 1 # Undo increment of current_episode\n",
    "\n",
    "    env.reset()\n",
    "    return transition_dict\n",
    "\n",
    "# Precompute transition dict.\n",
    "transition_dict = get_transition_dict(env)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {
    "id": "bJjEiLVkDRE3"
   },
   "outputs": [],
   "source": [
    "ACTIONS = [\"up\", \"down\", \"left\", \"right\"]\n",
    "\n",
    "# Precompute transition dict.\n",
    "transition_dict = get_transition_dict(env)\n",
    "\n",
    "# Precompute occupied: This array is used if we decide to randomize the starting position\n",
    "occupied = env.walls.copy()\n",
    "for pos in tuple(env.coins.keys()) + tuple(env.delays.keys()):\n",
    "    occupied[pos] = 1\n",
    "\n",
    "def get_random_starting_pos(occupied):\n",
    "    starting_pos_index = random.randint(0, np.sum(occupied==0)-1)\n",
    "    return tuple(np.array(np.where(occupied==0))[:, starting_pos_index])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "S0j11zB_Gg2j"
   },
   "source": [
    "### Define Agent Parameters"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {
    "id": "ZY4HhiJ6Gdki"
   },
   "outputs": [],
   "source": [
    "# Reward Discounting Factor\n",
    "lambda_factor = 0.9\n",
    "meta_episode_size = 32\n",
    "\n",
    "# Agent Parameters:\n",
    "\n",
    "# - Time Discount Factor\n",
    "gamma = 0.9\n",
    "\n",
    "# - Epsilon\n",
    "epsilon_initial = 1.0\n",
    "epsilon_min = 0.001\n",
    "steps_to_decay = 1024\n",
    "epsilon_decay_factor=(epsilon_min/epsilon_initial)**(1/steps_to_decay)\n",
    "\n",
    "# - Learning Rate\n",
    "lr_initial = 0.25\n",
    "lr_min = 0.001\n",
    "lr_decay_factor = (lr_min / lr_initial)**(1/steps_to_decay)\n",
    "lr_scheduler = lambda current_lr : max(current_lr * lr_decay_factor, lr_min)\n",
    "\n",
    "agent_params = {\n",
    "    'discount_factor' : gamma                ,\n",
    "    'epsilon'         : epsilon_initial      ,\n",
    "    'epsilon_decay'   : epsilon_decay_factor ,\n",
    "    'epsilon_min'     : epsilon_min          ,\n",
    "    'learning_rate'   : lr_initial           ,\n",
    "    'lr_scheduler'    : lr_scheduler\n",
    "}\n",
    "\n",
    "\n",
    "# The \"discount_matrix\" efficently transfroms rewards into discounted returns\n",
    "discount_matrix = get_discount_matrix(256, discount_factor=gamma)\n",
    "# plt.imshow(discount_matrix, cmap='Blues')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {
    "id": "f1hTgN_5Hd1W"
   },
   "outputs": [],
   "source": [
    "def compute_trajectory_probs(env, agent, transition_dict):\n",
    "    ev, final_state_distribution = evaluate_agent(env, agent, transition_dict)\n",
    "    return final_state_distribution.sum(0).sum(0)\n",
    "\n",
    "\n",
    "def evaluate_agent(env, agent, transition_dict):\n",
    "\n",
    "    e_x = np.exp(agent.logits)\n",
    "    probs = e_x / e_x.sum(axis=-1, keepdims=True)\n",
    "\n",
    "    env_state_shape = env.env_shape + (2,)*env.n_flags\n",
    "    n_states=np.prod(env_state_shape)\n",
    "    transition_matrix=np.zeros((n_states,n_states))\n",
    "\n",
    "    for state_index in range(np.prod(env_state_shape)):\n",
    "        state=np.unravel_index(state_index, env_state_shape)\n",
    "        for i,p in enumerate(probs[state]):\n",
    "            j = transition_dict[state][i]\n",
    "            transition_matrix[j,state_index] += p\n",
    "\n",
    "    starting_state = env.starting_pos + (1,)*env.n_flags\n",
    "    starting_state_index = np.ravel_multi_index(starting_state, env_state_shape)\n",
    "\n",
    "    distribution = np.linalg.matrix_power(transition_matrix, env.max_steps)[:, starting_state_index]\n",
    "    distribution = distribution.reshape(env_state_shape)\n",
    "    return None, distribution # Temporarially removed feature which computes EV"
   ]
  },
  {
   "cell_type": "raw",
   "metadata": {},
   "source": [
    "def compute_DREST_factor(trajectory_counts):\n",
    "    excess_counts = trajectory_counts - trajectory_counts.mean()\n",
    "    return lambda_factor**excess_counts[delay_flag_state]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 1000
    },
    "id": "ArPmlX6oHISJ",
    "outputId": "2ab2ab68-9e79-445f-9e7f-dd6849097c92"
   },
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Last Meta-Episode Trajectories: [ 5. 27.]:  25%|██▌       | 257/1024 [00:06<00:20, 37.58it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Training Run 1 failed, Retrying...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Last Meta-Episode Trajectories: [10. 22.]:  25%|██▌       | 257/1024 [00:06<00:19, 39.98it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Training Run 2 failed, Retrying...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Last Meta-Episode Trajectories: [ 5. 27.]:  25%|██▍       | 254/1024 [00:06<00:20, 38.15it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Training Run 3 failed, Retrying...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Last Meta-Episode Trajectories: [ 5. 27.]:  25%|██▌       | 256/1024 [00:06<00:19, 38.40it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Training Run 4 failed, Retrying...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Last Meta-Episode Trajectories: [ 3. 29.]:  14%|█▍        | 142/1024 [00:04<00:27, 31.84it/s]"
     ]
    },
    {
     "ename": "KeyboardInterrupt",
     "evalue": "",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mKeyboardInterrupt\u001b[0m                         Traceback (most recent call last)",
      "\u001b[0;32m<ipython-input-7-725b6b4a381f>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[1;32m     83\u001b[0m         \u001b[0;32mreturn\u001b[0m \u001b[0mresults\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     84\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 85\u001b[0;31m \u001b[0mresults\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mtrain_multiple\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m     86\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     87\u001b[0m \u001b[0magent\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mresults\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'agent'\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m<ipython-input-7-725b6b4a381f>\u001b[0m in \u001b[0;36mtrain_multiple\u001b[0;34m()\u001b[0m\n\u001b[1;32m     73\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mtrain_multiple\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     74\u001b[0m     \u001b[0;32mfor\u001b[0m \u001b[0mi\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mrange\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m20\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 75\u001b[0;31m         \u001b[0mresults\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mtrain\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m     76\u001b[0m         \u001b[0;32mif\u001b[0m \u001b[0mresults\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'found_coin_after_delay_count'\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m>\u001b[0m \u001b[0;36m10\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     77\u001b[0m             \u001b[0;32mreturn\u001b[0m \u001b[0mresults\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m<ipython-input-7-725b6b4a381f>\u001b[0m in \u001b[0;36mtrain\u001b[0;34m()\u001b[0m\n\u001b[1;32m     26\u001b[0m             \u001b[0;31m# Simulate episode and update according to REINFORCE algorithm\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     27\u001b[0m             states, actions, returns = run_episode(env, agent, discount_matrix,\n\u001b[0;32m---> 28\u001b[0;31m             starting_pos=env.starting_pos)\n\u001b[0m\u001b[1;32m     29\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     30\u001b[0m             \u001b[0mdelay_flag_state\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mstates\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m-\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m-\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/Library/Mobile Documents/com~apple~CloudDocs/Research/Machine Learning/IPP/paper/shutdown_problem/IPP/rl_utils.py\u001b[0m in \u001b[0;36mrun_episode\u001b[0;34m(env, agent, discount_matrix, starting_pos)\u001b[0m\n\u001b[1;32m     13\u001b[0m     \u001b[0;32mwhile\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0mdone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     14\u001b[0m         \u001b[0mstate\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0menv\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mstate\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 15\u001b[0;31m         \u001b[0maction_index\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0magent\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mchoose_action\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mstate\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m     16\u001b[0m         \u001b[0mold_state\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mcopy\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mstate\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     17\u001b[0m         \u001b[0mnew_state\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mreward\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdone\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0menv\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mstep\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0maction_index\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/Library/Mobile Documents/com~apple~CloudDocs/Research/Machine Learning/IPP/paper/shutdown_problem/IPP/policy_agent.py\u001b[0m in \u001b[0;36mchoose_action\u001b[0;34m(self, state)\u001b[0m\n\u001b[1;32m     22\u001b[0m     \u001b[0;32mdef\u001b[0m \u001b[0mchoose_action\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mstate\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     23\u001b[0m         \u001b[0;32mif\u001b[0m \u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrandom\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrandom\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m<\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mepsilon\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 24\u001b[0;31m             \u001b[0;32mreturn\u001b[0m \u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrandom\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mchoice\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mrange\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mlen\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mactions\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m     25\u001b[0m         \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     26\u001b[0m             \u001b[0maction_index\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0msample_with_softmax\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mlogits\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mstate\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;31mKeyboardInterrupt\u001b[0m: "
     ]
    }
   ],
   "source": [
    "def train():\n",
    "\n",
    "    # Iniitalize Agent\n",
    "    agent = Policy_Agent(env.env_shape, env.n_flags, ACTIONS, **agent_params)\n",
    "\n",
    "    meta_episode_histories = []\n",
    "    meta_expected_value_history = []\n",
    "    trajectory_probs_history = []\n",
    "\n",
    "    # n_episodes = 1024*16\n",
    "    meta_episodes = 1024 #n_episodes // meta_episode_size\n",
    "    found_coin_after_delay_count = 0\n",
    "\n",
    "    trajectory_counts = None\n",
    "    pbar = tqdm(range(meta_episodes), position=0)\n",
    "    for n_meta_episode in pbar:\n",
    "        pbar.set_description(f\"Last Meta-Episode Trajectories: {trajectory_counts}\")\n",
    "\n",
    "        episode_histories = []\n",
    "        trajectory_counts = np.zeros(2)\n",
    "\n",
    "        for n_mini_episode in range(meta_episode_size):\n",
    "            # # Randomize Starting Position\n",
    "            # starting_pos = get_random_starting_pos(occupied)\n",
    "\n",
    "            # Simulate episode and update according to REINFORCE algorithm\n",
    "            states, actions, returns = run_episode(env, agent, discount_matrix,\n",
    "            starting_pos=env.starting_pos)\n",
    "\n",
    "            delay_flag_state = states[-1][-1]\n",
    "\n",
    "            excess_counts = trajectory_counts - trajectory_counts.mean()\n",
    "            reward_attenutation = lambda_factor**excess_counts[delay_flag_state]\n",
    "            trajectory_counts[delay_flag_state] += 1\n",
    "\n",
    "            returns = returns * reward_attenutation\n",
    "            agent.update_policy(states, actions, returns)\n",
    "            episode_histories.append((states, actions, returns))\n",
    "\n",
    "            if states[-1][2:] == (0,0):\n",
    "                found_coin_after_delay_count += 1\n",
    "\n",
    "        # Book-keeping\n",
    "        meta_episode_histories.append(episode_histories)\n",
    "        agent.update_epsilon()\n",
    "        agent.update_learning_rate()\n",
    "\n",
    "#         trajectory_probs = compute_trajectory_probs(env, agent, transition_dict)\n",
    "#         trajectory_probs_history.append(trajectory_probs)\n",
    "\n",
    "#         # Occasionally visualize policy\n",
    "#         if n_meta_episode+1 in [1, 100, 200, 400, 800]:\n",
    "#             # draw_full_policy(env, agent)\n",
    "#             draw_policy(env, agent, (1,1))\n",
    "#             plt.suptitle(f'Meta Episode: {n_meta_episode+1}')\n",
    "#             plt.show()\n",
    "\n",
    "        if n_meta_episode > 256 and found_coin_after_delay_count < 10:\n",
    "            break\n",
    "\n",
    "    results = {'agent' : agent, \n",
    "               'meta_episode_history' : meta_episode_histories, \n",
    "               'trajectory_probs_history' : trajectory_probs_history, \n",
    "               'found_coin_after_delay_count' : found_coin_after_delay_count}\n",
    "        \n",
    "    return results\n",
    "\n",
    "# agent, meta_episode_histories, traj_probs_history, found_coin_after_delay_count = train()\n",
    "\n",
    "# draw_full_policy(env, agent)\n",
    "# plt.suptitle('Trained Agent')\n",
    "\n",
    "def train_multiple():\n",
    "    for i in range(20):\n",
    "        results = train()\n",
    "        if results['found_coin_after_delay_count'] > 10:\n",
    "            return results\n",
    "        else:\n",
    "            print(f'Training Run {i+1} failed, Retrying...')\n",
    "            time.sleep(0.2) # This prevents the prinout order from getting messed up\n",
    "    else:\n",
    "        print('Never found coin after delay')\n",
    "        return results\n",
    "        \n",
    "results = train_multiple()\n",
    "\n",
    "agent = results['agent']\n",
    "\n",
    "plt.figure(figsize=(3.5,3.5), dpi=150)\n",
    "# plt.figure(figsize=(3.5,2.42), dpi=150)\n",
    "draw_policy(env, agent, (1,1), True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Last Meta-Episode Trajectories: [ 8. 24.]:  25%|██▍       | 254/1024 [00:06<00:20, 36.93it/s]"
     ]
    }
   ],
   "source": [
    "results = train()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "dict_keys(['agent', 'meta_episode_histoy', 'trajectory_probs_history', 'found_coin_after_delay_count'])"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Last Meta-Episode Trajectories: [ 8. 24.]:  25%|██▍       | 254/1024 [00:23<01:11, 10.77it/s]"
     ]
    }
   ],
   "source": [
    "results.keys()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "ename": "NameError",
     "evalue": "name 'agent' is not defined",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mNameError\u001b[0m                                 Traceback (most recent call last)",
      "\u001b[0;32m<ipython-input-8-6b1eaa0a446f>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mdraw_policy\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0menv\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0magent\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
      "\u001b[0;31mNameError\u001b[0m: name 'agent' is not defined"
     ]
    }
   ],
   "source": [
    "draw_policy(env, agent)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "metadata": {
    "collapsed": true,
    "jupyter": {
     "outputs_hidden": true
    }
   },
   "outputs": [
    {
     "ename": "KeyboardInterrupt",
     "evalue": "",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mKeyboardInterrupt\u001b[0m                         Traceback (most recent call last)",
      "\u001b[0;32m~/anaconda3/lib/python3.7/site-packages/ipykernel/kernelbase.py\u001b[0m in \u001b[0;36m_input_request\u001b[0;34m(self, prompt, ident, parent, password)\u001b[0m\n\u001b[1;32m    884\u001b[0m             \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 885\u001b[0;31m                 \u001b[0mident\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mreply\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msession\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrecv\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mstdin_socket\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m0\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    886\u001b[0m             \u001b[0;32mexcept\u001b[0m \u001b[0mException\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/anaconda3/lib/python3.7/site-packages/jupyter_client/session.py\u001b[0m in \u001b[0;36mrecv\u001b[0;34m(self, socket, mode, content, copy)\u001b[0m\n\u001b[1;32m    802\u001b[0m         \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 803\u001b[0;31m             \u001b[0mmsg_list\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0msocket\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrecv_multipart\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmode\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcopy\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mcopy\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    804\u001b[0m         \u001b[0;32mexcept\u001b[0m \u001b[0mzmq\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mZMQError\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0me\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/anaconda3/lib/python3.7/site-packages/zmq/sugar/socket.py\u001b[0m in \u001b[0;36mrecv_multipart\u001b[0;34m(self, flags, copy, track)\u001b[0m\n\u001b[1;32m    469\u001b[0m         \"\"\"\n\u001b[0;32m--> 470\u001b[0;31m         \u001b[0mparts\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrecv\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mflags\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcopy\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mcopy\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtrack\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mtrack\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    471\u001b[0m         \u001b[0;31m# have first part already, only loop while more to receive\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32mzmq/backend/cython/socket.pyx\u001b[0m in \u001b[0;36mzmq.backend.cython.socket.Socket.recv\u001b[0;34m()\u001b[0m\n",
      "\u001b[0;32mzmq/backend/cython/socket.pyx\u001b[0m in \u001b[0;36mzmq.backend.cython.socket.Socket.recv\u001b[0;34m()\u001b[0m\n",
      "\u001b[0;32mzmq/backend/cython/socket.pyx\u001b[0m in \u001b[0;36mzmq.backend.cython.socket._recv_copy\u001b[0;34m()\u001b[0m\n",
      "\u001b[0;32m~/anaconda3/lib/python3.7/site-packages/zmq/backend/cython/checkrc.pxd\u001b[0m in \u001b[0;36mzmq.backend.cython.checkrc._check_rc\u001b[0;34m()\u001b[0m\n",
      "\u001b[0;31mKeyboardInterrupt\u001b[0m: ",
      "\nDuring handling of the above exception, another exception occurred:\n",
      "\u001b[0;31mKeyboardInterrupt\u001b[0m                         Traceback (most recent call last)",
      "\u001b[0;32m<ipython-input-37-760d716a137a>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0minp\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0minput\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m\"\"\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m      2\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0minp\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mACTIONS\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      3\u001b[0m     \u001b[0maction_index\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mACTIONS\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mindex\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0minp\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      4\u001b[0m     \u001b[0menv\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mstep\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0maction_index\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      5\u001b[0m     \u001b[0menv\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mdisplay\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/anaconda3/lib/python3.7/site-packages/ipykernel/kernelbase.py\u001b[0m in \u001b[0;36mraw_input\u001b[0;34m(self, prompt)\u001b[0m\n\u001b[1;32m    858\u001b[0m             \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_parent_ident\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    859\u001b[0m             \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_parent_header\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 860\u001b[0;31m             \u001b[0mpassword\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mFalse\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    861\u001b[0m         )\n\u001b[1;32m    862\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/anaconda3/lib/python3.7/site-packages/ipykernel/kernelbase.py\u001b[0m in \u001b[0;36m_input_request\u001b[0;34m(self, prompt, ident, parent, password)\u001b[0m\n\u001b[1;32m    888\u001b[0m             \u001b[0;32mexcept\u001b[0m \u001b[0mKeyboardInterrupt\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    889\u001b[0m                 \u001b[0;31m# re-raise KeyboardInterrupt, to truncate traceback\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 890\u001b[0;31m                 \u001b[0;32mraise\u001b[0m \u001b[0mKeyboardInterrupt\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    891\u001b[0m             \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    892\u001b[0m                 \u001b[0;32mbreak\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;31mKeyboardInterrupt\u001b[0m: "
     ]
    }
   ],
   "source": [
    "inp = input(\"\")\n",
    "if inp in ACTIONS:\n",
    "    action_index = ACTIONS.index(inp)\n",
    "    env.step(action_index)\n",
    "    env.display()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(4, 1, 1, 1)"
      ]
     },
     "execution_count": 38,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "env.state"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{(4, 1): 4}"
      ]
     },
     "execution_count": 39,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "env.delays"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [
    {
     "ename": "ValueError",
     "evalue": "0 is not in list",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mValueError\u001b[0m                                Traceback (most recent call last)",
      "\u001b[0;32m<ipython-input-22-f44779287e8f>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mACTIONS\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mindex\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
      "\u001b[0;31mValueError\u001b[0m: 0 is not in list"
     ]
    }
   ],
   "source": [
    "ACTIONS.index(0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "move = "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 96,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "dict_keys(['agent', 'meta_episode_histoy', 'trajectory_probs_history', 'found_coin_after_delay_count'])"
      ]
     },
     "execution_count": 96,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "results.keys()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 101,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_moving_average(arr, n):\n",
    "    return np.convolve(arr, np.ones(n)/n, mode='valid')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {
    "collapsed": true,
    "jupyter": {
     "outputs_hidden": true
    }
   },
   "outputs": [
    {
     "ename": "NameError",
     "evalue": "name 'agent' is not defined",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mNameError\u001b[0m                                 Traceback (most recent call last)",
      "\u001b[0;32m<ipython-input-8-dc5f01490b2d>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[1;32m      2\u001b[0m     \u001b[0;32mfor\u001b[0m \u001b[0mj\u001b[0m \u001b[0;32min\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      3\u001b[0m         \u001b[0mplt\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msubplot\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m2\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;36m2\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;36m2\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0mi\u001b[0m\u001b[0;34m+\u001b[0m\u001b[0mj\u001b[0m\u001b[0;34m+\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 4\u001b[0;31m         \u001b[0mplt\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mimshow\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mevaluate_agent\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0menv\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0magent\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtransition_dict\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0mi\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0mj\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvmin\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvmax\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m.1\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m      5\u001b[0m         \u001b[0mplt\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mtitle\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mi\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0mj\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      6\u001b[0m         \u001b[0mplt\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcolorbar\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;31mNameError\u001b[0m: name 'agent' is not defined"
     ]
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAMsAAACGCAYAAABzPX6BAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjMuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8vihELAAAACXBIWXMAAAsTAAALEwEAmpwYAAAJF0lEQVR4nO3dX4wdZR3G8e8jFYiIsFBMiNLSxmIpaChsEEOiGLWUmhQSjLYJsTXVBgRM9ErDBabcoEZJSFBotAFM5O/VGiGkWpomhALbgBRqgLaithIpbOEGRFp+XsxbnR673d9u33POHvp8kpOdMzPved852Wdn5pzZ3ygiMLOJfaDfAzAbFA6LWZLDYpbksJglOSxmSQ6LWdKEYZG0TtKrkp4bZ7kk3Sppu6RnJZ3fWrZC0kvlsaLmwM16LbNnuRNYfJjllwHzymM18EsASacANwKfAS4EbpQ0dCSDNeunCcMSEZuAscOscjlwdzQ2AydLOh24FFgfEWMRsRdYz+FDZzat1Thn+Rjw99bzXWXeePPNBtKMfg8AQNJqmkM4TjjhhAvmz5/f5xHZ+9mWLVtei4jTJtuuRlh2A2e0nn+8zNsNXNIxf+OhXiAi1gJrAYaHh2N0dLTCsMwOTdJfp9KuxmHYCPCN8qnYRcCbEfEK8AiwSNJQObFfVOaZDaQJ9yyS7qHZQ8yUtIvmE64PAkTE7cBDwBJgO/AW8M2ybEzSTcBT5aXWRMThPigwm9YmDEtELJ9geQDXjrNsHbBuakMzm178Db5ZksNiluSwmCU5LGZJDotZksNiluSwmCU5LGZJDotZksNiluSwmCU5LGZJDotZksNiluSwmCU5LGZJqbBIWizphVJI7weHWH6LpGfK40VJb7SW7W8tG6k4drOeyvxb8THAbcCXacoZPSVpJCK2HVgnIr7XWv96YGHrJd6OiPOqjdisTzJ7lguB7RGxMyL+DdxLU1hvPMuBe2oMzmw6yYQlXSxP0mxgDrChNft4SaOSNku6YqoDNeu32kX2lgEPRsT+1rzZEbFb0lxgg6StEbGj3ahdZG/WrFmVh2RWR2bPMl4RvUNZRschWETsLj930hTZW9jZKCLWRsRwRAyfdtqkCwWa9UQmLE8B8yTNkXQsTSD+71MtSfOBIeDx1rwhSceV6ZnAxcC2zrZmgyBTN2yfpOtoqkkeA6yLiOclrQFGI+JAcJYB98bB9wo/G7hD0ns0wby5/Sma2SDRwb/b/edax9ZtkrZExPBk2/kbfLMkh8UsyWExS3JYzJIcFrMkh8UsyWExS3JYzJIcFrMkh8UsyWExS3JYzJIcFrMkh8UsyWExS3JYzJJqFdlbKWlPq5jet1rLVkh6qTxW1By8WS9VKbJX3BcR13W0PQW4ERgGAthS2u6tMnqzHupGkb22S4H1ETFWArIeWDy1oZr1V80ie1dKelbSg5IOlE5KtZW0uhTiG92zZ09y6Ga9VesE/3fAmRHxaZq9x12Taey6YTYIqhTZi4jXI+Kd8vRXwAXZtmaDokqRPUmnt54uBf5cph8BFpVie0PAojLPbODUKrL3XUlLgX3AGLCytB2TdBNN4ADWRMRYF7bDrOtcZM+OOi6yZ9ZlDotZksNiluSwmCU5LGZJDotZksNiluSwmCU5LGZJDotZksNiluSwmCU5LGZJDotZksNillSrbtj3JW0rBSv+KGl2a9n+Vj2xkc62ZoOiVt2wp4HhiHhL0jXAT4Cvl2VvR8R5dYdt1ntV6oZFxKMR8VZ5upmmMIXZ+0rNumEHrAIebj0/vtQE2yzpiskP0Wx6mPAwbDIkXUVTqvXzrdmzI2K3pLnABklbI2JHR7vVwGqAWbNm1RySWTVV6oYBSPoScAOwtFVDjIjYXX7uBDYCCzvbusieDYJadcMWAnfQBOXV1vwhSceV6ZnAxUBnQXGzgVCrbthPgQ8DD0gC+FtELAXOBu6Q9B5NMG8+RPV9s4HgumF21HHdMLMuc1jMkhwWsySHxSzJYTFLcljMkhwWsySHxSzJYTFLcljMkhwWsySHxSzJYTFLcljMkhwWsySHxSypVpG94yTdV5Y/IenM1rIflvkvSLq04tjNemrCsLSK7F0GLACWS1rQsdoqYG9EfAK4BfhxabuA5n/2zwEWA78or2c2cKoU2SvP7yrTDwJfVPPP+JcD90bEOxHxF2B7eT2zgVOryN5/14mIfcCbwKnJtmYDoWqRvalqF9kD3pH0XJ+GMhN47Sjqt59993ObPzmVRpmwZIrsHVhnl6QZwEnA68m2RMRaYC2ApNGpVN6ooV99e5t73/dU2lUpsleeryjTXwU2RFNjaQRYVj4tmwPMA56cykDN+q1Wkb1fA7+RtB0YowkUZb37aapQ7gOujYj9XdoWs+6KiGn1AFYfbX17mwej72lXkdJsuvLlLmZJfQvLkVxC04O+x71HZjf7ba13paSQVOXToky/kr5Wtvl5Sb+t0W+mb0mzJD0q6enyfi+p1O86Sa+O9zWEGreWcT0r6fwJX7RPx4zHADuAucCxwJ+ABR3rfAe4vUwvA+7rYd9fAD5Upq+p0Xem37LeicAmmtsNDvdoe+fR3Bd0qDz/aA/f67XANWV6AfBypb4/B5wPPDfO8iU0d6gTcBHwxESv2a89y5FcQtP1vqM798jMbDPATTTX1v2rQp/Zfr8N3BYRewGidY+dHvQdwEfK9EnAP2p0HBGbaD6ZHc/lwN3R2AycLOn0w71mv8JyJJfQ9KLvts57ZHat33IocEZE/L5Cf+l+gbOAsyQ9Vu79ubiHff8IuErSLuAh4PpKfU9k0pdiTYvLXaarce6R2a2+PgD8HFjZ7b4OYQbNodglNHvRTZI+FRFv9KDv5cCdEfEzSZ+l+b7u3Ih4rwd9T0q/9iyTuYSGjktoetH3uPfI7GK/JwLnAhslvUxzHD1S4SQ/s727gJGIeDeaq8NfpAnPkcr0vQq4HyAiHgeOp7lurNtSvwcHqXEyNYWTrxnATmAO/zvxO6djnWs5+AT//h72vZDmxHReL7e5Y/2N1DnBz2zvYuCuMj2T5vDk1B71/TCwskyfTXPOokrv+ZmMf4L/FQ4+wX9ywter9cswhQ1ZQvMXbAdwQ5m3huYvOTR/YR6g+R+YJ4G5Pez7D8A/gWfKY6QX/XasWyUsye0VzSHgNmArsKyH7/UC4LESpGeARZX6vQd4BXiXZs+5CrgauLq1zbeVcW3NvNf+Bt8syd/gmyU5LGZJDotZksNiluSwmCU5LGZJDotZksNilvQfW3XWBPtS8YMAAAAASUVORK5CYII=\n",
      "text/plain": [
       "<Figure size 432x288 with 1 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "for i in [0,1]:\n",
    "    for j in [0,1]:\n",
    "        plt.subplot(2,2,2*i+j+1)\n",
    "        plt.imshow(evaluate_agent(env, agent, transition_dict)[1][:,:,i,j], vmin=0, vmax=.1)\n",
    "        plt.title((i,j))\n",
    "        plt.colorbar()\n",
    "        plt.axis('off')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 105,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(0.0, 1.0)"
      ]
     },
     "execution_count": 105,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAX8AAAD8CAYAAACfF6SlAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjMuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8vihELAAAACXBIWXMAAAsTAAALEwEAmpwYAAAs6ElEQVR4nO3deXhV1b3/8fc3M0kgYRYS5kEGAcGo4Dyg4lC9DnVobau1Wtvaqtfan7b3WvW2915rq7W3WuehVqvWkapVW0VREQQUQeYwhykhQAYIZDjr98c6h3MSMgEnOZH9eT1Pnj2t7L3Ozs53772mY845REQkWJISnQEREWl/Cv4iIgGk4C8iEkAK/iIiAaTgLyISQAr+IiIB1GLwN7PHzazYzL5sYruZ2R/MrNDM5pvZhPhnU0RE4qk1T/5PAlOa2X4mMCz8cw3wpwPPloiItKUWg79zbjqwtZkk5wF/dt5MINfM+sQrgyIiEn8pcdhHHrAuZrkovG5jw4Rmdg3+7YCsrKwjRowYEYfDi4gEx9y5c7c453oe6H7iEfxbzTn3MPAwQEFBgZszZ057Hl5E5CvPzNbEYz/xaO2zHugXs5wfXiciIh1UPIL/VODb4VY/E4Ey59xeRT4iItJxtFjsY2Z/BU4CephZEfBLIBXAOfcg8CZwFlAI7ASubKvMiohIfLQY/J1zl7Ww3QE/iluORESkzamHr4hIACn4i4gEkIK/iEgAKfiLiASQgr+ISAAp+IuIBJCCv4hIACn4i4gEkIK/iEgAKfiLiASQgr+ISAAp+IuIBJCCv4hIACn4i4gEkIK/iEgAKfiLiASQgr+ISAAp+IuIBJCCv4hIACn4i4gEkIK/iEgAKfiLiASQgr+ISAAp+IuIBJCCv4hIACn4i4gEkIK/iEgAKfiLiASQgr+ISAAp+IuIBJCCv4hIACn4i4gEkIK/iEgAKfiLiASQgr+ISAC1Kvib2RQzW2pmhWZ2SyPb+5vZNDP73Mzmm9lZ8c+qiIjES4vB38ySgfuBM4FRwGVmNqpBsv8AXnDOjQcuBR6Id0ZFRCR+WvPkfxRQ6Jxb6ZyrBp4DzmuQxgFdwvM5wIb4ZVFEROKtNcE/D1gXs1wUXhfrduByMysC3gR+3NiOzOwaM5tjZnNKSkr2I7siIhIP8arwvQx40jmXD5wFPG1me+3bOfewc67AOVfQs2fPOB1aRET2VWuC/3qgX8xyfnhdrKuAFwCcc58AGUCPeGRQRETirzXBfzYwzMwGmVkavkJ3aoM0a4FTAcxsJD74q1xHRKSDajH4O+dqgeuAt4HF+FY9C83sTjM7N5zsJuBqM/sC+CtwhXPOtVWmRUTkwKS0JpFz7k18RW7sutti5hcBx8Y3ayIi0lbUw1dEJIAU/EVEAkjBX0QkgBT8RUQCSMFfRCSAFPxFRAJIwV9EJIAU/EVEAkjBX0QkgBT8RUQCSMFfRCSAFPxFRAJIwV9EJIAU/EVEAkjBX0QkgBT8RUQCSMFfRCSAFPxFRAJIwV9EJIAU/EVEAkjBX0QkgBT8RUQCSMFfRCSAFPxFRAJIwV9EJIAU/EVEAkjBX0QkgBT8RUQCSMFfRCSAFPxFRAJIwV9EJIAU/EVEAkjBX0QkgBT8RUQCqFXB38ymmNlSMys0s1uaSHOxmS0ys4Vm9mx8sykiIvGU0lICM0sG7gdOA4qA2WY21Tm3KCbNMOBW4Fjn3DYz69VWGRYRkQPXmif/o4BC59xK51w18BxwXoM0VwP3O+e2ATjniuObTRERiafWBP88YF3MclF4XazhwHAz+9jMZprZlMZ2ZGbXmNkcM5tTUlKyfzkWEZEDFq8K3xRgGHAScBnwiJnlNkzknHvYOVfgnCvo2bNnnA4tIiL7qjXBfz3QL2Y5P7wuVhEw1TlX45xbBSzD3wxERKQDak3wnw0MM7NBZpYGXApMbZDmVfxTP2bWA18MtDJ+2RQRkXhqMfg752qB64C3gcXAC865hWZ2p5mdG072NlBqZouAacDNzrnStsq0iIgcGHPOJeTABQUFbs6cOQk5tojIV5WZzXXOFRzoftTDV0QkgBT8RUQCSMFfRCSAFPxFRAJIwV9EJIAU/EVEAkjBX0QkgBT8RUQCSMFfRCSAFPxFRAJIwV9EJIAU/EVEAkjBX0QkgBT8RUQCSMFfRCSAFPxFRAJIwV9EJIAU/EVEAkjBX0QkgBT8RUQCSMFfRCSAFPxFRAJIwV9EJIAU/EVEAkjBX0QkgBT8RUQCSMFfRGRfLf8nvPmz9jteKAS1u+O6SwV/EZF99cxF8OlDUFnil+tq2vZ47/wCftULZj8Wt12mxG1PIhI8Zeth6woYdEKic5IYDx4LSSlQvh6ufAv6HQ1JbfBMPfMBP33j3+O2Sz35i0jjQqGW07x1Czz1NXjv11Bb3fZ56iiSws/NlZt94Ad4Ygrc2RXm/dWfuyVvQs2uAz9WqO7A99EIBX+RjqSyGDYtSHQuYMV7PpC9fM3e2yo2wWvXwXu/grJ1ft303/ifplRtg1d+AKUr2ia/7al6B4Rqm97++o2wdgY8dxm89sMDP96WZQe+j0Yo+It0BBvmwe058Nth8OBx+7+fqm3w9xtg59YDy88Hd/vp/Ofh2UthR2l023v/BZ8/DdPvhg2fw4TvQPYhfrmp466dCV88C/83ATZ+cWB5S7SKTX56yn9G153xP3468lyorYInz/bLa2fu/3He+5W/Jh6Y6JePu3H/99UIBX+R5lRtgy3L2/44C/5Wf3nbmn3fR2UJ3DUQ5j4Bj5ziix52bIFlb7euCCdWdWV0ftk/YPFrfr5kKXz+l/ppewyDAcf4+RXvRdc7F52PFI0AzHli3/LS0ZQV+WneETDpOjj/IZj0Q/jFZjjiivppy9fDmzfDPaP2vfhm+t31l0+5DX6+cb+z3ZCCv0hzXrsO/ljgA2hbihSfRLx01b79fslS+O3Q6PK2Vb7oYepP4NmL/Xxr1dVGi2cGHu+nhe/Cx/fB/Uf55ZN/EU3ffSicd380HwB/vx4eO93v5x+3wBs3Rff35UtQvKTxY6+d5X/39hzYON/ffEv2o9jj6Qv8Pt6/q3XpnYN1s+vfsJpSEs57r5Fwxq9h3KV+OTUDBp8EJ95SP/2nD/ubwDv/SatFWhFF/HyDr0hOy2z9Plqg4C/SlFXTYcnrfv7Ziw+8KKUpoRAse6f+uvWf+Xbdsx/z8y1Z+Gp0/qzf+umGebD0DT//5Nnw3DfhibOgvJmnx6I58OZNULMDLnocrngdjvyeb9f+0b3RdMffFJ3vO8EHpV6jYN0sX8k590ko+tQX88z6k083/nI4/JuwuxweOBp2V8I/b4Nd5dF9PX66/12ABS/Aqz+E+4/0T8GfPhJNt242TP+tP3fr50a3PX4m/O0KWPGuX37/v+GBSS2/+cx+FB6bDEveaD4dwOaF0KkrZPfee1tSMpx8K1z+MvzoUzjn99FtsW9FTaks8TfKyI181L/BfxRDWlbLv7uPWtXU08ymAPcBycCjzrn/bSLdhcCLwJHOuTlxy6VIeyjf4Is0Jl3ng9m7d9bfPvtROLENOvas+diXE/c/xpfrmvl25P+6A2be71uW3Fba/D4qNvjpj2ZD14Hw5k992/BYkRvZq9fCxU9DRpf62zfMg0dPjS73GO6nE38IXzzvn8In/ggGHe+D3EVP+CDbORwEh5zin3IXvrJ3/q6bCz2GQk2VPz7A/+T56cf3we1lexeLrJsN68Jl5u/9yk+PuBKSU/xNY+0MWPsJFP7Lb5v7FGyOVJYbHHmVf3so+hSmXgf/9kDT52/VB37amsrV4sXQa7T/OzVlaPg89jwUCq6Eaf8NH/zG3xhTM+qnranyN7ekVJj1IOza7tf3nwRff7L54xyAFoO/mSUD9wOnAUXAbDOb6pxb1CBdZ+B6YFZbZFSkTX1yP7z9cz/f+RBfgVk0G069zQecZy+Bab+G7WvgzLvj8/q9q9wH1O1r/fLX7oOew32TyfQcH/ih+ZYlEWXroc/h/vcbuvhpeOFb0eWV78Njp8HoC+CYH0c/y+s31P+97EP8tPsQuH4e7Crz8xGHXeB/IgafDJ/80Qf3pFQIhTs+jfyaD/wAqZ3g/IfhlQatiGp3RytJI9Y1Uln6xo2+CK5ys1+OBH6ICfzAiLPh7N/5G/o9I2HeM76oKidv732Wb/DnD1qu33HOB/9IUU9rdR8GOH/uLcnfbE78GWTkwPJ34MPf7f07bRj4oXXFPkcBhc65lc65auA54LxG0v0XcBcQh4atIu0sEvjBlzt//mc/P+brkNkNJt/ulz//S/Pl53Ofgtf/PVr2XVMFFZubOOatcN/YaJDLyffTlDQYNjmaru/4lvNfvgG6xAS2q6dF50edC+c9AIddGF1XssQXiUSKZAC2rqq/z8zu0fmsHvUDf2Ny+0fnL3zUnzuA039VP92g4yGrZ/11JUv8zbZzX5/3lE7RbTctg9Hn+/nP/hwN/LHGXx6d79QNJt/h5zv3ia6/d1TjRWj3jIQN4fVfPOvrHCI35Fi7K+HF70J1hS/v3xeRm99fL4Fnv+5vko9P8esaFgeNvQQufMw/hLSh1gT/PCC2NqoovG4PM5sA9HPONVtgZmbXmNkcM5tTUlLSXFKR9rPqQz/tP8k/oc37Cyz+O4w4JxrQBh4L3wuXI29f1/h+KjbB338Ccx6LVnC+fDX8bjgsmlo/7eqPo61mPvszpGXXf5vI7BGd31XWfP6d8xXGXfpG1+VN8AHk2o/98vhv+jL88+4PP4WGbVvjy8z/cqEvbjj9V3D0tf6tYF97qmbHBPRR5/kbzk+X+2KoWF36ws2Fvjx7fPiN5L1f++nZv/N5//dwwYIl+2Kli56I3rwycnzF8U3L4PvT4Zfb4eyY+oj/tyoabM3gp4XRPDx1bv28rJsdne89xk/nPgn/VwCbF9VPO+dxWPiyn8+b0OLpqKf70L3XFS/yf/u5T0LPkf7Nb/IdcM69MOaifdv/fjjg4R3MLAm4B7iipbTOuYeBhwEKCgpaUa0u0g4++SOkZsGZv/Fls6XhV/++h9dP13e8L38vmuPLcRta/Pfo/OoPfWuTiBe+5W8e+QV++eP76v/u4JPqL/ef6MeOyT/SH690RdNP3pWbfSVqjwZFPo0FkPGX+5+Zf/K9cz97yv9EdBvsi4L2R0ZudN7Mv8Fk92o6/cVP+RvX1pWwPNyaqvdoP83sBhc84svMI/v72h+gx6G+WWV6Z78+Ut+QkgZDT4PBJ+59nOye/ib4P3m+yCVWZLiE0RfAeX+EnaX+qf/p830dzzn3RNMuD1fKDznFF7Hti0h+c/v7iuAty+ChE2Bq+FwXfHfvZqJtrDW39vVAv5jl/PC6iM7AYcD7ZrYamAhMNbOCeGVSpEXTf+uD7RfPwaLXWt+TtGqbrzQc/W/QZyyc/6APYpk9/BNwrKRk/zbw5Uu+OWRDi17zwen70+uvPylcpLTuU1+2PeshWP2R7xw17jK/7bQGlcuHXeCDxIWPAq75liKbv/TTXiNa95kBJv7AV2zH6jEcBjUSPFvLzN+sYjs/teZ3Yo8ZW3Q09mLoMy66nJ4NJ/2/aCBt6PIXm75xpWfDCT/zN8nI325XmQ/0vcf4t6K0LH/8gcf5t5IvX4o2/azd7Yuljv4BfOuV/SuLv3GRvwmldvKfa/QF/kYy4dsw7pJ9398Bas2T/2xgmJkNwgf9S4FvRDY658qAPe+oZvY+8FO19pF245zvdQrwyvej629vobikrsZ3ioLoE3mnXLilmQ5WI86BRa9CyWI4ZEx0/Y4tvtXO8Tf5f+wr3oTFU31l54BjfcerjV/4p8lI/cLA4+DQs+CU/4iW98fqeaj/bJk9/L6PuAKSU/dO98ZPAfNNLvfF5Nv9Ww/4SuFR5zabvFW+96+W0zR0yGF+esLNbVrB6cvQHewogS594OM/+KKuy1/e+7j9jvJNTcs3+Eri9Z9B7S5f/Le/GlY2fz2xnd1afPJ3ztUC1wFvA4uBF5xzC83sTjOLw9UicoB2h9uJdx1Uf/2MPzb/e7GtS1r7xBsp610/t/76dbPAhWDY6X554LFw5l0+wJv5G8KGz33giRg+xT+RNhb4I8x8peXCV/ywDQ199HvfoStvgt/XvkhO9X0CrvpnfAL//jr0LLjm/fodx9pCpAK1ItzPoXS5r//IP2LvtL3DN6QvX/LTf9zsp/2Pads8tqNW1eg45950zg13zg1xzv06vO4259zURtKepKd+aVc7tvjpiT+DQ8ZGy74btnNvaF24VfKk61puyRLRbbCvH3j7F74lT0SkdUi3JvaTVwBblvp25wDffXvvdvZNKQ5XPM5rMKxC6Qr41y/9/ITvtG5fDR11tX/KTSQzX5/Slk/94FvoJKXAIyf7FlmrP2q86Sf4Opf8I32l/Gs/8oPt9R4DWd0bT/8VpB6+8tW3M9wBKqsnXPuhLyvfs62JXrmxHYr2paLNDOqq/dg3b/wUnr/cD3q2fR2kZvqKysb0P9pPV7zr3w76T2z9MU8Nl6Fndq//pSFzHvfTkedGm0JK07oNDteh4Ftk7Syt3zw2VqQuYkvMWEYn3dJ42q8oBX/56lsTbs4Yac5nBpc+6+e3rWr0V/YMpDbqPD8w2b74xnN+GmkS+tYtvkNWepemn15jm/rtaxvx426Ec8MtUSKfFWDbat9E8JJGeutK40afD5f+NbrcsBlqrKwe9ZeHTm483VeUgr98tdVW++GH846oH8Qj5f8NOy5FRHqGnnl349ubM3Syr/iNWPCCnyanNf072TEddgbsR6VhpAlj7GiflcXNN6WUxo04C64Id0kafkbT6WL7Wvxn6d7DMnzFKfjLV9viqX4QssjokxGRJ7rGuuuXb/TfsjT20mg78X11+Df3Xvfdt5pOn5TkhzU4+gcw5NSm0zWlc1/f4Wl7bPDf3PjgYtKygcfBbdvqNyXdS7iZZ4/hfjyhg8zB94nk4LVhHuT0q1/ptvojP47MqbfVT5uW6d8GPnvKt2nvlBvdtnKav2Ec+b39z8uIs+Ann0PRXN/OPjmt6crDiHGX7H977uQU/2YT+SIU5/Tkf6Ba6sE8/AzfqzjyRS0HGT35S8e2o9S3zNi2Bh4+EV76bv3taz6GISf7DlgNnfAz36xv3af115cs8TeM1oyZ05xug2Hs1+G0O+CUNm6mCP7LwdfP9a2bimb7kUD15N92MnJ856/9fTvs4PTkLx3bold9y4w5j/nlrSuj20J1UFroO1I1JtJxa9lbMPz06PqSZf4p+qv2Kt9tkO+RfHdMc1IFf9lPX7GrXwKjssSPw96wzD53QHR+51bfsaqpABgZlXLOY75D0yn/6TtClSw+8Kf+RIgd+iDiIH0qlbanYh/peDYv8t9k9Nw3/JDD2b39aJM9Do32kH3/rui3HTUcHjjCDI682s/PetAP7LV+rm8i2X9Sm3+MuMtvpDPWQdTjVNqXnvyl41n0Wv3l0+70X55RscmPRbN5kR+LPqK5oo+Gg4C9fqOfjjh777QdXW4//12uyel+FMwew/1oliL7QU/+0rFUbIYPwt8SesMCOPue6DjuQ0720z9N8s0ev/4knPwfvht+U/LC47ZEmmZu/ALSOjfds7OjS8vydRUjzt73zmkiMfTkLx3Lpw9F53P7++9hjYhtH+/qWjekwchz4MaFfvC01EyY/YgfBK2tx5ER6eD05C8dS6RZZmOBPTZgDz+z9fuMjJo58Qd+tMZz7m0+vUgA6MlfOo5QyH859uGXw7/d33iaq9/zX7t41DWNb29O9yHwg49bTicSAAr+0nGsmwk7t/gv+G5K3hHRcnwR2W8q9pGOY96zfqz8pjptiUjcKPhLx1BbDfOf94E/LSvRuRE56Cn4S8fw0An+S1L6NdNsU0TiRsFfEq90hR9yAfb+Hl4RaRMK/pJ4K6f56df+AENOSWxeRAJCwV8Sb80n0KkbTPi2Ol+JtBMFf0msornw5Yv+awoV+EXajYK/JNbq6X56ws2JzYdIwCj4S+JUFsOH90D3odB7dKJzIxIoCv6SOB/cBbvL4djrE50TkcBR8JfE2FUOsx/zX8Qy4duJzo1I4Cj4S2KsmQE4+Np9ic6JSCAp+EtilK3z07yCxOZDJKAU/CUx3vypnzb1/bsi0qYU/KX9Ve+IzifpEhRJBP3nSfvbttpPT7szodkQCTIFf2l/z3/LT/uOT2w+RAJMwV/aV9U22LrCz+cfldi8iASYgr+0r7Uz/fSKNyA1I7F5EQmwVgV/M5tiZkvNrNDMbmlk+7+b2SIzm29m75rZgPhnVQ4Kqz+C5DR9D69IgrUY/M0sGbgfOBMYBVxmZqMaJPscKHDOjQVeBH4T74zKQWLNDN+2P7VTonMiEmitefI/Cih0zq10zlUDzwHnxSZwzk1zzu0ML84E8uObTTko1NXCpvnQT2X9IonWmuCfB6yLWS4Kr2vKVcA/GttgZteY2Rwzm1NSUtL6XMrBoWwthGqhx7BE50Qk8OJa4WtmlwMFwN2NbXfOPeycK3DOFfTsqZ6dgVKxGR4Jf0Vjt8GJzYuIkNKKNOuBfjHL+eF19ZjZZOAXwInOud3xyZ4cNOY87pt5AvSdkNi8iEirnvxnA8PMbJCZpQGXAlNjE5jZeOAh4FznXHH8sylfeTvCxXwXPqYmniIdQIvB3zlXC1wHvA0sBl5wzi00szvN7NxwsruBbOBvZjbPzKY2sTsJqs1fQv9JMOaiROdERGhdsQ/OuTeBNxusuy1mfnKc8yUHk1AINi+EcZclOiciEqYevtL2NnwO1ZVwyGGJzomIhCn4S9v75P/8VF/cItJhKPhL2yvfCN2H6slfpANR8Je2t30t5B+Z6FyISAwFf2lbmxZAxQboMy7RORGRGAr+0raKF/vpUDUIE+lIFPylbVWG+/zpi9pFOhQFf2lbO4r9+P0ZOYnOiYjEUPCXtlW8GDofAmaJzomIxFDwl7ZTvRMK34WR57acVkTalYK/tJ3NC8HV+TF9RKRDUfCXtlO63E97jkhsPkRkLwr+0nZKV/hpjr7VU6SjUfCXthEKwYe/haxeGr9fpANS8Je2UVrop6PPT2w+RKRRCv7SNopm++mRVyU2HyLSKAV/ib/l/4TXfujnuw9LbF5EpFEK/hJ/797hpxN/CEm6xEQ6olZ9jaNIq1Vt9yN5HncjnHJbi8lFJDH0WCbxtXGenw48Tk/9Ih2Y/jslvpa9A8np0O/oROdERJqh4C/xVbIEeo+C9M6JzomINEPBX+Jr+1rI6ZfoXIhICxT8JX6qd/rg33VgonMiIi1Q8Jf4WTkN6nbD0FMTnRMRaYGCv8TPimmQmgn9j0l0TkSkBQr+Ej8rp8GAYyElLdE5EZEWKPhLfKx4zw/mNuTkRjfvrq3j1c/XUxdyrCipZEbhFgDqQo7q2lBcsvDOwk1MX1YSl32JHOzUw1cO3IIX4e83gCXB8Cl7Vu+qqeOlz4oIhRzPzFrLkk0V3PD8vD3bzx7bhzfmbwTgwcuPYMphh1BTFyI1uXXPJNW1IVKSjKQkY0VJJdc8PReAwl+fSUor9yESVOacS8iBCwoK3Jw5cxJybImjqu1w10BIToPrZkPXAQA45xh3xzuU76pt9a5yM1PJy+3E6z8+Dov5wvfK3bVkp9d/Tpm+rIRvP/4pVxwzkFNG9OLut5eyYH0ZAMcO7c7dF42jb26nA/54Ih2Nmc11zhUc6H705C8HZumbgINvvbIn8AN8tnb7nsD/87NG0LtLBqeN6k16SjK1oRDTlhTzzKy1XH38YLbtrOb65+axfWcN23fW8Pt/LSe/ayfOH5/HR4VbuOKJ2Zw9pg/3XnI4AN94ZCZz1mwD4MkZq3lyxmrM4DcXjeX+aYV8XFjK/3tpPk9deRRJSdYwx01yzhFykLwPvyPyVaUnf/Hqav2XraekU1sXwsxaDoJrPoEnpkB6F/jZKkj2zxLlu2q49KGZlFTu5q3rj6d7dnqLh//5Kwt49fP17Kyu26dsFwzoyrad1bz8g2PJyUxlY1kVN73wBTNWlAJww+Rh3DB5eJO/75zDzFi3dSeXPjyTpCR46sqjWLyxgveXFjOqbxe+NXEAKclJbCyrYnP5bg7vl7tPeWyOc47X5m0gMy2ZrllpFJfvZnz/XA7pkrFPNy4Jjng9+Sv4C9TVUHvfeKyymDVZY5hR0YvlGWM4fVAajDyHiqRczhjdu15RDABv3QozH4DLX4Khk3HO8cGyEq54wn+RywPfnMBZY/q0KguhkKPOOT4u3MLs1Vu5f9qKPdueuPJI/rFgIy/MKdqz7s2fHM/w3tmkJCftVU+wuXwXFz04g3VbqwA4fVRvbj93ND2y00lL8emfmrGaNxZs5PO128nL7cT67VXN5u/aE4fw6IcrqQ05vn5EPuP65TJ5ZG96dU4n5BzJSYaZURfy87tr6ygsruSQLhl73fyqa0Okpfj8vvr5+nr1IBEpScb3jh/MzWccesBvIpEbnBwcFPwDJvJ3ivc/cXVtiOlP/ZLJ6/7Q6PbNLpcpu/+XKyYX8OOTBpI0+2Go2AgDT4BXvg99D6f6spe44+8LeWbWWgDSU5J4+NsFnDi8537nyznH8uJKKnbVcsSArvW2tbZSeMfuWn7xygJenbehVce8+YxD6dk5nWdmrWXioG7065bJtCXFvLukeE+awT2yWLllx16/m5mWzOCeWSzfXEle106sLPFp0lKSuP7UYWwsqyLJjLlrtrFwQznnj8+jpi7E6+EK78E9ssjOSGHi4O4sKCrjk5X+zeU3F43l4oLocBn7Esi3VO7mLzPX8NSM1dx90ThOGdELoNk3igVFZWwsqyI7PYWjB3dn0YZyzOCwvJxWHTPIIv+jzsHSzRV0z06jV+f4f3+1gv9XzMqSSh54fwWH9e1CbmYaPTunc8yQ7tSGHPOLypjQP7fJf+qauhCn3zudupBjTH4OOOickUJykrF9Zw3j++fyveMHtzov84u2k5kcosf2+Tzyzmdcv/VXVFsGU1IeZUdlGa9e1oeeK19j7rJVHF81jSVJw5iy8w5+1+01Ltz5fL19zZjwO+5aN5Iv1m0H4IpjBnLlsQMZ0D1rv89VvN368gL++unaeutuPuNQrj1xCFU1dby7eDPj8nMZ2GPvPNeFHE/OWM2f3i/kv847jDPH9GFt6U6e+XQNWyqqWbt1Bzt217FoYzlpyUkM7ZUNwIg+nfm4cAuby3fX29/gnln06pzOzJVbARjeO5sbJw/nzAZvSM45Trt3OoXFlVw4IZ9zD+/LjMIt/G1uESHnmDS4O0lmnDC8Bxcd0Q8DPlhWQlVNHRu2V3H/tEK27azZ6/N0Sk3moiPyueLYgazdupM+ORn07pxBVU0dd7+9lFc+X9/oOfzFWSMZm59D9+w0hvbyg/Zt3VHNrJWlrN9excyVpZw8ohfdMtOYOLg7XbMOrK/H9p3VbCrfxYhDuhzQfg5U2c4aNpRVMbJP8/mYvqyEHz7zGZW76zdwuOficQzpmc3Y/BzMjFDI8fGKLVTsqqV/t0wOy8th+eYKdteGWn2Dbdfgb2ZTgPuAZOBR59z/NtieDvwZOAIoBS5xzq1ubp8jxxzuXnz7A5yDDduryM1M48iBXdlSWc0X67YzcUj3vVp47KuFG8pYv82/zh96SGcGdM/as657djqllf4fs3t2Ok/NWM3AHll0yUhh1ZYdTBrSnbTkJEIODsvrQn7XzHr7rq0LsWhjOWPycqJBe9MCKCuCgcexdft2Pnr/Ld5aWMyHNYdS4fZueTIuP4f568twDo4c2JXzDs+jYlctizeW70lTubuWmStL95SFpyQZtaG9/2YTB3fj7LF96dMlg09WlvLG/I1sKt9FN8o5MnkpBbaMXraNbKqYlLSITKsflPjO6zDoeMqqasjplBpdP+2/4YO7ovlxGVxVczMXJH3I+6Fx/CN0NGnJSdx+7mi+cXT/1v9x2lFNXYiibVX0zc3AOaiuC9ElI7XlX9wH5btqSDLb65ot31XDlordLN5YQX7XTowL1xdE3gR6d2n6yfCluUXc9LcvGt2Wl9uJ8l01VDTTmmpsfg6j++bQJyeDBevLGN23CzNWlPLpqq17pc1MS8Y5f3OaPLI37y0pZsH6MvJyO1EbCtW7iRUM6IoZzF69rdHjpiQZvzh7JFccM7BVbymFxRXcP20FU7/YsOfpOXKJt1R0WFy+iyufnE1GajJ5uZ3ok5PBhAFdMSAr3b9JNSw2c87x0mfrmbtmK0cP6s7IPl3YUrmbP3+ymrcXbgbg95cczvyiMh7/eNWe3ztiQFfOHtOHLZW7qXOOa08YQk6nVO58fRFPzlhN18xURhzShbH5OZTvqmXWytI9b4kZqUl0zkilrKqmyX4tE/rncv3k4aQlJ/FRYQm1dY7vnziE7TurKSyuZH5RGV2z0vje8YPbJ/ibWTKwDDgNKAJmA5c55xbFpPkhMNY5d62ZXQqc75y7pLn9dukzwF1w5dUNjuVfmZaH8qnunE/njJR6lWuLN1bQIzuNeeu20zenE6Pzonfj7PQUqqrreGvhJnbXhnDOUVNX/7OlJSdRXbd/HYrOH59Hl4wU8rp2YtmGbQxd+hA9a/0re45VcZQtoovtBGCN5dMjVEJWTIDdkjmYtPwJ1NSFKNuxizmdjmHT+jVcGvo7ubWlNPwz7EzK5I2U01iZNIALbBojqr+EroNwfQ4n5By1dQ5nSVT0O4UH1+axedFH7Kr1N4jOVHFsyhKO4Qv6J0U7PZUm96SsJpny5Fw6paVS4TLoduTFDD5yCuQ2Ebh3V8KsP1G2ZSOFX37KrVWXM/6IYzh5RC9G9+3Czuo6+uRmxD2Yile+q4ZpS4pZUbKD9JQkrjpuELtq6sjNTKO2LsSLc4t4b0kx7yzaTM/O6Tx91VEkmdE9K63JinZfp1LI+0tLGNg9k65ZadTUhfiv8w5jfP9oEdv2ndXkZqZRF3JMW1LMHa8vZEtFNX1yMiirqqF0RzU/PmUoXxvXl9VbdpCemoxzjl+9sZjC4krAN989ZUQvTh3Rm8y0ZL9j84G0S0Yq7y7ezLV/mUtNneP88Xnkd/UPSTur63h+9joqd9cyqk8Xrj1pCNOXlfDu4s3siGkUUBdy1IUcXTNTSU9JZlP5rnqf9fB+uYzJyyEjNYnSHdUArCjZsedNNVa3rDS2htNEDO+dTW2d45DwDbSpm+0Zo3vzk1OHMbpv9Ol9Z3Utf5m5hv9+c8medWPzc7i4oB9j8nJ4dd56npqxmpF9unBY3xyen7Ou0X03tOauc9ot+E8CbnfOnRFevhXAOfc/MWneDqf5xMxSgE1AT9fMzgv6Jrs512Q3edwd+Kc0M4jct0POzyclGQ13HXlSSE4yksJPG2aQHJ6vCYUIhdjTKSjkHElmGOx5kk5NNhz+GJG919SFqK1zJFnMMQjRyaopSe5Narjiblt6PjPqRrGqugsX736Z7OQ6qkZdwsBRE0heNR1WfwS1VX7ky51bohnPPgQOu4DapFRWFFeycEM5p4/qTfba96A4fH+1ZDj0TNiy3O8jomKzH0itKb1G+x63g06EnsOh60C27ag+oFfykord9OzccusdaV+FxZXkZqbSoxUtq9paTV2I7zz+KbV1/h+2sTcNgKy0ZHbW1DG6bxfuunBsvcAJULGrhoc+WMnjH6/a8+Z71MBujB+QixH9Hz97TJ89RSZrSnfsCdBvfbmJP04r3LO/bllpe25AfXM68cdvjGfdtp3MKPT1K9+eNJDsjBTWb6uifFcNWekpDIopCqytC7FscyWd0pIpqdjNfe8u4+PCUm6YPIzrTx3W5FtObV2Iil211IZcs/87yzdX8PLn6+ndOZ0ThvekdEc105YUk56SzMTB3eienUZ1rWN0Xk67Bf+LgCnOue+Fl78FHO2cuy4mzZfhNEXh5RXhNFsa7Osa4Jrw4mHAlwf6AQ4SPYAtLaY6+Ok8ROlcROlcRPUAspxz+9+aIqxdO3k55x4GHgYwsznxuHsdDHQuPJ2HKJ2LKJ2LqPC5GBiPfbVmAJT1QOxXM+WH1zWaJlzsk4Ov+BURkQ6oNcF/NjDMzAaZWRpwKTC1QZqpwHfC8xcB7zVX3i8iIonVYrGPc67WzK4D3sY39XzcObfQzO4E5jjnpgKPAU+bWSGwFX+DaMnDB5Dvg43OhafzEKVzEaVzERW3c5GwTl4iIpI4GvRcRCSAFPxFRAIoIcHfzKaY2VIzKzSzWxKRh/ZiZv3MbJqZLTKzhWZ2fXh9NzP7p5ktD0+7htebmf0hfG7mm9mExH6C+DOzZDP73MxeDy8PMrNZ4c/8fLhhAWaWHl4uDG8fmNCMx5GZ5ZrZi2a2xMwWm9mkoF4TZnZj+H/jSzP7q5llBOWaMLPHzaw43Fcqsm6frwMz+044/XIz+05jx2qo3YN/eLiI+4EzgVHAZWY2qr3z0Y5qgZucc6OAicCPwp/3FuBd59ww4N3wMvjzMiz8cw3wp/bPcpu7Hlgcs3wXcK9zbiiwDbgqvP4qYFt4/b3hdAeL+4C3nHMjgHH48xG4a8LM8oCfAAXOucPwjUouJTjXxJPAlAbr9uk6MLNuwC+Bo4GjgF9GbhjNcs616w8wCXg7ZvlW4Nb2zkeifoDX8OMkLQX6hNf1AZaG5x/Cj50USb8n3cHwg+8n8i5wCvA6fjSNLUBKw+sD38JsUng+JZzOEv0Z4nAOcoBVDT9LEK8JIA9YB3QL/41fB84I0jUBDAS+3N/rALgMeChmfb10Tf0kotgn8seOKAqvO+iFX1HHA7OA3s65jeFNm4De4fmD/fz8HvgZEBlhrzuw3TkXGTEr9vPuORfh7WXh9F91g4AS4Ilw8dejZpZFAK8J59x64LfAWmAj/m88l+BdE7H29TrYr+tDFb7txMyygZeAG5xz5bHbnL9dH/Rtbs3sHKDYOTc30XlJsBRgAvAn59x4YAfRV3sgUNdEV+A8/A2xL5DF3sUggdWW10Eign9rhos4qJhZKj7wP+Ocezm8erOZ9Qlv7wNEvi7qYD4/xwLnmtlq4Dl80c99QG54WBCo/3kP1mFDioAi59ys8PKL+JtBEK+JycAq51yJc64GeBl/nQTtmoi1r9fBfl0fiQj+rRku4qBhZobvAb3YOXdPzKbYITG+g68LiKz/drhmfyJQFvMK+JXmnLvVOZfv/MBUl+KHAfkmMA0/LAjsfS4OumFDnHObgHVmdmh41anAIgJ4TeCLeyaaWWb4fyVyLgJ1TTSwr9fB28DpZtY1/CZ1enhd8xJUwXEW/gtiVgC/SHSFSxt/1uPwr23zgXnhn7Pw5ZTvAsuBfwHdwukN3xpqBbAA3woi4Z+jDc7LScDr4fnBwKdAIfA3ID28PiO8XBjePjjR+Y7j5z8cmBO+Ll4Fugb1mgDuAJbgh3h/GkgPyjUB/BVf11GDfyO8an+uA+C74XNSCFzZmmNreAcRkQBSha+ISAAp+IuIBJCCv4hIACn4i4gEkIK/iEgAKfiLiASQgr+ISAD9f1EFzGd+AsemAAAAAElFTkSuQmCC\n",
      "text/plain": [
       "<Figure size 432x288 with 1 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "meta_episode_histories = results['meta_episode_histoy']\n",
    "meta_episodes = len(meta_episode_histories)\n",
    "\n",
    "n = 20\n",
    "\n",
    "button_no_coin_frac = [np.mean([x[0][-1][2:] == (1,0) \n",
    "                      for x in meta_episode_histories[i]]) \n",
    "                         for i in range(meta_episodes)]\n",
    "\n",
    "plt.plot(get_moving_average(button_no_coin_frac, n))\n",
    "\n",
    "\n",
    "button_coin_frac = [np.mean([x[0][-1][2:] == (0,0) \n",
    "                      for x in meta_episode_histories[i]]) \n",
    "                         for i in range(meta_episodes)]\n",
    "\n",
    "plt.plot(get_moving_average(button_coin_frac, n))\n",
    "plt.xlim(0,meta_episodes-n)\n",
    "plt.ylim(0,1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 159,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 159,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "found_coin_after_delay"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 160,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([-3.47212663,  2.10944682, -0.96714821,  2.32982802])"
      ]
     },
     "execution_count": 160,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "agent.logits[1,0,1,1]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 161,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 502
    },
    "id": "hwlSU2kbHKIa",
    "outputId": "a132aa75-608a-453d-db52-09053d436fe4"
   },
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAbQAAAHJCAYAAADtiMxZAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjMuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8vihELAAAACXBIWXMAABcSAAAXEgFnn9JSAABExElEQVR4nO3de5Aj12Ee+u90A5gHZgYDzO7szHAfXIlckeKK5JJckRK5u3Qky7TMq1h24khOLFt2nFxdJ/ZNbsqWU76xKuWqKJYlxa7YFeu6LCbX8ZV9LcVJMbauxeVLu5REaklKXEomKT6XnJmdnQHmgcFggO4+949uYAAsGmi8+nHw/apQsxh0A+csMOfDOX36tJBSgoiIKOq0oAtARETUDww0IiJSAgONiIiUwEAjIiIlMNCIiEgJDDQiIlICA42IiJTAQCMiIiUw0IiISAkMNCIiUgIDjYiIlMBAIyIiJTDQiIhICQw0IiJSAgONiIiUwEAjijghxJ8IIaQQ4h8EXZZ+EkJ8xKnX/x10WSgaBC/wSa0IIQSAvwfgpwHcBmAWgAngMoAlAE8C+DqAs1LKzYZ9/3cA0wD+Ukr57IDKN/DXCDMhxB2w34PnAdwsG/6ghRDXArgHwO2w378TACadh49KKV/zqZw/BOCXAdwFIAPgCoBHAXxOSvm0yz4agOcA3AjgDrftiCoYaORKCDEN4C8BnKn5tQFgE8AUgFjN7z8upXygYf/XABxp9lgfyzjw1wgzIcRjAE4D+PtSyr9o8vgDAH7WZXdfAk0I8SkAv+nclbA/PynnvgHgE1LKP3LZ9yMA/h8Aj0gp/86Ai0oRxyFHauW/wA4zE8BnARwDMCKlnAEwBuAWAL8G4DuBlXCICSHugh1mywD+m8tmFoCXAfw5gE8C+HV/SmcTQvwU9sLsDwHsl1JOAzgE+8tSDMB/EkK8x+Up/gLAKoAfcnqjRK5i7TehYSSEuB7A/+Lc/Q0p5adrH5dSGgC+69x+Wwgx5nMRCfhfnZ9fklKaLtv8Yu1jQoh7B12omtfSAfy2c/erUspKeSGlfNM55ncBwHFnu1ONzyGlNIQQfwbglwD8UwDfHnjBKbLYQyM3t9b8+7+321hKuVP5txDiU0IICXsoEAC+6Bzcr95q9xVCHHf2eVgI8bIQYkcIsSmEeEYI8VtCiH2Nr9fpa9Ts92NCiC8LId4SQuwKIXJCiMeFEJ8QQiTa1TMshBBTAH7Kufunbtu1CDo/nMHe+/PvGh+UUpYA/I5z9x4hxFGX56nU76NCiIn+FpFUwh4aeXEQwPc72D4Pe9LIfthfmjYB7LTY/kHsNXxFAAUAadiheiuAnxNCvE9K+UK3r+H0IP8L7AkuFZVjOaec28eEEB+UUua8VDJgZ2AP+24DCOtkiR92fm4BOO+yzV/X/PsDsIclGz0F+3ORhP0+/XWTbYjYQyNXT8E+gA8AnxVCHPO6o5Tyd6SUcwAuOb/6FSnlXO2tYZfHAPwcgCNSyjHnGN0ogPfDnsF3DRp6IV28xhdgh9krAP4hgJSUMgVgHMDfdX5/F4A/9lrPgJ12fj4dcC+slePOz++7lVFKuQJ7xiMA3OSyTRl7oX2m2TZEAAONXDiz3yozz94F4G+FEE8LIX5fCPHzzjCh6NNr/ayU8j9LKd+o+V1JSnkWwPtg98RuE0Lc083zCyFOAfhHAFYA3Cul/NPKKQZSyqKU8n/Abii3Afy4EOLWDp//5xqHOzu83dtFte50foZ5Qs6C8/OtNttVHl9osc0zzk+3ySNEHHKklv432DPo/iXs4Z4Tzq1iRQjxXwH8eynl5UEUQEqZd6am/xTs86nOdfE0v+D8/K9SykvNNnAmKTwC4H4APwLg2Q6efwd26Har1MU+lcb/SsutglU5363QZrvK45Mttll1frYKPRpyDDRy5cxk/DdCiM/CnvF4BsBJ2Ce6JmCfZP0vAPyMEOLHpJRPdvtaQoj7AfyM8/wHYA8FNjrY5dPf7fz8BSHET7fYrnJu1JEW21xFSvlnAP6sm4L1YL/zM+vz6walUs/9LbeiocZAo7aklBsA/sS5QQgxCru39Muwg24fgC8LIa6XUhY7eW5nNYg/AfDRml8bAHLY67mkYB9TS3ZZhcq3+inn1k6zMA2bUefnbqClaG3L+dnu/7Py+FaLbSoTfkZbbENDjsfQqGPOcaeHpJQfAvCfnV8fBHBfF0/3C7DDzATwbwFcD/vk7UzN5I7KChjdHrPTnZ+fkFIKD7ef6/J1/LTm/EwHWorWFp2f17TZrvL4YottMs7PtRbb0JBjD4169QXsLa30ji72/4jz84+klL/psk3jjMVOLcMeRuxoKNEr5wTh3+3hKX5CSvlEh/tcATCPvYY+jC7CPiZ5oxBCbzbTUQgxi71hxOdbPFelnmE+ZkgBYw+NepWv+Xfj8Jfl/GzVszrk/Hym2YPOibR3Nnusg9eonAN1f4ttejEG+7hft7duTuj+nvPzbb0UfMC+5vycBPBel21qe/V/0+K5Kiddd3I+JA0ZBho1JYQ46vHcs9qFbxtP8K2svj/dYv8N5+ctLo//n2g9+83La3zB+XlcCPGJFttBCJHsdMUQKeUDHocy3W6PdvJ6jsedn+/uYl+/PAbgdeffn2x8UAgRB/B/OHfPSSlfbfFclS81j/WveKQaBhq5uQnA94UQ/1MI8THnMiQA7IZICHFCCPFF2FP6AfsE6MYp9Redn39PCOF2rOerzs9fFEL8k0qYCCHmhBCfB/CraH3cpO1rSCkfA/BF5+7vCyE+L4So9myEECNCiLuEEL8NuwGebfF6YfGo8/OIEOKA20bOe7WvcsPeTE4ASNc+5gRM4/4PtFpKrBVniPFXnbsfFEL8gRAi4zzvNQC+BOBm2MdPf7X5s9ifBQCHnbsMNHInpeSNt6tusM/Fkg23XdjhYjX8/gKAhSbPcbpmWwP2Qf/XALxWs8007GGkynOZsGc4Vvb7TwAecP79QDev4WyXAPB/NZR7C/Z0cLPh99cE/f/v8T161invL7bY5t4m76Pb7d4m+1f+72UP5fxUzWtYzvtbuV8G8I/b7P9PnG2fCfr/nLdw39hDo6aklP8f7BmHvwLg/4UdOruwA6gA4CXYlyT5CICTUsqrZqhJKR8H8GMAHgKwDvt4Ud3kDCnlOuzjK/8BdhCZsIPpUQAflTUrtLuUs+1rONuVpJS/6LzWA7AvqaIDmIC9gsijsGdZ3iylbLeyRVhU1j38hwN8jcoMxG91+wRSyk/BXvHlL2H/X4/DXh3kTwHcJV2uhVajUr9m6zwSVfECn0QRJYSYBPAm7GOMR6WUr7fZpdPnT8D+kjAG4P3SXorMV85Q9yuwe9MHpZStzlWjIcceGlFEOY37p2HP8Py1AbzEXbDD7OEgwszxa7Dr9+8YZtQOe2hEEeas2vIi7KHW66TLWpVdPvdvwj7+dZeUsushxx5e/xCAH8A+j/AdssNVaGj4MNCIIs5Zrf9eAF+TUrpddyxynKsrvB/AI9KeqUrUEgONiIiUwGNoRESkBAYaEREpgYFGRERKYKAREZESGGhERKQEBhoRESmhpwt8fvKTnxyWOf+zsNegUx3rqRbWUy3DUs+JT3/609vd7MgeGhERKYGBRkRESmCgERGREhhoRESkBAYaEREpgYFGRERKYKAREZESGGhERKQEBhoRESmBgUZEREpgoBERkRIYaEREpAQGGhERKYGBRkRESmCgERGREhhoRESkBAYaEREpgYFGRERKYKAREZESGGhERKQEBhoRESmBgUZEREpgoBERkRIYaEREpAQGGhERKYGBRkRESmCgERGREhhoRESkBAYaEREpgYFGRERKYKAREZESGGhERKQEBhoRESmBgUZEREpgoBERkRIYaEREpAQGGhERKYGBRkRESmCgERGREhhoRESkBAYaEREpgYFGRERKYKAREZESGGhERKQEBhoRESmBgUZEREpgoBERkRIYaEREpAQGGhERKYGBRkRESmCgERGREhhoRESkBAYaEREpgYFGRERKYKAREZESYj3uP9uXUoTciRMnVoUQvtZ1+pVXYutve5vh52suLi6uLi8vD8N7uorh+OyynmoZlnoWut2x10Bb6XH/SBBCzJ44ccK3uoqdHej79sE4dMivlwQAWJY1u7y8PAzv6SyG47PLeqplWOo5AWC7mx055BhCejYLPZsNuhhERJHCQAshfW0NWrEIkc8HXRQioshgoIWMKBSg7ewAAGLspRERecZACxl9ba3+31IGWBoiouhgoIVM7bEzUSpB47AjEZEnDLQQEfk8tGKx7ne1PTYiInLHQAuRZsfM9GyWw45ERB4w0MJCyqZT9UW5DG1rK4ACERFFCwMtJLR8HmJ3t+ljHHYkImqPgRYSrU6k5rAjEVF7DLQwkLJlL0wYBrSNDR8LREQUPQy0ENC2tiDK5ZbbcNiRiKg1BloIeAkrPZcDLMuH0hARRRMDLWgusxsbCdOEtr4++PIQEUUUAy1g2sYGhOHtsmdc25GIyB0DLWCdHBvTcjnANAdYGiKi6GKgBcmy7GNjHgnLgs5hRyKiphhoAdLW1yE67HHxwp9ERM0x0ALUzTExbX0d8HjMjYhomMSCLsBQsiw7mHZ2YE1ONt9GSkCIpg/F3noLxvw8kEgMroxERBHDQPOLE2J6NgvdGWrcvekmWBMTzbc3DCDW/O0Z+c53EF9ehjU5CTOTgZnJQDLciGjIMdAGyTShOyGmra9D9PnEaG1rC9rWFuKvvw5rYgJmOm2H2+hoX1+HiCgKGGj9ZhjQcznouZx9jplPq3to+Ty0fB7xS5dgjY/bPbd0GnJ83JfXJyIKGgOtH8plO8SyWeibm4GvjK8VCtAKBcTffBPW6OjesGQyGWi5iIgGiYHWJVEqQctm7RDL5wMPMTdasQhtcRHxxUVYo6OwnGFJ12N3REQRxUDrgNjdtQMsl4vkVaS1YhHa0hJiS0uQiUS152ZNTLjOqCQiigoGmgf7L15MJMbH+79Kh2m6n1M24HPNRKmE2PIyYsvLkCMjKB05MtDXIyIaNAaaB1eOHy8dPHYM2tZW9ViZKJV6f2Jdd52aD6D1Yz2SmgYrlbJ7adPTA30tIiI/sBXzSghYU1OwpqZQPnwY2va2PR0/l4NWLAZdOk+kptnH0NJpO8R0PegiERH1DQOtG0LAmpiwjz0dPgzhhJuezYYu3KSuw5yeto+VTU8DGlc7IyI1MdD6QCaTMJJJGIcOQRQK1WFJrVAIpjyxWPUka2tqiiFGREOBgdZncnwcxvg4jGuugSgW92ZF5vODfd14vHoytTU1xVmLRDR0GGgDJEdHYSwswFhYsKf8V3pufZryL0dG9npinHpPREOOgeYTOTICY24OxtwcUCpBz2YRe/NNSJfZhUJKSJeAsiYnUXr72yF5cjQRURUDLQiJBMy5Oeibm4itrXW2rxDYOXECiMcHUzYioojibIEAmTMzne8zNcUwIyJqgoEWIHN6GrLDGYjdhCAR0TBgoAVJ1+1zw7wSAmY6PbDiEBFFGQMtYJ30uLhEFRGROwZawDoZdjQzmQGXhogouhhoQdM0T8OI0uN2RETDioEWAl6GHS0uJkxE1BIDLQSsVAqyTVhxdiMRUWsMtDDQtJbHx6Sm2RNCiIjIFQMtJFr1wMx0mivmExG1wVYyJKypKdd1HTncSETUHgMtLIRoOuwodR1WKhVAgYiIooWBFiLNemJmJsPhRiIiD9hShog1OQmZSNT9jsONRETeMNDCpGHYUcZi9tWniYioLQZayNT2yMxMhlehJiLyiIEWMtbEBOTICAAONxIRdYKBFkJGJgOZSMCanAy6KEREkcFrkYSQOTMDISWHG4mIOtBroM32pRQhl0wmV+FjXWUyifiFCyPlI0d2/XpNADh27NiqpmnKv6dzc3Ory8vLrKciFhcXh6KeAHxthwJU6HbHXgNtpcf9I2F7e3sWftZVShRPnPDt5SomJydnT5w44et7qm1uBjGTc3Z+fp71HIAg6mlZ1uzy8vIwtEX+tkPBmQCw3c2OPIYWQtrGBvTLl4MuxsCJnR3E33wz6GIMnmEg/uqrgJRBl2SwpLTraRhBl4SGFAMthPS1Nei5HGCaQRdloPS1NWhbWxC7vo6s+k7P5aAVi9Dy+aCLMlDa1ha0YhH6+nrQRaEhxUALG8uCnstBWBb0jY2gSzNQ+tqa/TObDbgkg1Wtp/NTVcNSTwovBlrIaBsbEE7PTOWGQRQK0IpFAGrXE+Uy9M1NAE5wqzrsKGX1i4m+sQGUywEXiIYRAy1kaht3bX1d2WHHunpub0M44aYaPZerhpgol6E54aYabXMTonLsTEq73kQ+Y6CFiWnWNQTCGX5UUeMwo6q9tMZ6sZ5Eg8NACxF9YwPCsup/p2DDIPL56nBjhYr1RKkEfWur7ld6Ngs0vMeRZ1lXf0HZ2gJKpYAKRMOKgRYizRp1fWNDuWnQsSaTQLSdHYhC1+dThlKzY2bCNKEpNtmn9rhvVc0xNSK/MNDCwjTtY2aNVGsYpHTtjanWS2sW3IB69XSrj1v9iQaFgRYSlan6TR9TqAHU8nkIl6EolYJblErQGoYbK/RcTp1hxxbHebWtLdf3mmgQGGgh0Sq0VDoe0aqeWrEIsd3Vijeh06qewrKa98YjSF9fd/0iBqj1JYXCj4EWBobR+iRqVaZBexg+VaU32q4eqgzHtaunKu8nRQMDLQS8nHCrQsOgbW5CtDnhVoWGXhSL0Nr0NDUVljZzO+5bQ8vnlT3HkMKHgRYCXoZldAWOR3ipp9jdjfyah57qaVmRX/Ow3XBjdTsFvqRQNDDQglazNFI7kW4YOpitGfXeqNfys55E/cVAC1gn6/tFuWHQNjb2lkZqQ19bi+yah2JnB5rH8+m0KJ9jaBiez6fTCgWInZ0BF4iIgRa4TkJKy+cje6mVTuopymXXKe9h11E9I7y0WavTTJpuH+EvYxQdDLQAiSZLI7UTyYahi4Y7kvVE5+VmPYn6h4EWoG6OiUWxYdDW169eGqmNKF5qRWxvX7VGZTv65mb0LrXSwXHfCpXOMaTwYqAFqJtwiuLxiG6m4osOjtGERVdfNiK4tFm3Xzai+GWMoiUWdAGGjmlCX1+HvrYGM5mEsX9/8+0sC9Caf9+Iv/IKrHQaZiYDOTo6wML2wLKgbWxAz2YhNQ2lo0ddt3OrZ2xxEVY+b9dzfHyAhe2BlNA2N+0hVcPoqp76+jq03V2YmQysZBIQYoAF7pKU0La3oWezEMViV/XUNjcRf+01mOk0rKmpcNaTIo2B5gfDgJ7LQc/l7Nl+zsF046abYE1MuO6DWPO3J7a0hPilS4hfugRrfBxmJmM3+mNjg6qBN6YJ3QkxrWbSQOm662DOzDTfp0U99WwW8bfeQvytt2CNjsKshLjb/5lfLMsOsWzWnhzhzFQsHzoEc3a2+T4t6qltbyO2tITY0hJkImG/n+k0rMnJYBt9KaFtbdmf3Wy2eh6kMTvbVT2FYSB+6RJily9DxmLV99OamnINQaJOMNAGpVyuNgT65ubAjgdphQK0QgHxN9+0G/1KuCWTA3m9qxiG3ePM5exjZQNadFcrFqEtLSG+tAQ5MrLX6E9M+NPoO+sv6tmsfULxgFb5EKUSYsvLiC0vQ8bj9Y2+H/Ws9DgrYT2g43vCMBC7cgWxK1cgdR3m9LRdz+lphht1jYHWR6JUgpbN2o1BPu/7pAatWIS2uIj44iKs0dHqsKRrL7Bb5bIdYtmsvZyVzyvHi93d+h5NpZ797tFUhodzuboep19EuYzYygpiKyt2j6bS6KdS/W30a4aH9fV1z+cL9oswTcTW1hBbW4PUNPtzm07DnJ4GdN3XslC0MdB6JHZ3qz2xMJ07VenR1A1jVcKtm0a/VNrrcW5thWYGoiiVELt8uX/DWJUeZzZbNzwcNGEYiK2uIra6Wu3RWJkMzFSqu0bfGR7WBtzj7JSwLOhra9Ar4ZZK2Z/d6WnXoUyiCn5CuiCKRbthz2bbLkIbBt0OYwXd4+zUVcNYzjf9tsNYPg0P90ulR4NKo+/03Nr2aJyrOujZ7ECHh/ulcuK5nssBQsCcmqoONSMeD7p4FEIMNI9EobAXYhGbNl/rqmGsSqPvDGOJ3d29ekZ4kWBhmns9msowVm2PplSqHicKU4+zU8Kyqu+X1DRYtY1+LLY3ISmg4eG+kdIO440N4LXXYE5O7tWTyMFA82D/xYuJ2MwMtFyu4xNnWzJN97X8fDiOIQwD+toahGXBEALxt96KmalU/0PbsrqrZ59CRljW3uVapITY2dGg6/0P7RDUU9/YqNZTahqEadpDeP3sYUvZXT37FaZSQnfCWVgWkisrnEVCABhonlw5frx08PBh4PBhCOdcHD2b7T3cdL31cYEBHTNwm1W2Oz1tAIBx8CDEzs7eN/teh1U1rbt69jjBozocV5lgsPc6FgAY8/P28mOV97PXY6AB1bPdcJx54EB/h1WF6K6efZjIYlV6ZpkMZCIBANheXLSwuNjzc1P0MdA6JJNJGMkkjEOH7GHISqPvcYX1oHQ6YUKOjcEYG4OxsBCpYcimw4uttk8kYMzNwZibC+3El2aqEyacIeO2X37icZiV88dczosMJSHqhxedECNqhoHWAzk+DmN8HMY114RyooiMx/fO1+rhPCY5MgJjfr7aownbRJHqBJBep7QnEjAPHKjv0eRy9jBeGOrZyQSQVmIxmPv3w9y/f+/UhDBNFBECZu3sRk4AIY8YaH0iR0dhLCzs9WgCmsrflyn67Z5/bg5mbY8ml/N9dqCMxfbCOpXq/0nHjT2agKbyD/ykY12HOTNjr+RimvXno/k4lZ9T9Kkf+KkZADky4uswVmDLQjX2aAZ8svVAT6JuJRaDuW8fzH37XJf36qdms099oeuwMhlYmQzKlZOtnS8sgzjZutPhYaJ2GGiD1mwYq/bAvFvAtXoMgDU2thdifi1z1Uo87jqM1XU9pdxb5iosC/fqerU81eWwKudK9VLPIJa5asUJGyudRrlhOaye6tnJ+YFEHWKg+al2GKtcxuh3vtPVsM7u0aOw3BaHDYOGYayRixeRePnljp+mtLCA0o03DqCAfaJpdT2axAsvYOzNNzt+mvLMDIonTgQfYm6EgJVKwUqlUL72WsRefhljTz7Z8dOYU1Mo3nYbQ4wGhp+soDg9mk7JWAxWF/sFRtft3mmnhLCP00WFpsHopp4AzPn58IZZIyHs8nbBOHCAYUYDxU9XgFwvqdJqn0wmOo2fw8xkOt9naipys9us6WnIDo8DWaOj4Rgy7oBMJmF1eB0+qev2ECPRADHQAmRNTECOjHS0TzchGDSZSMCcnOxonyjWE5rW8VJMkawnOi+3mU6zd0YDx09YwIwOei8yHrdn90VQJw2g7CIYwqLjhj6qgdZhrzuq9aRoYaAFrJOGwZyZidxwY4WZTnsuu5VKRfY8JCuVgvRYdmt8PPirjHdJjo/D8lh2GYvZ7ynRgDHQAiYnJjwfj4j0t9wOhh0jXU8hPPcuI11PeC9/FI/7UjQx0ELASy9Njoz0/8rTPvPSAEpNs1eKiLCOGvoI81zPiAc3RQcDLQS8/MFHvfEDvH1Tt3pZozAkrKkpyDYzNK1kErLDmYJhI0dH7ZPdW20T4eO+FD0MtBDwcjyik8kjoRWL2UsctaDEt3kh2n4BUaKeaF8PDjeSnxhoIdGqYbBGR/1do3GAWtVTheHGirYN/bAEmiL1pGhgoIVEqz98FYYbK8zpaUiX85FUOlfJmpioXoDyqscmJ10fixqZSLgOKcpEIvLHfSla1Gg9FNDqeIRS33JjMdcVI5SqpxCu9VFi+LiGW32ifJoJRRMDLUSaNYDW2Bjk+HgApRmcZvWUuq7cuUpNG3oPx9eixu04mWrBTeHHQAuRZg2dUr0Wh5lKXTXsaGYyygw3VjQ7x9CcnAQUGW6sanKOoUrHfSk61GpBIq7ZuWYqBhp0HVbDycdK1hO46iRrZevZ8GVMtV4oRQMDLWRqGzwVzlVyUzscJWMx+6KWCqoLsA5WEYmaxmFHVYObwo2BFjK1Db3KjULtpVZUnjxQe6kVM5WK3CVxPIvH7Uv+QM3jvhQNDLSwqTkeofSwTc2K+krXE3tfTFhPosFioIWQOTPT1bXSosacmWl5HpMqzJmZSF8SxysznbbrqfDIAoVbNK/RoTgzkwGkDLoYA2elUjBmZ5UdbqyQY2Mw5ucje0kcz2IxGPPzkb0kDkVfr39hs30pRcglk8lV+FnXeNzzNbX66emnn16VUvr6nsaKRRjLy36+JBYWFlbn5+d9rafXSwT1U8b6vdUyrr3W1xedKACWv8fPjmUeW30W7xyGtsjfdig4hW537LXVXOlx/0jY3t6ehZ91LZchDMO3l6uQUs4+++yzyr+nmqbNzs/P+1pPrViE5ecLAijj2mvn5L96zdcX3QTg8wjyq9YvXQvgNX9fNRD+tkPBmQCw3c2OPIYWQno2i9jaWtDFoD4ROzuILS0BAXxJ8ZUBYBHATtAFoWHFQAshfW0NWj4PsbsbdFGoD/S1NQjLgp7LBV2UwcoBkACyQReEhhUDLWxKJehbWwDsnhpFn+70tpV/PyvV4+ACBYSBFjKxmkZP57Bj5IntbWjFIgBA39gAyuWASzQgZQAbzr+L6OGwPlH3GGghUxti2vY2hNMYUjTVfSmRUt1hx8ZqKd4ZpXBioIWI2N2Fls/X/Y69tGhrDDBl38/GAFO0mhRuDLQQaXaMRdkGcAiIfL463Fihb20BpVJAJRqQEuzp+rV20eXEa6LuMdBCpFl4aTs7EAUekIiiWLNJIFKqNznEbRSV38XIZwy0kBDFIrTt5l9p2UuLICld37emQRdlbh/PNdjT+Il8wkALiVahpdw3+iGg5fMQLkOL2taW62ORUwKQd3ms3OIxogFgoIVEq0DTikWIPFuGKGnXq1am192uGopUk6KBgRYColCAttN6vSDlhqlU5uE4mTKB1u5jWVk9hMgHil/PIhq8NG56Novy4cM+lIZ6pW1uQrQ5gbpyjqEMYBX+viniqpmMr68CF16zf27vAuMjwOyLwPGbgXcdA5yLlBMNBAMtBLwcI6uco2ZNTPhQIuqF196Xns3CWFgYcGkGyKmmYQJ//Djw+2eB715y33xmGvi7fwf45/8IuPVGX0pIQ4ZDjgFrdq6SG2WGqVTWwWogkX8/s8D3F4HbfxP4pw+0DjMAWFsH/vgrwImfADa2/CggDRv20ALWyQxGfW3NHnZU/ArPUaZtbHi+lp1WKEDs7ETzCs8F4MmLwH2fBXINw46zU8BN1wAHpoD1AvDiMvDKlfpthuCC7BQABlrAOpnsIcplaFtbsKamBlgi6kWnvS59bQ3GwYMDKs3gvPkicP/n68PsugPAf/hp4L6bAb1h7OeFIvCHTwB/+OdAgddLowHhkGOAurnmWeSHqVTWxTXPovp+/vLngCs1w4ZnbgCe+bfAj916dZgBwDuSwOd+FXjxr4EfutO3YtKQYaAFqJvGTM9mOV4TUtr6OoRpdrZPsQjhskJMWH31a8B/e2rv/jVp4C/+GTDRasKmCWADuOYA8NAfA1Oc20QDwEALSrkM/cqV9ts1EIYBrYv9aMAsC7HLl7vaVV9ais6XFAl85o/qf/UbHwL2TXrYdxmABWiafSPqNx5D81O5DD2Xg57NQt/cxO6NN7pPwzcMINb87Rn57neBpSWYmQzMTAYymRxgocmVZUFbX7ffz/V1GPPzKN1wQ/NtW7yf8Vdfxegzz8BMp2FmMvYx0jBN/JGwV9PPApdeBh69uPdQJgV8/F8ASDi/MODeqiwCeAbANIAMgBT4lZr6ioE2aKWS3eDlcvalQ2q/iQvh3nC1egz2UJW2uIj44iKs0VGY6TSsTIbnqQ2aaUJfX4eey0HL5SAsa++xbt9PISDKZcRWVhBbWYGMxWBOT9vhlkoF052xYF+BOgdgHXZQAfjz80BtlT9wNzAyUrOfcG7NCNhDj2vOTUN9uPGka+oRA20AxO5utSembQ3+hButWIS2tAQsLUEmEtWemzUxEa5v+lFlGHaIZbP2tPzaFn0AhGEgtrqK2OoqpK7Xh9sgl9pwjnNVQ6zJ4cBvvVx//4ff28PrWbCXzsrCDrsU7HCbBlsm6go/Nn0iikW7J5bNul4GxpdylEqILS8jtrwMGY+Hdxgr7BqGh4M6xiVME7G1NcTW1iA1DZYTbub0dH/CzYQdXlnYYdYmq595o/7+O9/eexEA2MOa684NsMMt7dzifXoNUh4DrQeiUKgOJ2ohvAjnVcNY6bQ9NBnUMFbYlUp7IdY4PBwCwrKqX5qkpsGamrLDLZ12PT7XlAG7F5aDHWIeq7lTAl5eqf/d9Ue8v2xHNpzbawCmsNdzS7jvQsRA65DI5/eGEz0uWRUGwjAQu3IFsStX6oexpqeHOtz8Hh7uF2FZ9jDo+jogBMzacIs36dKUYPd+KiHWhbV8fcYn4sBMurvn6simcwOACdjhlgYw4roHDSkGmgf7L15MxGdmoGezHZ8I3ZJp2rPfmvG4fFI3mg1jGfv3D+z1wmZ8ZUWLLS1BX1vr7/CwZXX3fvbaE5QS+sYG9I0N4LXXYE5MwJyZAUYKwA7sCRh9yOrNhhU+xkdRnSxS1epj248Ob965vQEgCSADxHMFzU46GnYMNA+uHD9eOrRvH6Sm9Xd4UddbDxV1MozUheowZOUY25AozM5axsyM/X7qev+GFzWtu/ezT8c2pabBSqWqQ8vQxoEx2BMudHQ0vNjMRmOgjaF5C+L2X9DPQ7g1w5Dl3fHBztKhyGCgeSTHx2GMj8M4eDA0E0C6wYkijkQC5oEDMA8c2JsAksvZvZyQHTtrpeVEEQv2X/h+59bhBJB2fP/oTDs3ThQhFwy0LsjRURgLCzAWFiJxDIZT+duIx2HOzsKcnfV9in43up7KrwOYcW4mqidLu03RbzTZsLTV9qAXGeZUfuoQPyI9kiMjMObmYMzNtT6J2mc82bpLsRjMfftg7ttnn0S9sWGHW+NJ1D7r+yxVHXvT4l1Oom6UarjKzUBWzefJ1tQDBlo/JRIw5+Zgzs0Fch6TNTZWHU7kclh9oOvVnm11mStnaLLTRYi74dvwsIa9cKtZ5grrAMp7m2UavheVykB2HchM9/j6teHK5bCoBwy0QfFpGMsaH99b0zGKF4qMCk2ze7uZDMqWBW1zs9ob93pBTy8CHx6uDPOlYIdbHtXVPJIAju4HXq1ZG/ul14E7p7t4nRj2QmwKDDHqCwaaHxqHsSrhtroK4TZj0rJch5VkLIby4cMw02nI0VbX7KCBcCZiWNPTKEsJbWvLPqWjUIC+stJ8nxbvpyiXYczP74VYWAgAk87tMIBt4MSx+kB7/mngzvmafSTcZzMWAMzCHk6cbLEdUZcYaH7TdZgzMzBnZjDy/PPQurjkSPHmm9kbCwshYE1NwZqaQuyNN5B49dWOn6J07bX2bMswEwAmgHffCXzl/N6vv/YY8PM3eXyOeQCHBlA2Igc7+gEyZ2Y63scaH2eYhVQ37yeEsI/RRcRP/Wj9KOjfXAR2y+7b14lONSmiGGgB6qYh66rRJF/IZBJWh0PA5tRU86WqQuroQeDu2/buZ7eBL37dw46jsA/CEQ0QAy1AMpGAOenlUr97GGjh1un7E8X381/+bP393/ofwGq7UzBrqmlZ9ddUI+oXBlrAOmnQrIkJyBGuyBpmnbyfUtPsJaoi5sM/DNx39979t3LA3/+PQL7VWt3OYMTSCvCBXwA28wMtIg0pBlrAzEzG89TsKH6bHzZybAzW+Linba1UauDrdQ7KH3wKmK4ZQnz0b4Hb/g3wP58FzMbe1zjw6hrwyc8Cx34UOPtNHwtKQyWaf00qicdhTk3Zawi2EaXJA8PMnJnxtIB1lL+gHD0I/Pd/D9z/r4Atp2f20mXg/s8Ds1PA8YPAgSl7QeMfrAEvvhlseWk4MNBCwMxk2gaaOTkJmeDVDaPAzGQQv3Sp5TZS0+zFhCPs9L3A138D+MjvA3+7tPf7lU3g4e+13pfLidIgcMgxBLwMO0b52/ywkaOjsNosPWal094XFQ4rHbjlZuA7vwX8x58BblxovfnMNPDzPwE88xUg1dlcKCJP2EMLg1gMZiplX324GSEiOXlgmJkzMy0vLWSoMnw8AyRywC+93769sgJceA24lAW2d4HxA8DsEeBdx+xb1DOcwo2BFhLmzIxroJmTkwCHGyPFnJlB/I03mj5WuYaZEqZhj/M4E0HeNmvfqm4FwI8u+YRDjiFhptOQLmv9cbgxemQiAcvlHEP7atKK/OlVVupvZgIMM/KVIn9VCtD15t/aI7Y0Eu1xG1ZU7guK28dTsWpS+DHQQqRZQ2dG+FylYddsso/Udfv8M5W4XYiTh33JZwy0EDFTqauGHZX7Nj9MmixtZmYy6gw3Vmi4upc2BQ43ku8U+8uKOF2vm80Y1aWRaE/jFxJlv6A0BhpHySkADLSQqW3wrOlpznOOODOdrg47yngc1tRUwCUakCnUz5nm9zAKAAMtZKxUCtIJMWW/zQ8TZ2kzoLN1OyNHYC/EpgFE54o4pBAGWtg4w4xS0+wJIRR5lS8myn9BqVSPw40UEE6fCyFzZgaQksONijDTaVijo7AmJoIuymBNAhiB3UMjCgADLYSsVIphppJYDOWjR9UdbqwQAI6CrQoFpteP3mz7TaIvmUyuws+6CoHRZ54ZKZw+vevbawLI5/P+1jMgL7zwwqplWcrX8z3XX1xdnvida/18zYkHvjqf/5X7ltpv2T8j2mNvAO9U/v0EMBR/nwDaX3vJRa+BttLj/pGwvb09Cx/rKra3UT5yxK+Xq5qYmPC1nkHZ3t6effbZZ5Wvp6b96OyJEyde8/M1k68+hC3zR4G4f7NCXsxeMwuo/37CDrNhqOcEAPeVvVvgpJAQ0tfWoK+t2cfRiCIi/tprGPv2tzF24ULQRaEhxUALoVg2C1EuQ9vaCrooRJ4lz561fz70UMAloWHFQAsZLZ+H2LUPnelrawGXhsgjKTHxta8BAJKPPw6USgEXiIYRAy1kakNMz2Y57EiRkPjBD6rXf9PyeYx/61sBl4iGEQMtTKS0Q8whDAPa5maABSLypnGYsTL8SOQnBlqIaFtbEA1DNRx2pNCTEhONgfb44xDFYkAFomHFQAuRZuGlZ7OAZQVQGiJvRr7/fcSW6k89E8Uixp94IqAS0bBioIVFw3BjhTBNaBsbARSIyBu3WY2c7Uh+Y6CFhLa5CWEYTR/jsCOFlmW5Hi8bf+IJiO2uzo8l6goDLSRahZaey3HYkUJp5LnnELtypeljolRC8tw5n0tEw4yBFgaW1XS4sUJYFvT1df/KQ+RR5dwzN8k2jxP1EwMtBLSNDQjTbLkNhx0pdAwDyUceabnJ2JNPcsUb8g0DLQS8hJW2vg60CT0iP40+84w9HN6CMAyMP/aYTyWiYcdAC5pltW0UAGfY0cN2RH5pPPfMdTsOO5JPGGgB09fXITxO+Gh1nI3IV+Uyko8+6mnTsQsXoPGzSz5goAWsk2Nj+vo64DK1n8hPY0895f3YmGV5Dj+iXjDQgmSa9rExr6TksCOFgtfhxur2HHYkHzDQAtTJcGN1H852pICJUgnjjz/e0T6j3/0u9JVhuNgyBYmBFqBuwknf3ATK5QGUhsibsSeegFYodLaTlEg+/PBgCkTkiAVdgKFUKlUXHTZmZppuIqSEFKLpY/FLl2DOzsKamBhkKYmuZprQNjeR/8AHmj4symXIeLz5Y6WSfeqJrg+yhDTEGGg+Ebu70HM56Nls9WD67k03uYeSYQCx5m/PyHe+g9iVK5CJBMxMBmYmYz+PSwAS9cQ0AdO0h8elRP6++5D/0IeabiryeUi3z3S5vHd5JF2H1DQ73Pi5pT5hoA2QKBahZ7N2iA1gkVZRKiG2vIzY8jJkPA4znbbDbWqKjQR1T0rAsuzVawZ1Mr9p2s9fLjPcqG8YaH0mCgU7xHK5zo8z9PK65TJiKyuIraxAxmJ2uKXTsFIpQOOhUmpDyr1emN8r0jDcqE8YaH0gtrf3emIhuEqvMAzErlyxhyV1Heb0tN1zm55muNGeIEPMTW24aRqkrjPcyDMGWjekhFYTYmJ3N+gSuRKmidjaGmJra5CaBssJN3N6mgfnh1EYQ8yNZdnlrISbptnHlRlu5IKB5pWU0La2qsOJ1YPbESKcy9To2awdbqnUXri5TEAhBUgJGIYdDlG9rl4l3AxjL9x0nSMOVIetmAf7L15MJMbH+39NMtN0X8pqwEtcVRY71nM5yJERlI4cGejrUUDKZdcrofdEyua/TiRcH+ubmnCT/CJGNfhp8ODK8eOlg+94R9Op9z3R9dY9owH+sXLK/5CIx+3zwhqm3vfM7fOSSPT+3O1w4gi5YKB1QI6MwJibgzE3Vz05Ws/loG9tDf5baR9Yo6P2zMdKiNHwcCZXSKD/4eYHXd+bIELkgoHWrUQC5twczLk5oFyu9tz0zc1QNRLW2Fj1/DSZTAZdHAqDKISbEHu9MIYYecRA64d4HObsLMzZWcAwoK+v28OSGxsdLz7cD9b4eHU4UY6N+f76FCG14eYclwos3Bhi1CMGWr/FYjD37YO5bx9gmna45XLQcrmBhps1MWGHWDoNOTo6sNchhWkakEjshVvlnLBBhhtDjPqIgTZIug5zZgbmzAxgWdCcnpu+vm43FD2yJif3emJ+HIyn4aFp9vT4eHwv3Po17b8SYrEYp91TXzHQ/KJp9mSMTAZly4K2sYHYq69CuH0rldJ1Bpc5PY3d+Xl/ZpQRVcINsAPNWeuxY0JAjowwxGhgGGhB0DRY6TSwtgatw2uiSU2DcewYT4SmYGha94HGafY0YPyqFCAjk+l4H4urelDQug0lhhkNGAMtQNb0tH1uTQfMLkKQqO86DSeGGfmAgRYkTYOZTnveXGqave4iUdAYaBRCDLSAmTMznre10mlObaZwYKBRCDHQAmalUp4XWO3mmBvRwHgNKYYZ+YSBFjQhPB0Xk7puTwghCgsGGoUMAy0EvAw7muk0z9+hcGGgUciwhQwBa3LSXpGhhU6OtRH5pl1YMczIRwy0MBCiZWDJWAxWKuVjgYg8YqBRiDDQQqLVcTQzk2HDQOHEQKMQYaCFhDUxYa9z1wSHGynU3EKLYUY+Y6CFhctsRxmPw5qcDKBARB4x0CgkGGgh0uw8Mw43UugJ0fwzys8t+YyBFiJyYgJWw8U5OdxIkdAYXgwzCgADLWRqhx1lIgFrYiLA0hB5xECjEGCghUxtj8ycmWHDQNFR+1nl55YCwEALGTk+DmtsDADXbqSIqYQYw4wCwkALIXNmBtboKCSHGylKGGgUMF76OITMTKa7S9wTBc1txiORD3oNtNm+lCLkksnkKnysqxwbg765GTMAw6/XBIBjx46tapqm/Hs6Nze3ury8rHw9r7vuOl8/twACWUA7n8/7X89gDEs9C93u2GugrfS4fyRsb2/Pws+6SondY8d8e7mKycnJ2RMnTvj7npZKQCLh60sCmJ2fn/e1nqJUggygnvD5b3T80UdRuPdeP18SExMTvtczIMNSzwkA293syGNoYWQYEKVS0KUYPMOAtrsbdCkGz7Igtrv6+4yWchn7PvtZaLlc0CWhIcVACyFRLkMYBiBl0EUZKFEuA4YBmGbQRRkoUSpBSGn3RhU29u1vQ8/lkHz00aCLQkOKgRY2UtphBgDlcrBlGbBKL1T13uiw1DN59iwAYML5SeQ3BlrYlMvVnplQOdAMozqTU+l6Wlb1C4oolZTtdYtSCcmvfx0AMPrss9BXVwMuEQ0jBlrI1DbuKg871vVWTNMOOAXV1lNA3fAe++Y3odUcJ0w+/HCApaFhxUALk9rhRoeqDWBjvZStZ8Mwo6rDjsmGYcbG+0R+YKCFSbNGXcUGsFy+6sRxJRt607zqCwoUHHYUOzsYP3eu7nejzz+P2NJSQCWiYcVAC5FmvRRhmsqtGtK0N2ZZyg07NgtpFYcdx594ounpFxx2JL8x0MKiyXBjhdvvo8qtN6ZaL21Y6uk2vMhhR/IbAy0kWn5rV6kBrJnF2Uipnotp2r3rZhQadhT5PMa/8Y2mj428+CJily75XCIaZgy0sGgRWioNO7bsnSg07NiqnqLN41GSPHeu5RcRnpNGfmKghYFluX+bd6jSe2lXD1UaetFmSS9V6pl86KHWjzPQyEcMtBDwcoxMiUDzMNSmRD0NA6JNj1q0GHqNCm1zE2NPPdVym8SrryL+8ss+lYiGHQMtDLx8W1dg2NFTWFlW5Jf88tr7inovLfnYY21HFgBggrMdyScMtKB5GG6siHTvRUrP5Y96Qz80gdZmuLFuu4j3RikaGGgB6ySkIh1oHQyxRbqeHoYbK0STE8yjQs9mMfr00562jb/1FhIvvjjgEhEx0ALXUeNtmpG91EpHvZEIX2ql015XVHtpyUcesS+J43V7Tg4hHzDQgmRZHQdUJHsvLU4adxPJeqL97Marto9qoHUYUBMcdiQfMNAC1E2jHcVVQ7qZ0RfJWYDlcke9FsB5PyM27KivrGD0u9/taJ/YygpGnn9+QCUisjHQAtRVLySKl1rpphcSwWHHbntbnfbqgtbtGo1eJ5EQdSsWdAGGjmlC7O5ClEqwEglgZKTjp9j3mc/AWFjAzh13YPeGGwBdH0BB+8CyACkhEwlIt3pKCQjR9KF9n/kMZCyGwqlTKN5+O2QiMcDC9kDKaj3NeLzpJgKAW98t/YUvIHblCgpnzqBw552QyeTAitoTKQHLws5tt2Hp859vuolWLMIaHW2++8gIRLEIqetALOb6vhN1i4HmB8OAKJXsIKs9ZpZMAi4NYKuGXt/YwMj3v4/k2bOwJiawc/vtdrjddJPdUATFadirt4p43L3xalFPLZ/H2JNPYuJv/gZybAyFu+5C4dQp7Lz73ZAujaZvmtWzRSMtW9WzVELy0UeRfPRRyHgcO+9+tx1u730vrMnJQZTeOyfEautZvu46lLXmgzsin4ecmGj+XKUSRLls/w2USoCuM9yorxhog2IY1Z6Y1/PMuqHl80g+9hiSjz0Ga3wcxVtvxc7Jk9h917v86dG4hVifiZ0dJB95BMlHHoEcGcHOyZMonDqFwl13+dej8aOe5TLGz5/H+PnzgK5j57bbUDhzBtv33AMrnR7Y69apBNigj2FWFnBmuFGfMND6qVzeC7EADvRrhQLGn3gC4088ATkyguItt2Dn5EkUb7mlvz0an0LMjdjdxfi5c/ZFJWMx7Nx+ux1u730vrKmp/r5YgPWEaWLsqacw9tRTmPnc51C85RZsnz6NwunTMPft6+9r+RVibhrDTdPscHPpCRI1w0DrValkB1hAIeZG7O5i7MknMfbkk5DxOIo334ziHXdg59Zbu+vRBBxirgwDY9/6Fsa+9S3M6Ppeo//e98LKZLp7zjDW07Iw+swzGH3mGcz83u9h953vxPaZM9g+cwbm3FznzxfW9xPYC7dyGdC0vZ4bw43aYKB1o1SC5oRYFKZci3IZYxcuYOzCBUzHYti98Ua753b77a2P0VQauwjUEQBgmhh9+mmMPv00Zn73d7F7/Di2T51C4dQpmPv3u+8X1obdjZQYef55jDz/PDJ/8AcoHTuG7Xvvxfbp0zAOHWq5X+Tqaln2F0WGG3nAQPNALxb3emERCTE3wjAw+txzGH3uOeCLX7TD7Y47sHP77fYxmqiFmBspMfLccxh57jm70b/hBjvcTp+GMT8fvYa9hcSLLyLx4otIf+ELKL3tbSicPo3tM2dgzM1Bjo2pU9dm4RbWGb4UCAaaB7HdXVFddqqfDX2LRkYUi+779asMUkJfXbVvuVx9oPVTixl+olh0rU8/TyLXr1xB7PJlxC5fhplK2Q29j0S57H4VgT7WM7a6Wq0nLEsvv/3t9gM+hZlMJv15LSkhpLRnjxI5GGge7KZSUo6N2Y2gZe1Nwe91eSYh3Kd5j466z/bqcbjFWFjAzsmT2Dl5EuVDh+pfp/a5m0zZ7kqLWWut6il7PAXBOHAAhXvuQeH0aezeeOPV/2+V1/WhByMTCcBt1mmP9TTTaRROncL2mTMo3npr7fPZ02uFsOvuR+97kDMUhaifDUnUgJ+KTmka5Oio3RBLWR9uIf62WD5yxB5aPHkSxsKCt52cBgRA/8JtwIxrrrEnhZw6hdL113trYGu/WERkeM7cvx/bp05h+957sXv8uLeht0o9/Qq3fhACiMU4vEieMNB6IQTkyIi9CkYl3CrH2ULQIJbe/nY7xO64A+aBA709WWO4hagxLF97rR1i99yD8tGjvfUSQhxuxvw8ts+cQeHMGXuFmF566s3CLSx1ZYhRlxho/dIYbjXnpPnWSAiB3WPHsHPHHSiePAmz22nrHl4n6G/6peuvtyc/3HNP65l9vQhBuJUPH8b2vfeicPo0StddN5ghPbd6+llXhhj1AQNtEISw1y9MJPbCbVAzJDWtOg1/57bbYE1P9/f52/Ex3Hbf+U77BOpTp2B0c+5VL3wMt9J111VnKpavvXYgr+HKz3DjNHzqMwbaoNWGG1B/DpthdLXGoXROIN654w77XDK3tfP85jaMZVmtexZujaWmoXjLLXaI3XNP/1fH6FazRr/y7y6fb/fGG+0QO30axsGD/Slnr1qFm1tdW3xuISVDjAaKgea3RMJeZR/2VPJuejMr//pf2wsbh1lNYyh2drq60vaVX//18K48X1Hb6Hd5RfHsJz4R/GLL7dTW01mntFNS03w/XYKGC78iBairP25dD3+YNeh2+r0cH+9zSQasyx6H66V1wqrbY1ycak8DxkALkNVFQxb6b/LNdNOQRXHV9W7K2+JcxNCqDCsPeh+iDvETFqR4vOPGvpsQDJwzg60TvZ5UHZhOG+2INvKyw3J3uj1RN/gpC1hHAaXr7hcEDTnZyTBV7TlvUdNNzyWKOn1/ovp+UqQw0ALWyRBiJIcbKzrpcUVxuLGikyHEKA43VnQyhMjhRvIJP2VBi8U897oiOdxY0cGwY0e9uTDyGlIRb+S9DiNyuJH8wk9aCHgKqg6CL6w8HRfr4nhb6HhtwKPe0Hv94hH1LygUGRH/i1KDl6HESPfOKnS9fe8l6mEGeBtKjOpQYy0vQ4kcbiQf8ZMWBroO2ab3FenjZxUeJntEfrixol1gKdLItxtO5HAj+YmftpBoeXJtF9P7w6rlsKMKw40V7RpyVRr6dl9AVPmCQpGgyF9V9LXqgSkx3FjRagajKmEGtB52VGG4saLVkCKHG8ln/LSFRYthRyWGG2u5BFdkT6Z2M6ArjoeN2zAxhxvJb/zEhUiz4JLxuHLDNk0bwCifTO3GrUFXraF3q49qX1Ao9BT7y4q2poGm0nBjRbNhx4ifktBUs2FH1cIMsC+R1FgvTVNraJUiQcG/rgjTtL3rpjmUG26saPj2rszsxkaNDb2qjXzD+8fhRgoCP3UhUxtgKg43VtQdL9M0Zes5FD004Or3T9X3k0JN0b+u6JIjI9VGUNneGVB/krXKx1pqhx1VDTNHtVfG4UYKiNp/YVFUM+yodKAB1SBTdrixotLQq97IO+8jhxspKPzkhZAcHbVDTfGGQcZiag83VgxJD636Pqr+flJoKTzWE11KzmxsxsOSX0pQ8ZQEFzLKl/6hyOs10Gb7UoqQe+GFF1Yty1K+rsvLy6tzc3OspyKGpZ4vvfTSKoajLRqWeha63bHXQFvpcf9I2N7enn322WeHoa6zy8vLrKc6hqaeGI62aFjqOQFgu5sdFR/UJyKiYcFAIyIiJTDQiIhICQw0IiJSAgONiIiUwEAjIiIlMNCIiEgJDDQiIlICA42IiJTAQCMiIiUw0IiISAkMNCIiUgIvH0NERHWmpqZw6NAhpFIp6LqOjY0NLC8vY2Ul3GsjM9CIiAgAMD8/jx/5kR/BsWPHoDW5IO2bb76Jhx9+GN/73vcCKF17DDQiIsLtt9+OH//xH0e8xUV3Dx48iI997GM4d+4cHnzwQR9L5w0DjYhoyF133XX4yZ/8ybpeWaFQwKVLl2AYBhYWFpBOp6uP3XPPPdjZ2cHZs2eDKK4rBhoR0RAbGxvDRz/60bowe/LJJ/Hggw+iVCoBAIQQuPPOO/GhD32out373vc+/OAHP8Drr78eSLmb4SxHIqIhdvfddyOZTFbvX7x4EV/5yleqYQYAUkp885vfxF/91V9Vf6dpGt7//vf7WtZ2GGhEREMqFovhPe95T/W+YRgtj42dP38ely9frt6//vrrsbCwMNAydoKBRkQ0pN72trfV9c5eeuklrK+vu24vpcSFCxfqfnf8+PFBFa9jDDQioiF17NixuvvPP/98230uXrzY8jmCxEAjIhpS1157bd39N954o+0+2WwW29vb1fsLCwtIJBL9LlpXGGhERENq//791X+Xy2VcuXLF036Li4vVf2uahn379vW9bN1goBERDaHJyUmMjIxU729ubkJK6WnfjY2NuvsMNCIiCsz09HTd/a2tLc/7bm5u1t2vPek6SDyxmohoCI2OjtbdLxQKdfdPnjyJ973vfYjFYrhw4QK++tWvVntwOzs7ddvW9vSCxEAjIhpCjWs2GoZR/ffhw4fx4Q9/uLoqyJkzZ5DP5/H1r3/9qm0BcFIIEREFpzGEakPqyJEjV622f/To0abbAleHY1AYaEREVOett9666ne1U/q9Th7xGwONiGgI1a7VCNjLYFW88sorePDBB7G5uYnt7W2cP38ejz/+eNNtAXvKfxjwGBoR0RBqDKHGkDp37hzOnTvXdN/GbRvDMSjsoRERDaHd3d26+2NjY573HR8fb/lcQWGgERENoVwuV3d/amrK876N2zY+V1AYaEREQ2hra6uuZzU1NQUhhKd9U6lU3f3V1dW+lq1bDDQioiFVG0TxeLxubcdWaq+BZlkW1tbW+l62bjDQiIiG1Kuvvlp3/9ChQ233yWQydddQW1xc5DE0IiIK1osvvlh338vFOhu3aXyOIDHQiIiG1CuvvFJ3bbPrr7/+qkWLawkhcPvtt9f9zstFQf3CQCMiGlKGYeAb3/hG9X4sFsP999/vuv3dd9+NAwcOVO+/9NJLTVcVCQoDjYhoiJ0/f76ul3b8+HF8+MMfrlvrUQiBu+66Cx/84Aerv7MsCw899JCvZW2HK4UQEQ2xnZ0dfOlLX8LHP/7x6oLEd955J44fP45Lly7BMAxcc801V13z7OzZs3j99deDKLIr9tCIiIbcSy+9hC9/+ct1y2Elk0nccMMNOH78+FVhdv78eZw9e9bvYrbFHhoREeHChQtYXFzEfffdh+uvv/6qy8cA9ir8Z8+exfe+970AStgeA42IiAAAS0tL+OIXv4ipqSkcPnwYqVQKmqZhc3MTy8vLuHz5ctBFbImBRkREdTY3N3Hx4sWgi9ExHkMjIiIlMNCIiEgJDDQiIlICA42IiJTAQCMiIiUw0IiISAkMNCIiUgIDjYiIlMBAIyIiJTDQiIhICUJKGXQZiIiIesYeGhERKYGBRkRESmCgERGREhhoRESkBAYaEREpgYFGRERKYKAREZESGGhERKQEBhoRESmBgUZEREpgoBERkRIYaEREpAQGGhERKYGBRkRESvj/ASqcmFvVU5+MAAAAAElFTkSuQmCC\n",
      "text/plain": [
       "<Figure size 525x525 with 1 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "plt.figure(figsize=(3.5,3.5), dpi=150)\n",
    "draw_policy(env, agent, (1,0), subplot_mode=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "F8ksCe4rH91H"
   },
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "colab": {
   "provenance": []
  },
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
