{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%matplotlib inline\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import pandas as pd\n",
    "from scipy.ndimage import gaussian_filter\n",
    "import seaborn as sns\n",
    "import os\n",
    "import glob\n",
    "import pickle\n",
    "sns.set_theme()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "experiment_name = \"FullTrackUnlimitedBuffer\"\n",
    "exp_paths = [\n",
    "            f\"./Experiments/pointbot/UARF/{experiment_name}NoSkip\",\n",
    "            f\"./Experiments/pointbot/BICHO/{experiment_name}\",\n",
    "            f\"./Experiments/pointbot/BASELINE/{experiment_name}\",\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "exp_summaries = [pd.read_csv(p + os.sep + 'joined_run.csv')[0:1000] for p in exp_paths]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "save_file_prefix = f\"{experiment_name}_\"\n",
    "colors = ['blue', 'red', 'green', 'brown', 'cyan', 'yellow', 'teal']\n",
    "labels = [\n",
    "     'UARF',\n",
    "     'BICHO',\n",
    "    'BASELINE',\n",
    "]\n",
    "figsize = (4,2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def generate_paper_plot(summaries, metric, ylabel, labels, colors, y_lim, save_file_prefix=save_file_prefix, divide_by_1000=False):\n",
    "    plt.figure(figsize=figsize, dpi=400, facecolor='w', edgecolor='k')\n",
    "    for i, s in enumerate(summaries):\n",
    "        v = s[metric] if metric != \"percent_new_experience\" else s[\"percent_new_experience\"] * s[\"buffer_last_train\"]\n",
    "        v = v/1000 if divide_by_1000 else v\n",
    "        plt.plot(gaussian_filter(v if metric != \"ep_reward\" else v * -1, sigma=2) if metric != \"percent_new_experience\" else v, color=colors[i], #, linestyle='solid',\n",
    "                linewidth=0.5 , label=labels[i],marker='o', linestyle='solid', markersize=0.5)\n",
    "        plt.vlines(30, -15000, 40000, color=\"teal\", linewidth=0.5, linestyle='solid')\n",
    "        plt.vlines(60, -15000, 40000, color=\"teal\", linewidth=0.5, linestyle='solid')\n",
    "        plt.vlines(90, -15000, 40000, color=\"teal\", linewidth=0.5, linestyle='solid')\n",
    "        plt.vlines(120, -15000, 40000, color=\"teal\", linewidth=0.5, linestyle='solid')\n",
    "        plt.vlines(150, -15000, 40000, color=\"teal\", linewidth=0.5, linestyle='solid')\n",
    "        plt.vlines(180, -15000, 40000, color=\"teal\", linewidth=0.5, linestyle='solid')\n",
    "        plt.vlines(210, -15000, 40000, color=\"teal\", linewidth=0.5, linestyle='solid')\n",
    "    if metric == \"percent_new_experience\":\n",
    "        plt.vlines(range(0,210), 0, exp_summaries[0][\"trained\"] * 200, label=\"UARF Trained\", color =\"c\", linestyle=\"dashed\", linewidth=0.5)\n",
    "    \n",
    "    plt.ylim(y_lim)\n",
    "    if metric == \"ep_reward\":\n",
    "        plt.legend(loc=4, prop={'size': 14})\n",
    "    elif metric == \"percent_new_experience\":\n",
    "        plt.legend(loc=1, prop={'size': 14})\n",
    "    else:\n",
    "        plt.legend(loc=2, prop={'size': 14})\n",
    "   \n",
    "    plt.xlabel('Episode')\n",
    "    plt.ylabel(ylabel + \" [1e3]\" if divide_by_1000 else ylabel)\n",
    "    plt.savefig(\"./images/\" + save_file_prefix + metric + '.png', bbox_inches='tight')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# increase fonts size for this plots\n",
    "MEDIUM_SIZE = 18\n",
    "plt.rc('ytick', labelsize=MEDIUM_SIZE)    # fontsize of the tick labels\n",
    "plt.rc('font', size=MEDIUM_SIZE)          # controls default text sizes\n",
    "plt.rc('axes', titlesize=MEDIUM_SIZE)     # fontsize of the axes title\n",
    "plt.rc('axes', labelsize=MEDIUM_SIZE)    # fontsize of the x and y labels"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# increase the aspect ratio just for this plots\n",
    "figsize = (4,3)\n",
    "generate_paper_plot(exp_summaries, 'ep_reward', \"Episode Reward\", labels, colors, [0, 2.100], save_file_prefix, True)\n",
    "generate_paper_plot(exp_summaries, 'buffer_size', \"Buffer Size\", labels, colors, [0, 20], save_file_prefix, True)\n",
    "generate_paper_plot(exp_summaries[:1], 'buffer_size', \"Buffer Size\", labels, colors, [0, 1.3], \"FullTrackUnlimitedBuffer_UARF_only_\", True)\n",
    "generate_paper_plot(exp_summaries, 'run_wall_time',\"Per Episode Wall Time\", labels, colors, [0, 50], save_file_prefix)\n",
    "generate_paper_plot(exp_summaries[:2], 'percent_new_experience',\"Experiences Added\", [\"UARF\", \"BASELINE/BICHO\"], colors, [-5, 120], save_file_prefix)\n",
    "\n",
    "# set back to default\n",
    "figsize = (4,2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def load_buffers(path):\n",
    "    replay_buffers = []\n",
    "    buffer_paths = sorted(glob.glob(path))\n",
    "    for i in range(len(buffer_paths)):\n",
    "        with open(buffer_paths[i], 'rb') as f:\n",
    "            replay_buffers.append(pickle.load(f))\n",
    "    return replay_buffers"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_maneuvers(buffers):\n",
    "    maneuvers_by_method = pd.DataFrame([x['maneuvers'] for x in buffers])\n",
    "    maneuvers_by_method = maneuvers_by_method.transpose().rename(columns={0: 'BASELINE', 1 : 'BICHO', 2: 'UARF'})\n",
    "    maneuvers_by_method.fillna(-1, inplace=True)\n",
    "    maneuvers_by_method = maneuvers_by_method.astype('int32')\n",
    "    return maneuvers_by_method"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "replay_buffers = load_buffers('Experiments/pointbot/*/FullTrackUnlimitedBuffer/run6/buffers/replay_buffer.pkl')\n",
    "replay_buffers.append(load_buffers('Experiments/pointbot/*/FullTrackUnlimitedBufferNoSkip/run6/buffers/replay_buffer.pkl')[0])\n",
    "maneuver_lengths = {\n",
    "\n",
    "            \"c1\" :          100,\n",
    "            \"c1_i\" :          100,\n",
    "            \"c14\" :        100,\n",
    "            \"c14_i\" :        100,\n",
    "            \"straight\" :      100,\n",
    "            \"chicane\" :    50,\n",
    "            \"chicane_i\" :    50\n",
    "}\n",
    "maneuvers_list = ['c1', 'c1_i', 'chicane', 'chicane_i', 'c14', 'c14_i', 'straight']\n",
    "maneuvers_by_method = get_maneuvers(replay_buffers)\n",
    "maneuvers_by_method"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "x = list(maneuvers_by_method.columns)\n",
    "\n",
    "method_maneuver_percentages = []\n",
    "maneuvers_total_counts = []\n",
    "for column in x:\n",
    "    maneuvers_total_count = maneuvers_by_method[column].replace(-1, np.nan).count()\n",
    "    maneuvers_total_counts.append(maneuvers_total_count)\n",
    "    maneuvers = list(maneuvers_by_method[column])\n",
    "    method_maneuver_percentage = []\n",
    "    for maneuver in range(len(maneuvers_list)):\n",
    "        method_maneuver_percentage.append(maneuvers.count(maneuver))\n",
    "    method_maneuver_percentages.append(method_maneuver_percentage)\n",
    "\n",
    "y1 = np.array([item[0] for item in method_maneuver_percentages])/1e4 \n",
    "y2 = np.array([item[1] for item in method_maneuver_percentages])/1e4\n",
    "y3 = np.array([item[2] for item in method_maneuver_percentages])/1e4\n",
    "y4 = np.array([item[3] for item in method_maneuver_percentages])/1e4\n",
    "y5 = np.array([item[4] for item in method_maneuver_percentages])/1e4\n",
    "y6 = np.array([item[5] for item in method_maneuver_percentages])/1e4\n",
    "y7 = np.array([item[6] for item in method_maneuver_percentages])/1e4\n",
    "    \n",
    "plt.figure(num=None, figsize=figsize, dpi=400, facecolor='w', edgecolor='k')\n",
    "plt.bar(x, y1, color = colors[0], label = maneuvers_list[0])\n",
    "plt.bar(x, y2, bottom = y1, color = colors[1], label = maneuvers_list[1])\n",
    "plt.bar(x, y3, bottom = y1 + y2, color = colors[2], label = maneuvers_list[2])\n",
    "plt.bar(x, y4, bottom = y1 + y2 + y3, color = colors[3], label = maneuvers_list[3])\n",
    "plt.bar(x, y5, bottom = y1 + y2 + y3 + y4, color = colors[4], label = maneuvers_list[4])\n",
    "plt.bar(x, y6, bottom = y1 + y2 + y3 + y4 + y5, color = colors[5], label = maneuvers_list[5])\n",
    "plt.bar(x, y7, bottom = y1 + y2 + y3 + y4 + y5 + y6, color = colors[6], label = maneuvers_list[6])\n",
    "\n",
    "plt.ylabel('Buffer Size [1e4]')\n",
    "plt.title('Diversity of Final Trained Buffer')\n",
    "plt.legend(loc=3, prop={'size': 5}, ncol = 3)\n",
    "plt.savefig('images/' + 'FullTrackUnlimited_diversity.png',bbox_inches='tight')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "plt.figure(num=None, figsize=(3,4), dpi=400, facecolor='w', edgecolor='k')\n",
    "plt.bar(x[2], y1[2], color = colors[0], label = maneuvers_list[0])\n",
    "plt.bar(x[2], y2[2], bottom = y1[2], color = colors[1], label = maneuvers_list[1])\n",
    "plt.bar(x[2], y3[2], bottom = y1[2] + y2[2], color = colors[2], label = maneuvers_list[2])\n",
    "plt.bar(x[2], y4[2], bottom = y1[2] + y2[2] + y3[2], color = colors[3], label = maneuvers_list[3])\n",
    "plt.bar(x[2], y5[2], bottom = y1[2] + y2[2] + y3[2] + y4[2], color = colors[4], label = maneuvers_list[4])\n",
    "plt.bar(x[2], y6[2], bottom = y1[2] + y2[2] + y3[2] + y4[2] + y5[2], color = colors[5], label = maneuvers_list[5])\n",
    "plt.bar(x[2], y7[2], bottom = y1[2] + y2[2] + y3[2] + y4[2] + y5[2] + y6[2], color = colors[6], label = maneuvers_list[6])\n",
    "\n",
    "plt.savefig('images/' + 'FullTrackUnlimited_diversity_UARF_ONLY.png',bbox_inches='tight')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "path = \"../mbrl_rb_crop_results/Experiments/pointbot/UARF/REWORK/Sector1UnlimitedBufferNoSkip/run0/episodes/\"\n",
    "episodes = sorted(glob.glob(path + \"episode*.csv\"))\n",
    "episodes"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "all_episodes_csv = {}\n",
    "for i, episode in enumerate(episodes):\n",
    "    df = pd.read_csv(episode)\n",
    "    all_episodes_csv[episodes[i][100:-4]] = df\n",
    "all_episodes_csv"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def plot_recalculation_schedule(df, image_name, episode_num):\n",
    "    fig, ax1 = plt.subplots(figsize=(2.,2), dpi=400, facecolor=\"w\", edgecolor=\"k\")\n",
    "    ax2 = ax1.twinx()\n",
    "    x = df.index\n",
    "    add_to_buffer = df[\"Added to Buffer\"]\n",
    "    reward = df[\"Rewards\"] * -1\n",
    "    ax1.plot(x, reward, color=\"red\", label=\"Reward\", linewidth=0.5 , marker='o', linestyle='solid', markersize=0.5)\n",
    "    ax1.legend(loc=2, prop={'size': 6})\n",
    "    ax1.set_ylabel(\"Reward\")\n",
    "    ax1.set_title(f\"Sector1: Episode {episode_num}\")\n",
    "    ax1.set_xlabel(\"Steps\")\n",
    "    \n",
    "    ax2.plot(x, add_to_buffer.cumsum(), color=\"blue\", label=\"Cum. Adds to Buffer\", linewidth=0.5 , marker='o', linestyle='solid', markersize=0.5)\n",
    "    ax2.fill_between(x, add_to_buffer.cumsum(), color=\"blue\", alpha=0.1)\n",
    "    ax2.legend(loc=1, prop={'size': 6})\n",
    "    ax2.set_ylabel(\"Steps\")\n",
    "    ax2.set_ylim((-10,300))\n",
    "    \n",
    "    fig.savefig(image_name)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def plot_recalculation_schedule_test(dfs, image_name, episode_num):\n",
    "    fig, axs = plt.subplots(1,len(dfs), figsize=(8,2), dpi=400, facecolor=\"w\", edgecolor=\"k\")\n",
    "    for i, ax in enumerate(axs):\n",
    "        x = dfs[i].index\n",
    "        add_to_buffer = dfs[i][\"Added to Buffer\"]\n",
    "        reward = dfs[i][\"Rewards\"] * -1\n",
    "        line1, = ax.plot(x, reward, color=\"red\", label=\"Reward\", linewidth=0.5 , marker='o', linestyle='solid', markersize=0.5)\n",
    "        ax.set_title(f\"Sector1: Episode {episode_num[i]}\")\n",
    "        \n",
    "        \n",
    "        ax_ = ax.twinx()\n",
    "        line2, = ax_.plot(x, add_to_buffer.cumsum(), color=\"blue\", label=\"Cumulative Steps to Buffer\", linewidth=0.5 , marker='o', linestyle='solid', markersize=0.5)\n",
    "        ax_.fill_between(x, add_to_buffer.cumsum(), color=\"blue\", alpha=0.1)\n",
    "        ax_.set_ylim((-10, 300))\n",
    "        \n",
    "        if i == 0:\n",
    "            ax.get_yaxis().set_visible(True)\n",
    "            ax.set_ylabel(\"Reward\")\n",
    "        else:\n",
    "            ax.get_yaxis().set_visible(False)\n",
    "            \n",
    "        if i == 1:\n",
    "            ax.legend(handles = [line1, line2],loc='upper center', \n",
    "             bbox_to_anchor=(0.5, -0.4),fancybox=False, shadow=False, ncol=2)\n",
    "            ax.set_xlabel(\"Step\")\n",
    "        \n",
    "        \n",
    "        if i == len(dfs) - 1:\n",
    "            ax_.get_yaxis().set_visible(True)\n",
    "            ax_.set_ylabel(\"Steps\")\n",
    "        else:\n",
    "            ax_.get_yaxis().set_visible(False)\n",
    "        \n",
    "            \n",
    "        fig.savefig(image_name, bbox_inches='tight')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "plot_recalculation_schedule_test([all_episodes_csv[\"episode1\"], all_episodes_csv[\"episode4\"], all_episodes_csv[\"episode99\"]], \"images/Sector1UnlimitedBufferAddToBufferSchedule.png\", [1, 4, 99])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "plot_recalculation_schedule(all_episodes_csv[\"episode1\"], \"images/Sector1UnlimitedBufferAddToBufferSchedule1.png\", 1)\n",
    "plot_recalculation_schedule(all_episodes_csv[\"episode4\"], \"images/Sector1UnlimitedBufferAddToBufferSchedule4.png\", 4)\n",
    "plot_recalculation_schedule(all_episodes_csv[\"episode99\"], \"images/Sector1UnlimitedBufferAddToBufferSchedule99.png\", 99)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "path = \"<>/Projects/mbrl_rb_crop/Experiments/pointbot/*/FullTrackUnlimitedBuffer*Test/run0/episodes/\"\n",
    "episodes = glob.glob(path + \"episode*.csv\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "all_episodes_csv = {}\n",
    "labels = [\"BASELINE\", \"BICHO\", \"UARF\"]\n",
    "for i, episode in enumerate(episodes):\n",
    "    df = pd.read_csv(episode)\n",
    "    all_episodes_csv[labels[i]] = df\n",
    "all_episodes_csv"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def plot_cumulative_rewards(dfs, image_name, flip_sign = False):\n",
    "    flip_sign = -1 if flip_sign else 1\n",
    "    colors = ['blue', 'red', 'green', 'green', 'brown', 'cyan', 'yellow', 'green', 'teal']\n",
    "    fig, ax = plt.subplots(figsize=(4,2), dpi=400, facecolor=\"w\", edgecolor=\"k\")\n",
    "    x = df.index\n",
    "    #reward_baseline = flip_sign * dfs[\"BASELINE\"][\"Rewards_mean\"].cumsum()\n",
    "    reward_bicho = flip_sign * dfs[\"BICHO\"][\"Rewards\"].cumsum()\n",
    "    reward_uarf = flip_sign * dfs[\"UARF\"][\"Rewards\"].cumsum()\n",
    "    reward_baseline = flip_sign * dfs[\"BASELINE\"][\"Rewards\"].cumsum()\n",
    "    #ax.plot(x, reward_baseline, color=colors[0], linewidth=0.5 , marker='o', linestyle='solid', markersize=0.5, label = 'BASELINE')\n",
    "    ax.plot(x, reward_bicho/1000, color=colors[1], linewidth=0.5 , marker='o', linestyle='solid', markersize=0.5, label = 'BICHO')\n",
    "    ax.plot(x, reward_uarf/1000, color=colors[0], linewidth=0.5 , marker='o', linestyle='solid', markersize=0.5, label = 'UARF')\n",
    "    ax.plot(x, reward_baseline/1000, color=colors[2], linewidth=0.5 , marker='o', linestyle='solid', markersize=0.5, label = 'BASELINE')\n",
    "    ax.set_ylabel(\"Reward [1e3]\")\n",
    "    ax.set_xlabel(\"Step\")\n",
    "    plt.legend(loc=3, prop={'size': 9})\n",
    "    plt.savefig(image_name,bbox_inches='tight')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "plot_cumulative_rewards(all_episodes_csv, \"./images/FullTrackUnlimited_TestRewards.png\", True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.6.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
