{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 60,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pickle\n",
    "import matplotlib\n",
    "import matplotlib.pyplot as plt\n",
    "import matplotlib.ticker as ticker\n",
    "from matplotlib.backends.backend_pdf import PdfPages\n",
    "\n",
    "matplotlib.use('PDF')\n",
    "matplotlib.rcParams['ps.useafm'] = True\n",
    "matplotlib.rcParams['pdf.use14corefonts'] = True\n",
    "matplotlib.rcParams['text.usetex'] = True\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 61,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "C:\\Users\\admin\\AppData\\Local\\Temp\\ipykernel_28520\\1193690165.py:32: UserWarning: Matplotlib is currently using pdf, which is a non-GUI backend, so cannot show the figure.\n",
      "  plt.show()\n"
     ]
    }
   ],
   "source": [
    "with open('Data/Training-reward.pkl', 'rb') as f:\n",
    "    data = pickle.load(f)\n",
    "\n",
    "ours_goal_rates0 = data['ours_goal_rates0']\n",
    "coptidice_goal_rates0 = data['coptidice_goal_rates0']\n",
    "ours_goal_rates25 = data['ours_goal_rates25']\n",
    "coptidice_goal_rates25 = data['coptidice_goal_rates25']\n",
    "ours_goal_rates50 = data['ours_goal_rates50']\n",
    "coptidice_goal_rates50 = data['coptidice_goal_rates50']\n",
    "ours_goal_rates75 = data['ours_goal_rates75']\n",
    "coptidice_goal_rates75 = data['coptidice_goal_rates75']\n",
    "\n",
    "plt.figure(figsize=(8, 6))\n",
    "plt.plot(ours_goal_rates75, label='Ours with 75\\% optimal data', linestyle='solid', color='red')\n",
    "plt.plot(ours_goal_rates50, label='Ours with 50\\% optimal data', linestyle='dashdot', color='red')\n",
    "plt.plot(ours_goal_rates25, label='Ours with 25\\% optimal data', linestyle='dashed', color='red')\n",
    "plt.plot(ours_goal_rates0, label='Ours with 0\\% optimal data', linestyle='dotted', color='red')\n",
    "\n",
    "plt.plot(coptidice_goal_rates75, label='COptiDICE with 75\\% optimal data', linestyle='solid', color='blue')\n",
    "plt.plot(coptidice_goal_rates50, label='COptiDICE with 50\\% optimal data', linestyle='dashdot', color='blue')\n",
    "plt.plot(coptidice_goal_rates25, label='COptiDICE with 25\\% optimal data', linestyle='dashed', color='blue')\n",
    "plt.plot(coptidice_goal_rates0, label='COptiDICE with 0\\% optimal data', linestyle='dotted', color='blue')\n",
    "\n",
    "\n",
    "plt.legend(fontsize=10)\n",
    "plt.text(1.0, -0.037, r'$\\times 10^3$', verticalalignment='center', horizontalalignment='left', transform=plt.gca().transAxes, fontsize=15)\n",
    "plt.xlabel('Training step', fontsize=15)\n",
    "plt.ylabel('Reward', fontsize=15)\n",
    "plt.xticks(fontsize=15)\n",
    "plt.yticks(fontsize=15)\n",
    "plt.savefig('Figure/Training-reward.pdf', dpi=1200, bbox_inches='tight')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 62,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "C:\\Users\\admin\\AppData\\Local\\Temp\\ipykernel_28520\\2755004986.py:31: UserWarning: Matplotlib is currently using pdf, which is a non-GUI backend, so cannot show the figure.\n",
      "  plt.show()\n"
     ]
    }
   ],
   "source": [
    "with open('Data/Training-cost.pkl', 'rb') as f:\n",
    "    cost = pickle.load(f)\n",
    "\n",
    "ours_cost_0 = cost['ours_cost_0']\n",
    "ours_cost_25 = cost['ours_cost_25']\n",
    "ours_cost_50 = cost['ours_cost_50']\n",
    "ours_cost_75 = cost['ours_cost_75']\n",
    "coptidice_cost_0 = cost['coptidice_cost_0']\n",
    "coptidice_cost_25 = cost['coptidice_cost_25']\n",
    "coptidice_cost_50 = cost['coptidice_cost_50']\n",
    "coptidice_cost_75 = cost['coptidice_cost_75']\n",
    "\n",
    "plt.figure(figsize=(8, 6))\n",
    "plt.plot(ours_cost_75, label='Ours with 75\\% optimal data', linestyle='solid', color='red')\n",
    "plt.plot(ours_cost_50, label='Ours with 50\\% optimal data', linestyle='dashdot', color='red')\n",
    "plt.plot(ours_cost_25, label='Ours with 25\\% optimal data', linestyle='dashed', color='red')\n",
    "plt.plot(ours_cost_0, label='Ours with 0\\% optimal data', linestyle='dotted', color='red')\n",
    "\n",
    "plt.plot(coptidice_cost_75, label='COptiDICE with 75\\% optimal data', linestyle='solid', color='blue')\n",
    "plt.plot(coptidice_cost_50, label='COptiDICE with 50\\% optimal data', linestyle='dashdot', color='blue')\n",
    "plt.plot(coptidice_cost_25, label='COptiDICE with 25\\% optimal data', linestyle='dashed', color='blue')\n",
    "plt.plot(coptidice_cost_0, label='COptiDICE with 0\\% optimal data', linestyle='dotted', color='blue')\n",
    "\n",
    "plt.legend(fontsize=10)\n",
    "plt.text(1.0, -0.037, r'$\\times 10^3$', verticalalignment='center', horizontalalignment='left', transform=plt.gca().transAxes, fontsize=15)\n",
    "plt.xlabel('Training step', fontsize=15)\n",
    "plt.ylabel('Cost', fontsize=15)\n",
    "plt.xticks(fontsize=15)\n",
    "plt.yticks(fontsize=15)\n",
    "plt.savefig('Figure/Training-cost.pdf', dpi=1200, bbox_inches='tight')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 63,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "dict_keys(['datasizes', 'except_bc_seed', 'alg_goalrate', 'coptidice_goalrate', 'ours_holerate', 'coptidice_holerate', 'alg_goalrate_bc', 'alg_holerate_bc', 'seed_bc'])\n"
     ]
    }
   ],
   "source": [
    "import json\n",
    "import numpy as np\n",
    "\n",
    "with open('Data/datasize_figure.json', 'r') as f:\n",
    "    data = json.load(f)\n",
    "\n",
    "print(data.keys())\n",
    "coptidice_goalrate = np.array(data['coptidice_goalrate'])\n",
    "coptidice_goalrate_fig = np.delete(coptidice_goalrate, [4,5,6,7], 1)\n",
    "datasize = data['datasizes']\n",
    "alg_goalrate = np.array(data['alg_goalrate'])\n",
    "alg_goalrate_bc = np.array(data['alg_goalrate_bc'])\n",
    "\n",
    "avg_alg_goalrate = np.mean(alg_goalrate, axis=1)\n",
    "half_std_alg_goalrate = np.std(alg_goalrate, axis=1) / 2.0\n",
    "avg_alg_goalrate_bc = np.mean(alg_goalrate, axis=1)\n",
    "half_std_alg_goalrate_bc = np.std(alg_goalrate, axis=1) / 2.0\n",
    "avg_coptidice_goalrate = np.mean(coptidice_goalrate_fig, axis=1)\n",
    "half_std_coptidice_goalrate = np.std(coptidice_goalrate_fig, axis=1) / 2.0\n",
    "\n",
    "lower_bound_alg_goalrate = avg_alg_goalrate - half_std_alg_goalrate\n",
    "upper_bound_alg_goalrate = avg_alg_goalrate + half_std_alg_goalrate\n",
    "lower_bound_alg_goalrate_bc = avg_alg_goalrate_bc - half_std_alg_goalrate_bc\n",
    "upper_bound_alg_goalrate_bc = avg_alg_goalrate_bc + half_std_alg_goalrate_bc\n",
    "lower_bound_coptidice_goalrate = avg_coptidice_goalrate - half_std_coptidice_goalrate\n",
    "upper_bound_coptidice_goalrate = avg_coptidice_goalrate + half_std_coptidice_goalrate"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 64,
   "metadata": {},
   "outputs": [],
   "source": [
    "import matplotlib\n",
    "import matplotlib.pyplot as plt\n",
    "import matplotlib.ticker as ticker\n",
    "from matplotlib.backends.backend_pdf import PdfPages\n",
    "\n",
    "matplotlib.use('PDF')\n",
    "matplotlib.rcParams['ps.useafm'] = True\n",
    "matplotlib.rcParams['pdf.use14corefonts'] = True\n",
    "matplotlib.rcParams['text.usetex'] = True\n",
    "plt.figure(figsize=(8, 6))\n",
    "plt.plot(datasize, avg_alg_goalrate, label='Ours', linestyle='solid', color='red')\n",
    "plt.fill_between(datasize, lower_bound_alg_goalrate, upper_bound_alg_goalrate, color='red', alpha=0.2)\n",
    "plt.plot(datasize, avg_coptidice_goalrate, label='COptiDICE', linestyle='solid', color='blue')\n",
    "plt.fill_between(datasize, lower_bound_coptidice_goalrate, upper_bound_coptidice_goalrate, color='blue', alpha=0.2)\n",
    "plt.legend(fontsize=12, loc=(0.7, 0.7))\n",
    "plt.xscale('log')\n",
    "plt.xlabel('Datasize', fontsize=15)\n",
    "plt.ylabel('Reward', fontsize=15)\n",
    "plt.ylim(bottom=0.4)\n",
    "plt.xticks(fontsize=15)\n",
    "plt.yticks(fontsize=15)\n",
    "plt.savefig('Figure/Reward-with-datasize.pdf', dpi=1200, bbox_inches='tight')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 65,
   "metadata": {},
   "outputs": [],
   "source": [
    "with open('Data/Datasize-cost.pkl', 'rb') as f:\n",
    "    cost = pickle.load(f)\n",
    "\n",
    "ours_cost_list = cost['ours_cost']\n",
    "coptidice_cost_list = cost['coptidice_cost']\n",
    "\n",
    "avg_ours_cost = np.mean(ours_cost_list, axis=1).squeeze()\n",
    "avg_coptidice_cost = np.mean(coptidice_cost_list, axis=1).squeeze()\n",
    "\n",
    "std_ours_cost = np.std(ours_cost_list, axis=1).squeeze()\n",
    "std_coptidice_cost = np.std(coptidice_cost_list, axis=1).squeeze()\n",
    "\n",
    "ours_cost_lower_bound = avg_ours_cost - std_ours_cost\n",
    "ours_cost_upper_bound = avg_ours_cost + std_ours_cost\n",
    "coptidice_cost_lower_bound = avg_coptidice_cost - std_coptidice_cost\n",
    "coptidice_cost_upper_bound = avg_coptidice_cost + std_coptidice_cost"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 66,
   "metadata": {},
   "outputs": [],
   "source": [
    "plt.figure(figsize=(8, 6))\n",
    "plt.plot(datasize, avg_ours_cost, label='Ours', linestyle='solid', color='red')\n",
    "plt.fill_between(datasize, ours_cost_lower_bound, ours_cost_upper_bound, color='red', alpha=0.2)\n",
    "plt.plot(datasize, avg_coptidice_cost, label='COptiDICE', linestyle='solid', color='blue')\n",
    "plt.fill_between(datasize, coptidice_cost_lower_bound, coptidice_cost_upper_bound, color='blue', alpha=0.2)\n",
    "plt.legend(fontsize=12)\n",
    "plt.xscale('log')\n",
    "plt.xlabel('Datasize', fontsize=15)\n",
    "plt.ylabel('Cost', fontsize=15)\n",
    "plt.xticks(fontsize=15)\n",
    "plt.yticks(fontsize=15)\n",
    "plt.savefig('Figure/Cost-with-datasize.pdf', dpi=1200, bbox_inches='tight')"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "osrl",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.0"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
