{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "38be6d14",
   "metadata": {},
   "source": [
    "## This notebook is used to generate pgf plots from .npy files, generated using the notebook Generating_experiment_results.ipnyb"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c420d9c8",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import matplotlib.pyplot as plt"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c8c6f2bb",
   "metadata": {},
   "outputs": [],
   "source": [
    "n_iter = 10**7\n",
    "n_mc = 20\n",
    "list_mu1 = [0.8,0.1,0.1,0.1,0.1]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "fe266f11",
   "metadata": {},
   "outputs": [],
   "source": [
    "def kl(x, y, eps = 1e-15):\n",
    "    x = min(max(x, eps), 1 - eps)\n",
    "    y = min(max(y, eps), 1 - eps)\n",
    "    return x * np.log(x / y) + (1 - x) * np.log((1 - x) / (1 - y))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "7c40a6f5",
   "metadata": {},
   "outputs": [],
   "source": [
    "def d_eps(x, y, epsilon, prec = 1e-15):\n",
    "    if epsilon > np.log(min(max(y, prec), 1 - prec) / min(max(x, prec), 1 - prec)) + np.log((1 - min(max(x, prec), 1 - prec)) / (1 - min(max(y, prec), 1 - prec))):\n",
    "        return kl(x, y, prec)\n",
    "    return kl( y/(y + (1 - y)*(np.exp(epsilon))), y , prec) + epsilon * (y/(y + (1 - y)*(np.exp(epsilon))) - x)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c822810c",
   "metadata": {},
   "outputs": [],
   "source": [
    "marker_list = ['o', '*', 'v', 'x', 'D', 'p', 's', 'h', '<']"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "e8427c9a",
   "metadata": {},
   "source": [
    "# Comparaison of algorithms"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b3d65188",
   "metadata": {},
   "outputs": [],
   "source": [
    "n_iter = 10**6 # The horizon T\n",
    "n_mc = 20 # number of times each experiment is repeated\n",
    "list_mu1 = [0.75,0.70,0.70,0.70,0.70]\n",
    "list_mu2 = [0.75,0.625,0.5,0.375,0.25]\n",
    "list_mu3 = [0.75,0.53125,0.375,0.28125,0.25]\n",
    "list_mu4 = [0.75,0.71875,0.625,0.46875,0.25]\n",
    "eps1, eps2, eps3, eps4, eps5 = 0.01, 0.1, 0.25, 0.5, 1\n",
    "list_mu = [list_mu1, list_mu2, list_mu3, list_mu4]\n",
    "epss = [eps1, eps2 ,eps3, eps4, eps5]"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "852328b1",
   "metadata": {},
   "source": [
    "### Generating 16 figures for every (list_mu,eps) combination"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "0895f336",
   "metadata": {},
   "outputs": [],
   "source": [
    "for i in range(4):\n",
    "    name_file_imed = \"results_npy/IMED_\" + str(i+1) + \"_T_\" + str(n_iter) + \"_n_mc_\" + str(n_mc) + \".npy\"\n",
    "    with open(name_file_imed, 'rb') as f:\n",
    "        gen_res_imed = np.load(f)\n",
    "    for j in range(5):\n",
    "        name_file_dp_se = \"results_npy/dp_se_\" + str(i+1) + \"_eps_\" + str(j+1) + \"_T_\" + str(n_iter) + \"_n_mc_\" + str(n_mc) + \".npy\"\n",
    "        with open(name_file_dp_se, 'rb') as f:\n",
    "            gen_res_dp_se = np.load(f)\n",
    "        name_file_adap_klucb = \"results_npy/adap_klucb_\" + str(i+1) + \"_eps_\" + str(j+1) + \"_T_\" + str(n_iter) + \"_n_mc_\" + str(n_mc) + \".npy\"\n",
    "        with open(name_file_adap_klucb, 'rb') as f:\n",
    "            gen_res_adap_klucb = np.load(f)\n",
    "        name_file_lazy_dp_ts = \"results_npy/lazy_dp_ts_\" + str(i+1) + \"_eps_\" + str(j+1) + \"_T_\" + str(n_iter) + \"_n_mc_\" + str(n_mc) + \".npy\"\n",
    "        with open(name_file_lazy_dp_ts, 'rb') as f:\n",
    "            gen_res_lazy_dp_ts = np.load(f)\n",
    "        name_file_dp_klucb = \"results_npy/dp_kl_ucb\" + str(i+1) + \"_eps_\" + str(j+1) + \"_T_\" + str(n_iter) + \"_n_mc_\" + str(n_mc) + \".npy\"\n",
    "        with open(name_file_dp_klucb, 'rb') as f:\n",
    "            gen_res_dp_klucb = np.load(f)\n",
    "        name_file_dp_imed = \"results_npy/dp_imed_\" + str(i+1) + \"_eps_\" + str(j+1) + \"_T_\" + str(n_iter) + \"_n_mc_\" + str(n_mc) + \".npy\"\n",
    "        with open(name_file_dp_imed, 'rb') as f:\n",
    "            gen_res_dp_imed = np.load(f)\n",
    "        fig = plt.figure()\n",
    "        fig.set_size_inches(w=5, h=4)\n",
    "        ax = fig.add_subplot(1, 1, 1)\n",
    "        ax.plot(np.arange(len(gen_res_dp_se.mean(axis=0)))[::1000], gen_res_dp_se.mean(axis=0)[::1000], marker = marker_list[0], markevery=50, label = r\"DP-SE\", rasterized=True)\n",
    "        ax.fill_between(np.arange(len(gen_res_dp_se.mean(axis=0)))[::1000], gen_res_dp_se.mean(axis=0)[::1000] - 2*gen_res_dp_se.std(axis=0)[::1000], gen_res_dp_se.mean(axis=0)[::1000] + 2*gen_res_dp_se.std(axis=0)[::1000], alpha=0.2, rasterized=True)\n",
    "        ax.plot(np.arange(len(gen_res_adap_klucb.mean(axis=0)))[::1000], gen_res_adap_klucb.mean(axis=0)[::1000], marker = marker_list[1], markevery=50, label = r\"AdaP-KLUCB\", rasterized=True)\n",
    "        ax.fill_between(np.arange(len(gen_res_adap_klucb.mean(axis=0)))[::1000], gen_res_adap_klucb.mean(axis=0)[::1000] - 2*gen_res_adap_klucb.std(axis=0)[::1000], gen_res_adap_klucb.mean(axis=0)[::1000] + 2 * gen_res_adap_klucb.std(axis=0)[::1000],  alpha=0.2, rasterized=True)\n",
    "        ax.plot(np.arange(len(gen_res_lazy_dp_ts.mean(axis=0)))[::1000], gen_res_lazy_dp_ts.mean(axis=0)[::1000], marker = marker_list[2], markevery=50, label = r\"Lazy-DP-TS\", rasterized=True)\n",
    "        ax.fill_between(np.arange(len(gen_res_lazy_dp_ts.mean(axis=0)))[::1000], gen_res_lazy_dp_ts.mean(axis=0)[::1000] - 2*gen_res_lazy_dp_ts.std(axis=0)[::1000], gen_res_lazy_dp_ts.mean(axis=0)[::1000] + 2*gen_res_lazy_dp_ts.std(axis=0)[::1000],  alpha=0.2, rasterized=True)\n",
    "        ax.plot(np.arange(len(gen_res_dp_klucb.mean(axis=0)))[::1000], gen_res_dp_klucb.mean(axis=0)[::1000], marker = marker_list[3], markevery=50, label = r\"DP-KL-UCB\", rasterized=True)\n",
    "        ax.fill_between(np.arange(len(gen_res_dp_klucb.mean(axis=0)))[::1000], gen_res_dp_klucb.mean(axis=0)[::1000] - gen_res_dp_klucb.std(axis=0)[::1000], gen_res_dp_klucb.mean(axis=0)[::1000] + gen_res_dp_klucb.std(axis=0)[::1000], alpha=0.2, rasterized=True)\n",
    "        ax.plot(np.arange(len(gen_res_dp_imed.mean(axis=0)))[::1000], gen_res_dp_imed.mean(axis=0)[::1000], marker = marker_list[4] , markevery=50, label = r\"DP-IMED\", rasterized=True)\n",
    "        ax.fill_between(np.arange(len(gen_res_dp_imed.mean(axis=0))), gen_res_dp_imed.mean(axis=0) - 0.2*gen_res_dp_klucb.std(axis=0), gen_res_dp_imed.mean(axis=0) + 0.2*gen_res_dp_klucb.std(axis=0), alpha=0.2, rasterized=True)\n",
    "        ax.plot(np.arange(len(gen_res_imed.mean(axis=0)))[::1000], gen_res_imed.mean(axis=0)[::1000], marker = marker_list[5] , markevery=50, label = r\"IMED\", rasterized=True)\n",
    "        ax.fill_between(np.arange(len(gen_res_imed.mean(axis=0)))[::1000], gen_res_imed.mean(axis=0)[::1000] - gen_res_imed.std(axis=0)[::1000], gen_res_imed.mean(axis=0)[::1000] + gen_res_imed.std(axis=0)[::1000], alpha=0.2, rasterized=True)\n",
    "        plt.xlabel(r\"Step $t$\")\n",
    "        plt.ylabel(r\"Regret\")\n",
    "        ax.legend(loc='lower right')\n",
    "        plt.yscale('log')\n",
    "        name_fig = \"comparison_algorithms_list_mu_\" + str(i+1)+ \"_eps_\" + str(j+1) + \".pdf\"\n",
    "        print(list_mu[i], epss[j])\n",
    "        #plt.show()\n",
    "        plt.savefig(name_fig, bbox_inches='tight')"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.10"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
