{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "from sklearn.linear_model import Lasso,LinearRegression,LassoCV\n",
    "import tqdm"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "### Variation with Tail\n",
    "from alg import CORRAL,BaseAlgorithm\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "from sklearn.linear_model import Lasso,LinearRegression,LassoCV\n",
    "import tqdm\n",
    "\n",
    "N_mc = 10\n",
    "d = 300\n",
    "k = 10\n",
    "T = 200\n",
    "N = 1000\n",
    "E_list = [10,20,40,80]\n",
    "from tqdm import tqdm\n",
    "tail_parameters = [0.2,0.4,0.7,1,10,100]\n",
    "gammas = np.zeros((N_mc,len(tail_parameters)))\n",
    "regrets = np.zeros((N_mc,len(tail_parameters),T))\n",
    "E=80\n",
    "for i in tqdm(range(N_mc)):\n",
    "    \n",
    "    embeddings = np.random.uniform(size=(N,d))\n",
    "    parametertrue = np.random.uniform(size=(d,))\n",
    "    ### create tail out d-k parameters\n",
    "    for j in range(len(tail_parameters)):\n",
    "        parametertrue_copy = parametertrue.copy()\n",
    "        parametertrue_copy[-d+k:] = parametertrue_copy[-d+k:]/tail_parameters[j]\n",
    "        gammas[i,j] = np.sum(np.abs(parametertrue_copy[-d+k:]))/np.sum(np.abs(parametertrue_copy[:k]))\n",
    "        ### sort the parameters\n",
    "        #parametertrue_copy = np.sort(parametertrue_copy)[::-1]\n",
    "        base_algorithm = BaseAlgorithm(N,d,E,T,embeddings,parametertrue_copy)\n",
    "        for t in range(T):\n",
    "            base_algorithm.make_decision()\n",
    "        regrets[i,j,:] = np.cumsum(np.sort(base_algorithm.true_rewards)[::-1][:T]- base_algorithm.true_rewards[base_algorithm.order_of_arms.astype(int)])\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import seaborn as sns\n",
    "plt.rcParams.update({\n",
    "    \"text.usetex\": True,\n",
    "    \"font.family\": \"serif\",\n",
    "    \"font.serif\": [\"Computer Modern Roman\"],\n",
    "    \"font.monospace\": [\"Computer Modern Typewriter\"],\n",
    "})\n",
    "\n",
    "\n",
    "sns.set_style(\"darkgrid\")\n",
    "plt.figure(figsize=(8,5))\n",
    "plt.plot(regrets.mean(axis=0).T)\n",
    "plt.legend(np.round(gammas.mean(axis=0),1),title=\"Average Tail Parameter $\\gamma$\",title_fontsize=\"16\",fontsize=\"16\")\n",
    "plt.xlabel(\"Number of Rounds\",fontdict={\"size\":16})\n",
    "plt.ylabel(\"Regret\",fontdict={\"size\":16})\n",
    "### add the fill\n",
    "for i in range(len(tail_parameters)):\n",
    "    plt.fill_between(np.arange(T),regrets.mean(axis=0).T[:,i]-regrets.std(axis=0).T[:,i],regrets.mean(axis=0).T[:,i]+regrets.std(axis=0).T[:,i],alpha=0.2)\n",
    "plt.savefig(\"plots/tail_parameter.pdf\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "### simulated experiment\n",
    "from alg import CORRAL,BaseAlgorithm\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "from sklearn.linear_model import Lasso,LinearRegression,LassoCV\n",
    "import tqdm\n",
    "\n",
    "N_mc = 10\n",
    "d = 700\n",
    "k = 10\n",
    "T = 800\n",
    "N = 10000\n",
    "E_list = [10,20,40,80]\n",
    "# ks = np.array([2**i for i in range(15) if 2**i <= d])\n",
    "\n",
    "# E_list = (ks**(1/3)*T**(2/3)).astype(int)\n",
    "from tqdm import tqdm\n",
    "regrets = np.zeros((N_mc,T))\n",
    "regrets_random = np.zeros((N_mc,T))\n",
    "regrets_base_algorithm = np.zeros((len(E_list),N_mc,T))\n",
    "regrets_linear_regression = np.zeros((N_mc,T))\n",
    "p_store = np.zeros((N_mc,T,len(E_list)))\n",
    "for i in tqdm(range(N_mc)):\n",
    "    parametertrue = np.random.uniform(size=(d,))\n",
    "    embeddings = np.random.randn(N,d)\n",
    "\n",
    "    ### create tail out d-k parameters\n",
    "    parametertrue[-d+k:] = parametertrue[-d+k:]/1000\n",
    "    ### sort the parameters\n",
    "    parametertrue = np.sort(parametertrue)[::-1]\n",
    "    base_algorithms = [BaseAlgorithm(N,d,E_list[i],T,embeddings,parametertrue) for i in range(len(E_list))]\n",
    "    true_rewards = base_algorithms[0].true_rewards\n",
    "\n",
    "    p, p_bar, order_of_arms = CORRAL(1e-2, base_algorithms, T)\n",
    "    p_store[i,:,:] = p\n",
    "    regrets[i,:] = np.cumsum(np.sort(true_rewards)[::-1][:T]- true_rewards[order_of_arms.astype(int)])\n",
    "    for j in range(len(E_list)):\n",
    "        base_algorithm = BaseAlgorithm(N,d,E_list[j],T,embeddings,parametertrue)\n",
    "        for t in range(T):\n",
    "            base_algorithm.make_decision()\n",
    "        regrets_base_algorithm[j,i,:] = np.cumsum(np.sort(true_rewards)[::-1][:T]- true_rewards[base_algorithm.order_of_arms.astype(int)])\n",
    "    regrets_random[i,:] = np.cumsum(np.sort(true_rewards)[::-1][:T]- true_rewards[np.random.choice(N,size=T,replace=True)])\n",
    "    \n",
    "    base_algorithms_lr = [BaseAlgorithm(N,d,E_list[i],T,embeddings,parametertrue,linear_model=LinearRegression()) for i in range(len(E_list))]\n",
    "    true_rewards = base_algorithms_lr[0].true_rewards\n",
    "    p, p_bar, order_of_arms = CORRAL(1e-3, base_algorithms_lr, T)\n",
    "    regrets_linear_regression[i,:] = np.cumsum(np.sort(true_rewards)[::-1][:T]- true_rewards[order_of_arms.astype(int)])\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "parametertrue[-d+k:].sum()/parametertrue[:k].sum()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import seaborn as sns\n",
    "plt.rcParams.update({\n",
    "    \"text.usetex\": True,\n",
    "    \"font.family\": \"serif\",\n",
    "    \"font.serif\": [\"Computer Modern Roman\"],\n",
    "    \"font.monospace\": [\"Computer Modern Typewriter\"],\n",
    "})\n",
    "\n",
    "\n",
    "sns.set_style(\"darkgrid\")\n",
    "plt.plot(range(T),p_store[:,:].mean(axis=0))\n",
    "# for i in range(4):\n",
    "#     plt.fill_between(range(T),p_store[:,:].mean(axis=0)[:,i]-p_store[:,:].std(axis=0)[:,i],p_store[:,:].mean(axis=0)[:,i]+p_store[:,:].std(axis=0)[:,i],alpha=0.2)\n",
    "plt.legend([f\"Base Algorithm with $T_{i}$\" for i in range(4)])\n",
    "plt.xlabel(\"Rounds\")\n",
    "plt.ylabel(\"Probability of Sampling in CORRAL\")\n",
    "plt.savefig(\"plots/basealgs_cvg.pdf\")\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import seaborn as sns\n",
    "plt.rcParams.update({\n",
    "    \"text.usetex\": True,\n",
    "    \"font.family\": \"serif\",\n",
    "    \"font.serif\": [\"Computer Modern Roman\"],\n",
    "    \"font.monospace\": [\"Computer Modern Typewriter\"],\n",
    "})\n",
    "\n",
    "\n",
    "sns.set_style(\"darkgrid\")\n",
    "plt.figure(figsize=(8,6))\n",
    "plt.plot(regrets.mean(axis=0),label=\"C-BSLB\")\n",
    "plt.plot(regrets_linear_regression.mean(axis=0),label=\"Corral with $\\ell_2$ Regularization\")\n",
    "plt.plot(regrets_random.mean(axis=0),label=\"Random\")\n",
    "for i in range(len(E_list)):\n",
    "    plt.plot(regrets_base_algorithm[i,:,:].mean(axis=0),alpha=0.8,linestyle=\"--\",label=f\"$T_{{explore}}$={E_list[i]}\")\n",
    "## percentile based confidence intervals\n",
    "plt.fill_between(np.arange(T),np.percentile(regrets,25,axis=0),np.percentile(regrets,75,axis=0),alpha=0.2)\n",
    "# plt.fill_between(np.arange(T),regrets_linear_regression.mean(axis=0)-regrets_linear_regression.std(axis=0),regrets_linear_regression.mean(axis=0)+regrets_linear_regression.std(axis=0),alpha=0.2)\n",
    "# for i in range(len(E_list)):\n",
    "#     plt.fill_between(np.arange(T),regrets_base_algorithm[i,:,:].mean(axis=0)-regrets_base_algorithm[i,:,:].std(axis=0),regrets_base_algorithm[i,:,:].mean(axis=0)+regrets_base_algorithm[i,:,:].std(axis=0),alpha=0.2)\n",
    "plt.legend(fontsize=15,loc=\"upper left\")\n",
    "plt.xlabel(\"Number of Rounds\",fontsize=18)\n",
    "plt.ylabel(\"Cumulative Regret\",fontsize=18)\n",
    "plt.xticks(fontsize=15)\n",
    "plt.yticks(fontsize=15)\n",
    "plt.savefig(\"plots/simulated_results.png\",dpi=300,bbox_inches=\"tight\")\n",
    "plt.show()\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": ".venv",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.6"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
