{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import tqdm \n",
    "from sklearn.linear_model import Lasso,LinearRegression,LassoCV\n",
    "from sentence_transformers import SentenceTransformer\n",
    "df = pd.read_csv('./data/benchmark/books/books.csv')\n",
    "### import sentence bert\n",
    "\n",
    "model = SentenceTransformer('sentence-transformers/all-MiniLM-L12-v1')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "### Load the data\n",
    "df = df.loc[:,['authors','title','book_id','average_rating']]\n",
    "ratings = pd.read_csv('./data/benchmark/books/ratings.csv')\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "### get the embeddings\n",
    "author_embedding = model.encode(df['authors'],show_progress_bar=True,normalize_embeddings=True)\n",
    "title_embedding = model.encode(df['title'],show_progress_bar=True,normalize_embeddings=True)\n",
    "\n",
    "### concatenate average rating with embedding\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "df['embedding'] = np.vstack((author_embedding + title_embedding)/2).tolist() ## convert to df column\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "### save the embeddings and labels\n",
    "import pickle\n",
    "N_users = 5\n",
    "top_users = ratings.groupby('user_id').count().sort_values('rating',ascending=False)[:N_users].index\n",
    "embeddings_users = []\n",
    "unique_books_ids = []\n",
    "labels_users = []\n",
    "for i,user in tqdm.tqdm(enumerate(top_users)):\n",
    "    df_subset = ratings[ratings['user_id']==user]\n",
    "    df_subset = df_subset.merge(df,on='book_id')\n",
    "    unique_books_ids.append(df_subset['book_id'].unique())\n",
    "    print(df_subset['book_id'].nunique())\n",
    "    labels_all = df_subset['rating'].values\n",
    "    embeddings_all = np.vstack(df_subset['embedding'].values)\n",
    "    embeddings_users.append(embeddings_all)\n",
    "    labels_users.append(labels_all)\n",
    "\n",
    "pickle.dump(embeddings_users,open('./data/benchmark/books/embeddings_users.pkl','wb'))\n",
    "pickle.dump(labels_users,open('./data/benchmark/books/labels_users.pkl','wb'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {},
   "outputs": [],
   "source": [
    "### get the good vectors\n",
    "import cvxpy as cp\n",
    "def get_good_vectors(embeddings):\n",
    "    n = embeddings.shape[0]\n",
    "    d = embeddings.shape[1]\n",
    "    x = cp.Variable(n)\n",
    "    constraints = [cp.sum(x)==1,x>=0]\n",
    "    objective_function = embeddings.T @ cp.diag(x) @ embeddings\n",
    "    objective = cp.Maximize(cp.lambda_min(objective_function))\n",
    "    prob = cp.Problem(objective,constraints)\n",
    "    prob.solve()\n",
    "    return x.value\n",
    "\n",
    "good_vectors = get_good_vectors(np.vstack(df[df['book_id'].isin(np.unique(np.concatenate(unique_books_ids)))]['embedding'].values))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {},
   "outputs": [],
   "source": [
    "df['good_vector'] = np.zeros(df.shape[0])\n",
    "df.loc[df['book_id'].isin(np.unique(np.concatenate(unique_books_ids))),'good_vector'] = np.array(good_vectors).astype(float)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#### main loop\n",
    "N_mc = 100\n",
    "N_random = 60\n",
    "N_test = 40\n",
    "N_users = 5\n",
    "top_users = ratings.groupby('user_id').count().sort_values('rating',ascending=False)[:N_users].index\n",
    "cumsum_regrets = np.zeros((top_users.shape[0],N_mc,N_test+N_random,2))\n",
    "cumsum_regrets_just_lr = np.zeros((top_users.shape[0],N_mc,N_test+N_random,2))\n",
    "for i,user in tqdm.tqdm(enumerate(top_users)):\n",
    "    df_subset = ratings[ratings['user_id']==user]\n",
    "    df_subset = df_subset.merge(df,on='book_id')\n",
    "    labels_all = df_subset['rating'].values\n",
    "    embeddings_all = np.vstack(df_subset['embedding'].values)\n",
    "\n",
    "    for j in range(N_mc):\n",
    "        ### get the random indices\n",
    "        random_indices = np.random.choice(df_subset.shape[0],size=N_random,replace=False,p=df_subset['good_vector'].values/np.sum(df_subset['good_vector'].values))\n",
    "        \n",
    "        embeddings_subset = np.vstack(df_subset.loc[random_indices,'embedding'].values)\n",
    "        labels_subset = df_subset.loc[random_indices,'rating'].values\n",
    "        #### fit the lasso\n",
    "        model = Lasso(alpha=0.001,max_iter=10000)\n",
    "        model.fit(embeddings_subset,labels_subset)\n",
    "\n",
    "        non_zero_coef = model.coef_!=0\n",
    "        X = embeddings_subset[:,non_zero_coef]\n",
    "        y = labels_subset\n",
    "\n",
    "        model_lr = LinearRegression()\n",
    "        model_lr.fit(X,y)\n",
    "\n",
    "        #### get the predictions\n",
    "        y_pred = model_lr.predict(embeddings_all[:,non_zero_coef])\n",
    "        y_true = labels_all\n",
    "\n",
    "        labels_not_in_random = np.setdiff1d(df_subset.index,random_indices)\n",
    "        indices_sort_from_pred = np.argsort(y_pred)[::-1]\n",
    "        indices_sort_from_pred = [i for i in indices_sort_from_pred if i not in random_indices]\n",
    "        y_true_sorted_by_pred = y_true[indices_sort_from_pred]\n",
    "        y_true_by_pred = y_true_sorted_by_pred[:N_test]\n",
    "\n",
    "        y_from_pred = labels_all[indices_sort_from_pred]\n",
    "        y_sorted = np.sort(y_true)[::-1][:N_test+N_random]\n",
    "        \n",
    "        all_y_pred = np.concatenate([y,y_true_by_pred])\n",
    "        cumsum_regrets[i,j] = np.vstack([y_sorted,all_y_pred]).T\n",
    "\n",
    "        random_indices = np.random.choice(df_subset.shape[0],size=N_random,replace=False)\n",
    "        \n",
    "        embeddings_subset = np.vstack(df_subset.loc[random_indices,'embedding'].values)\n",
    "        labels_subset = df_subset.loc[random_indices,'rating'].values\n",
    "        model = LinearRegression()\n",
    "        model.fit(embeddings_subset,labels_subset)\n",
    "        y_pred = model.predict(embeddings_all)\n",
    "        y_true = labels_all\n",
    "\n",
    "        labels_not_in_random = np.setdiff1d(df_subset.index,random_indices)\n",
    "        indices_sort_from_pred = np.argsort(y_pred)[::-1]\n",
    "        indices_sort_from_pred = [i for i in indices_sort_from_pred if i not in random_indices]\n",
    "        y_true_sorted_by_pred = y_true[indices_sort_from_pred]\n",
    "        y_true_by_pred = y_true_sorted_by_pred[:N_test]\n",
    "        all_y_pred = np.concatenate([y,y_true_by_pred])\n",
    "        cumsum_regrets_just_lr[i,j] = np.vstack([y_sorted,all_y_pred]).T\n",
    "        \n",
    "        \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 51,
   "metadata": {},
   "outputs": [],
   "source": [
    "# cumsum_regrets_ = np.sort(cumsum_regrets,axis=2)[:,:,::-1]\n",
    "cumsum_regrets_ = np.sort(cumsum_regrets[:,:,:,0],axis=2)[:,:,::-1]-cumsum_regrets[:,:,:,1]\n",
    "cumsum_regrets_ = np.cumsum(cumsum_regrets_,axis=2)\n",
    "\n",
    "cumsum_regrets_just_lr = np.sort(cumsum_regrets_just_lr[:,:,:,0],axis=2)[:,:,::-1]-cumsum_regrets_just_lr[:,:,:,1]\n",
    "cumsum_regrets_just_lr = np.cumsum(cumsum_regrets_just_lr,axis=2)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 52,
   "metadata": {},
   "outputs": [],
   "source": [
    "cum_regret_random = np.zeros((N_mc,N_random+N_test))\n",
    "for i in range(N_mc):\n",
    "    random_indices = np.random.choice(df_subset.shape[0],size=N_test+N_random,replace=False)\n",
    "    y_true = labels_all[random_indices]\n",
    "    y_best = np.sort(labels_all)[::-1][:N_test+N_random]\n",
    "    cum_regret_random[i] = np.cumsum(y_best-y_true)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "plt.plot(np.mean(cumsum_regrets_,axis=1).mean(axis=0),label='Our Algorithm')\n",
    "plt.plot(np.arange(N_random+N_test),np.mean(cum_regret_random,axis=0),label='Random Selected')\n",
    "plt.plot(np.arange(N_random+N_test),np.mean(cumsum_regrets_just_lr,axis=1).mean(axis=0),label='LR')\n",
    "plt.legend(fontsize=15)\n",
    "plt.fill_between(np.arange(N_random+N_test),np.percentile(cumsum_regrets_.mean(axis=0),25,axis=0),np.percentile(cumsum_regrets_.mean(axis=0),75,axis=0),alpha=0.2)\n",
    "plt.fill_between(np.arange(N_random+N_test),np.percentile(cum_regret_random,25,axis=0),np.percentile(cum_regret_random,75,axis=0),alpha=0.2)\n",
    "plt.fill_between(np.arange(N_random+N_test),np.percentile(cumsum_regrets_just_lr.mean(axis=0),25,axis=0),np.percentile(cumsum_regrets_just_lr.mean(axis=0),75,axis=0),alpha=0.2)\n",
    "plt.xlabel('Rounds',fontsize=15)\n",
    "plt.ylabel('Cumulative Regret',fontsize=15)\n",
    "plt.xticks(fontsize=15)\n",
    "plt.yticks(fontsize=15)\n",
    "plt.show()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "from alg import BaseAlgorithm\n",
    "import pickle\n",
    "import numpy as np\n",
    "import tqdm\n",
    "from sklearn.linear_model import Lasso,LinearRegression\n",
    "import matplotlib.pyplot as plt"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "### check if the BaseAlgorithm is working \n",
    "embeddings_user = pickle.load(open('./data/benchmark/books/embeddings_users.pkl','rb'))\n",
    "labels_user = pickle.load(open('./data/benchmark/books/labels_users.pkl','rb'))\n",
    "N_mc = 100\n",
    "N_random = 50\n",
    "N_test = 100\n",
    "N_users = 5\n",
    "cumsum_regrets = np.zeros((len(embeddings_user),N_mc,N_test+N_random,2))\n",
    "cumsum_regrets_base = np.zeros((len(embeddings_user),N_mc,N_test+N_random,2))\n",
    "cumsum_regrets_random = np.zeros((len(embeddings_user),N_mc,N_test+N_random,2))\n",
    "for i,user in tqdm.tqdm(enumerate(range(len(embeddings_user)))):\n",
    "    embeddings_all = embeddings_user[i]\n",
    "    labels_all = labels_user[i]\n",
    "    n_books = embeddings_all.shape[0]\n",
    "    for j in range(N_mc):\n",
    "        random_indices = np.random.choice(n_books,size=N_random,replace=False)\n",
    "        ### get the random subset\n",
    "        embeddings_subset = embeddings_all[random_indices]\n",
    "        labels_subset = labels_all[random_indices]\n",
    "        ### fit a lasso model\n",
    "        model = Lasso(alpha=0.001,max_iter=10000)\n",
    "        model.fit(embeddings_subset,labels_subset)\n",
    "        ### get the non zero coefficients\n",
    "        non_zero_coef = model.coef_!=0\n",
    "        # print(non_zero_coef.sum())\n",
    "        X = embeddings_subset[:,non_zero_coef]\n",
    "\n",
    "        y = labels_subset\n",
    "        ### fit a linear regression model\n",
    "        model_lr = LinearRegression()\n",
    "        model_lr.fit(X,y)\n",
    "        ### predict the labels \n",
    "        y_pred = model_lr.predict(embeddings_all[:,non_zero_coef])\n",
    "        y_true = labels_all\n",
    "        ### get the labels not in the random subset\n",
    "        indices_sort_from_pred = np.argsort(y_pred)[::-1]\n",
    "        indices_sort_from_pred = [i for i in indices_sort_from_pred if i not in random_indices]\n",
    "        y_true_sorted_by_pred = y_true[indices_sort_from_pred]\n",
    "        y_true_by_pred = y_true_sorted_by_pred[:N_test]\n",
    "        ### get the labels sorted\n",
    "        y_from_pred = labels_all[indices_sort_from_pred]\n",
    "        y_sorted = np.sort(y_true)[::-1][:N_test+N_random]\n",
    "        ### get the labels sorted by the predicted values \n",
    "        all_y_pred = np.concatenate([y,y_true_by_pred])\n",
    "        cumsum_regrets[i,j] = np.vstack([y_sorted,all_y_pred]).T\n",
    "        ### run the base algorithm \n",
    "        base_algorithm = BaseAlgorithm(embeddings_all.shape[0],embeddings_all.shape[1],N_random,N_random+N_test,embeddings_all,true_parameter=None,true_rewards=labels_all)\n",
    "        base_algorithm.run()\n",
    "        y_pred_base = labels_all[base_algorithm.order_of_arms.astype(int)]\n",
    "        cumsum_regrets_base[i,j] = np.vstack([y_sorted,y_pred_base]).T\n",
    "        ### random selection\n",
    "        random_indices = np.random.choice(n_books,size=N_test+N_random,replace=False)\n",
    "        y_true = labels_all[random_indices]\n",
    "        cumsum_regrets_random[i,j] = np.vstack([y_sorted,y_true]).T"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "cumsum_regrets_base = cumsum_regrets_base[:,:,:,0] - cumsum_regrets_base[:,:,:,1]\n",
    "# cumsum_regrets_base = np.cumsum(cumsum_regrets_base,axis=2)\n",
    "\n",
    "cumsum_regrets = cumsum_regrets[:,:,:,0] - cumsum_regrets[:,:,:,1]\n",
    "# cumsum_regrets = np.cumsum(cumsum_regrets,axis=2)\n",
    "\n",
    "cumsum_regrets_random = cumsum_regrets_random[:,:,:,0] - cumsum_regrets_random[:,:,:,1]\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "plt.plot(np.mean(cumsum_regrets.cumsum(axis=2),axis=1).mean(axis=0),label='Our Algorithm')\n",
    "plt.plot(np.mean(cumsum_regrets_base.cumsum(axis=2),axis=1).mean(axis=0),label='Base Algorithm')\n",
    "plt.plot(np.mean(cumsum_regrets_random.cumsum(axis=2),axis=1).mean(axis=0),label='Random Selection')\n",
    "plt.vlines(N_random,0,cumsum_regrets.cumsum(axis=2).max(),linestyles='--')\n",
    "plt.legend()\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [],
   "source": [
    "\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": ".venv",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.6"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
