{
  "nbformat": 4,
  "nbformat_minor": 0,
  "metadata": {
    "colab": {
      "provenance": [],
      "collapsed_sections": [
        "p8MwcFOOW0_b",
        "tIq9bhSYXEDe"
      ]
    },
    "kernelspec": {
      "name": "python3",
      "display_name": "Python 3"
    },
    "language_info": {
      "name": "python"
    }
  },
  "cells": [
    {
      "cell_type": "markdown",
      "source": [
        "# **Stochastic Bandits for Egalitarian Assignment - MovieLens Experiments**\n",
        "---"
      ],
      "metadata": {
        "id": "udvmtNUmA3E2"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "rootdir = 'drive/MyDrive/egalucb/movielens' # @param {type: \"string\"}\n",
        "K = 500 # @param {type: \"integer\"}\n",
        "\n",
        "from google.colab import drive\n",
        "drive.mount('drive', force_remount=True)\n",
        "! mkdir -p {rootdir}"
      ],
      "metadata": {
        "cellView": "form",
        "id": "UBBOzLf7UpiH"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "markdown",
      "source": [
        "## Setup"
      ],
      "metadata": {
        "id": "p8MwcFOOW0_b"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "! sudo apt install cm-super dvipng texlive-latex-extra texlive-latex-recommended"
      ],
      "metadata": {
        "id": "r5QHe68h2Bu4"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "FNikf-Pa0c_O"
      },
      "outputs": [],
      "source": [
        "import numpy as np\n",
        "import matplotlib\n",
        "import matplotlib.pyplot as plt\n",
        "import pandas as pd\n",
        "import os.path\n",
        "\n",
        "from collections import defaultdict\n",
        "from tqdm import tqdm"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "olderr = np.seterr(all='ignore')\n",
        "\n",
        "matplotlib.rcParams[\"text.usetex\"] = True\n",
        "matplotlib.rcParams[\"font.size\"] = \"7\"\n",
        "matplotlib.rcParams['mathtext.fontset'] = 'stix'\n",
        "matplotlib.rcParams['font.family'] = 'STIXGeneral'\n",
        "\n",
        "def pt2inches(width, height):\n",
        "    return (width / 72.27, height / 72.27)"
      ],
      "metadata": {
        "id": "HDSWpmHJ0l8U"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "class MultiUserMovieLensBanditInstance:\n",
        "\n",
        "    options = [0.5, 1.0, 1.5, 2.0, 2.5, 3.0, 3.5, 4.0, 4.5, 5.0]\n",
        "\n",
        "    def __init__(self, K, U, probs):\n",
        "        self.K = K\n",
        "        self.U = U\n",
        "        self.probs = probs\n",
        "        self.mus = probs @ np.array(MultiUserMovieLensBanditInstance.options)\n",
        "        self.mustar = np.sum(np.sort(self.mus)[-U:])\n",
        "\n",
        "    def pull(self, arms):\n",
        "        rewards = np.zeros(self.U)\n",
        "        for u in range(self.U):\n",
        "            rewards[u] = self.sample_from(arms[u])\n",
        "        return rewards\n",
        "\n",
        "    def sample_from(self, arm):\n",
        "        return np.random.choice(MultiUserMovieLensBanditInstance.options, p=self.probs[arm, :])\n",
        "\n",
        "    def simulate_egalucb(self, T):\n",
        "        cumrewards = np.zeros(self.K)\n",
        "        numplays = np.zeros(self.K, dtype=int)\n",
        "        expregrets = np.zeros((self.U, T + 1))\n",
        "        B = int(T / self.U)\n",
        "        t = 0\n",
        "        for b in tqdm(range(B)):\n",
        "            muhats = cumrewards / numplays\n",
        "            ucbs = muhats + np.sqrt(6 * np.log(b) / numplays)\n",
        "            ucbs = np.nan_to_num(ucbs, nan=np.inf)\n",
        "            blockarms = ucbs.argsort()[-self.U:][::-1]\n",
        "            blockarms = np.concatenate([blockarms, blockarms])\n",
        "            for i in range(self.U):\n",
        "                t += 1\n",
        "                arms = blockarms[i:self.U+i]\n",
        "                rewards = self.pull(arms)\n",
        "                cumrewards[arms] += rewards\n",
        "                numplays[arms] += 1\n",
        "                expregrets[:,t] = expregrets[:,t-1] + (self.mustar / self.U - self.mus[arms])\n",
        "        expregrets = expregrets[:, 1:]\n",
        "        return cumrewards, numplays, expregrets"
      ],
      "metadata": {
        "id": "IcB_Hk280nAJ"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "markdown",
      "source": [
        "## Load Dataset"
      ],
      "metadata": {
        "id": "tIq9bhSYXEDe"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "if not os.path.isfile(f'{rootdir}/ratings.csv'):\n",
        "    ! wget https://files.grouplens.org/datasets/movielens/ml-25m.zip\n",
        "    ! unzip ml-25m.zip\n",
        "    ! mv ml-25m/ratings.csv {rootdir}/ratings.csv\n",
        "    ! rm -r ml-25m ml-25m.zip\n",
        "\n",
        "data = pd.read_csv(f'{rootdir}/ratings.csv')"
      ],
      "metadata": {
        "id": "z2Dzixe9cni_"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "if not os.path.isfile(f'{rootdir}/probs{K:d}.npz'):\n",
        "    ids = data['movieId'].value_counts().nlargest(K).index\n",
        "    probs = np.zeros((K, 10)) # each row is a movie; each column is possible rating: 0.5, ..., 4.5, 5.0\n",
        "    for k in range(K):\n",
        "        ratings = data[data['movieId'] == ids[k]]['rating'].value_counts()\n",
        "        for i in range(10):\n",
        "            if 0.5 * (i + 1) in ratings.index:\n",
        "                probs[k, i] = ratings[0.5 * (i + 1)]\n",
        "        probs[k, :] /= np.sum(probs[k, :])\n",
        "    np.savez(f'{rootdir}/probs{K:d}.npz', probs=probs, allow_pickle=True)"
      ],
      "metadata": {
        "id": "sTw5RANY3wNe"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "npzfile = np.load(f'{rootdir}/probs{K:d}.npz', allow_pickle=True)\n",
        "probs = npzfile['probs']"
      ],
      "metadata": {
        "id": "2LBK9e9h_7hM"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "markdown",
      "source": [
        "## Experiment 1: How regret evolves over time?"
      ],
      "metadata": {
        "id": "0ViygFG5cMmj"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "T = 150000\n",
        "Us = [10, 20, 30, 40, 50]"
      ],
      "metadata": {
        "id": "4X7pJxqAX7u4"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "instances = []\n",
        "expregrets_list = []\n",
        "\n",
        "for i in range(len(Us)):\n",
        "    instances.append(MultiUserMovieLensBanditInstance(K, Us[i], probs))\n",
        "\n",
        "for i in range(len(Us)):\n",
        "    _, _, expregrets = instances[i].simulate_egalucb(T)\n",
        "    expregrets_list.append(expregrets)"
      ],
      "metadata": {
        "id": "umb56dJ91M7Y"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "np.save(f'{rootdir}/ex1-movielens.npy', np.array(expregrets_list, dtype=object))"
      ],
      "metadata": {
        "id": "sj0eq0Oh2cb1"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "expregrets_list = np.load(f'{rootdir}/ex1-movielens.npy', allow_pickle=True)"
      ],
      "metadata": {
        "id": "1ih75vqP1xEd"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "fig, ax = plt.subplots(figsize=(pt2inches(200, 120)), dpi=120)\n",
        "linestyles = [(0, ()), (0, (1, 1)), (0, (5, 1)), (0, (5, 5)), (0, (3, 1, 1, 1))]\n",
        "colors = ['#EE6677', '#228833', '#4477AA', '#AA3377', '#CCBB44']\n",
        "\n",
        "res = 1000\n",
        "time = np.arange(1, T + 1)\n",
        "for i in range(len(Us)):\n",
        "    ax.plot(time[::res], expregrets_list[i][0,::res], color=colors[i], label=f'{Us[i]:d} users', linestyle=linestyles[i], linewidth=0.5)\n",
        "\n",
        "xticks = matplotlib.ticker.FuncFormatter(lambda x, pos: '{0:g}'.format(x / 1000))\n",
        "yticks = matplotlib.ticker.FuncFormatter(lambda y, pos: '{0:g}'.format(y / 1000))\n",
        "\n",
        "ax.xaxis.set_major_formatter(xticks)\n",
        "ax.yaxis.set_major_formatter(yticks)\n",
        "ax.set_xticks(np.arange(0, 150001, 30000))\n",
        "ax.set_yticks(np.arange(0, 8001, 2000))\n",
        "ax.tick_params(axis='both', which='both', length=0)\n",
        "\n",
        "ax.spines['top'].set_visible(False)\n",
        "ax.spines['right'].set_visible(False)\n",
        "ax.spines['bottom'].set_visible(False)\n",
        "ax.spines['left'].set_visible(False)\n",
        "\n",
        "ax.set_xlabel('Timestep (in thousands)')\n",
        "ax.set_ylabel('Regret (in thousands)')\n",
        "ax.legend(fontsize='6')\n",
        "ax.grid(alpha=0.25, axis='y', color='#BBBBBB', linewidth=0.5)\n",
        "\n",
        "fig.show()\n",
        "fig.savefig(f'{rootdir}/ex1-movielens.pdf', bbox_inches='tight')"
      ],
      "metadata": {
        "id": "5CItfxCB62J0"
      },
      "execution_count": null,
      "outputs": []
    }
  ]
}