{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "offshore-serial",
   "metadata": {},
   "outputs": [],
   "source": [
    "%matplotlib inline\n",
    "import matplotlib\n",
    "matplotlib.rcParams['text.usetex'] = True\n",
    "\n",
    "import matplotlib.pyplot as plt\n",
    "import autograd.numpy as np \n",
    "from autograd import grad  \n",
    "\n",
    "\n",
    "def utility(xs,index_player):\n",
    "    if Game==\"Pigou's Network\":\n",
    "    #Atomic Pigou's Network\n",
    "        return xs[index_player][0]+1/len(xs)*sum([x[1] for x in xs])\n",
    "    #BoS  Network\n",
    "    if Game==\"Battle of the Sexes\":\n",
    "        if index_player == 0:\n",
    "            return xs[index_player][0]*xs[1-index_player][0]*2+(1-xs[index_player][1])*(1-xs[1-index_player][1])*1\n",
    "        if index_player == 1:\n",
    "            return xs[index_player][0]*xs[1-index_player][0]*1+(1-xs[index_player][1])*(1-xs[1-index_player][1])*2\n",
    "\n",
    "def choose(xs,x,index_player):\n",
    "    l = [elem for elem in xs]\n",
    "    l[index_player]=x\n",
    "    return l\n",
    "\n",
    "def gamma(time):\n",
    "    if style_step_size:\n",
    "        return 0.01\n",
    "    else:\n",
    "        return 1/time**(1/2.)\n",
    "    \n",
    "def epsilon(time):\n",
    "    return 1/time**(1/3.)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "former-lender",
   "metadata": {},
   "outputs": [],
   "source": [
    "def perfect_payoff(xs,step):\n",
    "    vs=[]\n",
    "    for index_player in range(len(xs)):\n",
    "        v = np.array([utility(choose(xs,np.array([1,0]),index_player),index_player),\n",
    "                      utility(choose(xs,np.array([0,1]),index_player),index_player),\n",
    "                    ])\n",
    "        vs.append(v)\n",
    "    return np.array(vs)\n",
    "\n",
    "def imperfect_payoff(xs,step):\n",
    "    vs=[]\n",
    "    for index_player in range(len(xs)):\n",
    "        v = np.array([utility(choose(xs,np.array([1,0]),index_player),index_player),\n",
    "                      utility(choose(xs,np.array([0,1]),index_player),index_player)\n",
    "                    ])\n",
    "        v = v + np.random.uniform([-0.1,0.1])  \n",
    "        vs.append(v)\n",
    "    return np.array(vs)    \n",
    "\n",
    "def truncgaussian_payoff(xs,step):\n",
    "    from scipy.stats import truncnorm\n",
    "    vs=[]\n",
    "    for index_player in range(len(xs)):\n",
    "        v = np.array([utility(choose(xs,np.array([1,0]),index_player),index_player),\n",
    "                      utility(choose(xs,np.array([0,1]),index_player),index_player)\n",
    "                    ])\n",
    "        v = v +truncnorm.rvs(-0.1, 0.1, size=2)\n",
    "        vs.append(v)\n",
    "    return np.array(vs)\n",
    "\n",
    "def semi_bandit_perfect_payoff(xs,step):\n",
    "    vs=[]\n",
    "    samples=[list(np.random.choice(2, 1, p=x))[0] for x in xs]\n",
    "    actions=np.array([[np.array([1,0]),np.array([0,1])][sample] for sample in samples])\n",
    "    for index_player in range(len(xs)):\n",
    "        v = np.array([utility(choose(actions,np.array([1,0]),index_player),index_player),\n",
    "                      utility(choose(actions,np.array([0,1]),index_player),index_player),\n",
    "                    ])\n",
    "        vs.append(v)\n",
    "    return np.array(vs)\n",
    "\n",
    "def bandit_perfect_payoff(xs,step):\n",
    "    xs_hat = [x*(1-epsilon(step))+epsilon(step)*np.ones(np.size(x))/np.size(x) for x in xs]\n",
    "    vs=[]\n",
    "    samples=[list(np.random.choice(2, 1, p=x))[0] for x in xs_hat]\n",
    "    actions=np.array([[np.array([1,0]),np.array([0,1])][sample] for sample in samples])\n",
    "    for index_player in range(len(xs)):\n",
    "        v=np.zeros(np.size(xs_hat[index_player]))\n",
    "        s=samples[index_player]\n",
    "        v[s]=utility(actions,index_player)/xs_hat[index_player][s]\n",
    "        vs.append(v)\n",
    "    return np.array(vs)    "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "noticed-india",
   "metadata": {},
   "outputs": [],
   "source": [
    "def projection_in_simplex(y):\n",
    "    y=-np.sort(-y)\n",
    "    rho=max([ i+1   for i in range(np.size(y)) if (y[i]+1/(i+1)*(1-sum(y[:i+1])))>0])\n",
    "    ellambda = 1/rho*(1-sum(y[:rho]))\n",
    "    return np.array([ max([y[i]+ellambda,0]) for i in range(np.size(y))])\n",
    "\n",
    "def logit(y):\n",
    "    x = np.exp(y-min(y))\n",
    "    x = x/sum(x)\n",
    "    return x\n",
    "\n",
    "def inverse_logarithmic(y):\n",
    "    x = np.exp(y-min(y))\n",
    "    x = x/sum(x)\n",
    "    return x\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "imperial-framing",
   "metadata": {},
   "outputs": [],
   "source": [
    "def Q_map(y,regularizer):\n",
    "    if regularizer == \"replicator\":\n",
    "        x = logit(y)\n",
    "    if regularizer == \"euclidean\":\n",
    "        x = projection_in_simplex(y)\n",
    "    if regularizer == \"logarithmic\":\n",
    "        x = inverse_logarithmic(y)\n",
    "    return np.array(x)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "pleasant-cassette",
   "metadata": {},
   "outputs": [],
   "source": [
    "def experiment(ys,ys_middle,xs,steps,payoff,regularizers,algorithm=\"FTRL\",print_step=False):\n",
    "    start_step=1\n",
    "    num_players=len(ys[-1])\n",
    "    if algorithm==\"OptFTRL\":\n",
    "        xs_middle=[np.array([Q_map(ys_middle[-1][i],regularizers[i]) for i in range(num_players)])]\n",
    "        vs_middle=[payoff(xs_middle[-1],start_step)]\n",
    "    if algorithm==\"MirrorProx\":\n",
    "        xs.append(np.array([Q_map(ys[-1][i],regularizers[i]) for i in range(num_players)]))\n",
    "        xs_middle=[]\n",
    "        vs_middle=[]\n",
    "    \n",
    "    \n",
    "    for step in range(start_step,steps):\n",
    "        if print_step:\n",
    "            print(step)\n",
    "        if algorithm == \"FTRL\":\n",
    "            ys_curr = ys[-1]\n",
    "            xs_curr = np.array([Q_map(ys_curr[i],regularizers[i]) for i in range(num_players)])\n",
    "            xs.append(xs_curr)\n",
    "            vs=payoff(xs[-1],step)\n",
    "            ys_next = ys_curr + gamma(step)*vs\n",
    "            ys.append(ys_next)\n",
    "            \n",
    "        if algorithm == \"OptFTRL\":\n",
    "            #y(-1/2)\n",
    "            ys_middle_curr = ys_middle[-1]\n",
    "            \n",
    "            #x(-1/2)            \n",
    "            xs_middle_curr = xs_middle[-1]\n",
    "            \n",
    "            #v(-1/2)\n",
    "            vs_middle_curr = vs_middle[-1]\n",
    "            \n",
    "            #y(0)\n",
    "            ys_curr = ys[-1]\n",
    "            \n",
    "            #y(1/2)=y(0)+gamma*v(-1/2)\n",
    "            ys_middle_next = ys_curr + gamma(step)*vs_middle_curr\n",
    "            ys_middle.append(ys_middle_next)\n",
    "            \n",
    "            #y(1/2)\n",
    "            ys_middle_curr = ys_middle[-1]\n",
    "            \n",
    "            #x(1/2)\n",
    "            xs_middle_curr = np.array([Q_map(ys_middle_curr[i],regularizers[i]) for i in range(num_players)])\n",
    "            xs_middle.append(xs_middle_curr)\n",
    "            \n",
    "            #v(1/2)\n",
    "            vs_middle_curr = payoff(xs_middle_curr,step)\n",
    "            vs_middle.append(vs_middle_curr)\n",
    "            \n",
    "            \n",
    "            #y(1)=y(0)+gamma*v(1/2)\n",
    "            ys_next = ys_curr + gamma(step)*vs_middle_curr\n",
    "            ys.append(ys_next)\n",
    "            \n",
    "            #x(1)\n",
    "            xs_curr = np.array([Q_map(ys_next[i],regularizers[i]) for i in range(num_players)])\n",
    "            xs.append(xs_curr)\n",
    "\n",
    "        if algorithm == \"MirrorProx\":           \n",
    "            #y(0)\n",
    "            ys_curr = ys[-1]\n",
    "            \n",
    "            #x(0)\n",
    "            xs_curr = xs[-1]\n",
    "            x_agg = xs[-1]\n",
    "            #v(0)\n",
    "            vs_curr = payoff(x_agg,step)\n",
    "\n",
    "            \n",
    "            #y(1/2)=y(0)+gamma*v(0)\n",
    "            ys_middle_next = ys_curr + gamma(step)*vs_curr\n",
    "            ys_middle.append(ys_middle_next)\n",
    "            \n",
    "            #y(1/2)\n",
    "            ys_middle_curr = ys_middle[-1]\n",
    "            \n",
    "            #x(1/2)\n",
    "            xs_middle_curr = np.array([Q_map(ys_middle_curr[i],regularizers[i]) for i in range(num_players)])\n",
    "            xs_middle.append(xs_middle_curr)\n",
    "            \n",
    "            #v(1/2)\n",
    "            vs_middle_curr = payoff(xs_middle_curr,step)\n",
    "            vs_middle.append(vs_middle_curr)\n",
    "            \n",
    "            \n",
    "            #y(1)=y(0)+gamma*v(1/2)\n",
    "            ys_next = ys_curr + gamma(step)*vs_middle_curr\n",
    "            ys.append(ys_next)\n",
    "            \n",
    "            \n",
    "            #x(1)\n",
    "            xs_next=np.array([Q_map(ys_next[i],regularizers[i]) for i in range(num_players)])\n",
    "            xs.append(xs_next)\n",
    "            \n",
    "    return ys,xs"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "amber-economics",
   "metadata": {},
   "outputs": [],
   "source": [
    "def super_plot(bag_of_results,algorithmos,modeling):\n",
    "                \n",
    "    imarker=0\n",
    "    subsampling=1\n",
    "    markers=[\".\",\"o\",\"v\",\">\",\"8\",\"s\",\"*\",\"+\",\"x\",\"D\",\"2\"]\n",
    "    import matplotlib.pyplot as plt\n",
    "\n",
    "    SMALLER_SIZE = 10\n",
    "    SMALL_SIZE = 16\n",
    "    MEDIUM_SIZE = 24\n",
    "    BIGGER_SIZE = 28\n",
    "\n",
    "\n",
    "    plt.rc('font', size=SMALL_SIZE)          # controls default text sizes\n",
    "    plt.rc('axes', titlesize=SMALL_SIZE)     # fontsize of the axes title\n",
    "    plt.rc('axes', labelsize=MEDIUM_SIZE)    # fontsize of the x and y labels\n",
    "    plt.rc('xtick', labelsize=SMALL_SIZE)    # fontsize of the tick labels\n",
    "    plt.rc('ytick', labelsize=SMALL_SIZE)    # fontsize of the tick labels\n",
    "    plt.rc('legend', fontsize=SMALL_SIZE)    # legend fontsize\n",
    "    plt.rc('figure', titlesize=BIGGER_SIZE)  # fontsize of the figure title\n",
    "    plt.rcParams['lines.markersize']=SMALLER_SIZE           # controls default marker sizes\n",
    "\n",
    "    \n",
    "    \n",
    "    algos = [\"FTRL\",\"OptFTRL\",\"MirrorProx\"]\n",
    "    legend_regularizers={\"replicator\":'MWU',\"euclidean\":r'$\\ell_2$',\"logarithmic\":r'$\\log$'}\n",
    "    legend_names_payoff ={'Perfect Payoff':'Perfect',\n",
    "            'Imperfect Payoff with Uniform noise':'uniform',\n",
    "            'Imperfect Payoff with Truncated-Gaussian noise':'gaussian',\n",
    "            'Semi-Bandit Noiseless Payoff':'oracle',\n",
    "            'Bandit Noiseless Payoff':'bandit'}\n",
    "    bag_xs_cummulatives = {}\n",
    "    for key in bag_of_results[0]:\n",
    "        (c,b,a)=key\n",
    "        label_legend=a+'-'+legend_regularizers[b]+'-'+legend_names_payoff[c]\n",
    "        bag_xs_cummulatives[label_legend]=[]\n",
    "        \n",
    "    for results in bag_of_results:\n",
    "        for key in results:\n",
    "            (c,b,a)=key\n",
    "            label_legend=a+'-'+legend_regularizers[b]+'-'+legend_names_payoff[c]\n",
    "            ys,xs=results[key]\n",
    "            num_players=len(xs[-1])\n",
    "            steps=len(xs)\n",
    "            time_steps=list(range(0,steps,subsampling))\n",
    "        \n",
    "            xs_cummulative = [ np.array([0,0]) for t in range(len(xs))]\n",
    "            for t in time_steps:\n",
    "                for i in range(num_players):\n",
    "                    xs_cummulative[t]= xs_cummulative[t] + 1-xs[t][i]\n",
    "            #\n",
    "            #plt.plot(time_steps,[xs_cummulative[t][0] for t in time_steps])\n",
    "            #plt.show()\n",
    "            bag_xs_cummulatives[label_legend].append(xs_cummulative.copy())\n",
    "\n",
    "                        \n",
    " # STRATEGY 0\n",
    "    f = plt.figure(figsize=(16,8))\n",
    "    plt.title(Game+\"-\"+r'$\\|x^*-X_k\\|_1$')\n",
    "    for label_legend in bag_xs_cummulatives:\n",
    "        xs_list=bag_xs_cummulatives[label_legend]\n",
    "        xs_mean=[np.mean([xs[t][0]  for xs in xs_list]) for t in time_steps]\n",
    "        xs_min =[np.min([xs[t][0]  for xs in xs_list]) for t in time_steps]\n",
    "        xs_max =[np.max([xs[t][0]  for xs in xs_list]) for t in time_steps]\n",
    "        \n",
    "        base_line, = plt.semilogy(time_steps,xs_mean,label=label_legend)\n",
    "        plt.fill_between(time_steps, xs_min, xs_max, facecolor=base_line.get_color(), alpha=0.25)\n",
    "    plt.legend()\n",
    "    plt.ylim( (pow(10,-10),pow(10,0)) )\n",
    "    plt.xlabel('rounds')\n",
    "    plt.legend(loc='upper right')\n",
    "    plt.savefig(\"Appendix_\"+algorithmos+modeling+Game+style_step_size+'Strategy_0.pdf')\n",
    "    plt.tight_layout()\n",
    "    plt.show()\n",
    "    \n",
    "     # STRATEGY 1\n",
    "    f = plt.figure(figsize=(16,8))\n",
    "    plt.title(Game+\"-\"+r'$\\|x^*-X_k\\|_1$')\n",
    "    for label_legend in bag_xs_cummulatives:\n",
    "        xs_list=bag_xs_cummulatives[label_legend]\n",
    "        xs_mean=[np.mean([xs[t][1]  for xs in xs_list]) for t in time_steps]\n",
    "        xs_min =[np.min([xs[t][1]  for xs in xs_list]) for t in time_steps]\n",
    "        xs_max =[np.max([xs[t][1]  for xs in xs_list]) for t in time_steps]\n",
    "        \n",
    "        base_line, = plt.semilogy(time_steps,xs_mean,label=label_legend)\n",
    "        plt.fill_between(time_steps, xs_min, xs_max, facecolor=base_line.get_color(), alpha=0.25)\n",
    "    plt.legend()\n",
    "    plt.ylim( (pow(10,-10),pow(10,0)) )\n",
    "    plt.xlabel('rounds')\n",
    "    plt.legend(loc='upper right')\n",
    "    plt.savefig(\"Appendix_\"+algorithmos+modeling+Game+style_step_size+'Strategy_1.pdf')\n",
    "    plt.tight_layout()\n",
    "    plt.show()\n",
    "    return\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "quick-attribute",
   "metadata": {},
   "outputs": [],
   "source": [
    "algos = [\"FTRL\",\"OptFTRL\",\"MirrorProx\"]\n",
    "regularizers=[\"replicator\",\"euclidean\"]\n",
    "names_payoff =['Perfect Payoff',\n",
    "            'Imperfect Payoff with Uniform noise',\n",
    "            'Imperfect Payoff with Truncated-Gaussian noise',\n",
    "            'Semi-Bandit Noiseless Payoff',\n",
    "            'Bandit Noiseless Payoff']\n",
    "payoffs = [perfect_payoff,\n",
    "           imperfect_payoff,\n",
    "           truncgaussian_payoff,\n",
    "           semi_bandit_perfect_payoff,\n",
    "           bandit_perfect_payoff]\n",
    "\n",
    "settings=[(\"Battle of the Sexes\",2),(\"Pigou's Network\",2)]\n",
    "iterations=5"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "published-applicant",
   "metadata": {
    "scrolled": false
   },
   "outputs": [],
   "source": [
    "\n",
    "################################################################3\n",
    "\n",
    "names_payoff =['Semi-Bandit Noiseless Payoff',\n",
    "            'Bandit Noiseless Payoff']\n",
    "payoffs = [semi_bandit_perfect_payoff,\n",
    "           bandit_perfect_payoff]\n",
    "\n",
    "for algo in algos:\n",
    "    for Game,num_players in settings:\n",
    "        for style_step_size in [\"constant step size\",\"polynomial step size\"]:\n",
    "            bag_of_results = []\n",
    "            for iteration in range(iterations):\n",
    "                print(iteration)\n",
    "                ys_initial = np.array([np.random.rand(1,2)[0] for i in range(num_players)])\n",
    "                ys_middle_initial = np.array([np.random.rand(1,2)[0] for i in range(num_players)])\n",
    "\n",
    "                results = {}\n",
    "                for reg in regularizers:\n",
    "                    for payoff,name in zip(payoffs,names_payoff):\n",
    "                        print(Game+' '+name+' '+reg+' '+algo+' '+style_step_size)\n",
    "                        regs = [reg for i in range(num_players)]\n",
    "                        ys = [ys_initial]\n",
    "                        xs = []      \n",
    "                        ys_middle = [ys_middle_initial]\n",
    "                        steps = 1500\n",
    "                        ys,xs=experiment(ys,ys_middle,xs,steps,payoff,regs,algorithm=algo)\n",
    "                        results[(name,reg,algo)]=ys,xs\n",
    "                bag_of_results.append(dict(results))\n",
    "            print('PLOT')\n",
    "            super_plot(bag_of_results,algo,'bandit')\n",
    "################################################################3\n",
    "\n",
    "names_payoff =['Perfect Payoff',\n",
    "            'Imperfect Payoff with Uniform noise',\n",
    "            'Imperfect Payoff with Truncated-Gaussian noise']\n",
    "\n",
    "payoffs = [perfect_payoff,\n",
    "           imperfect_payoff,\n",
    "           truncgaussian_payoff]\n",
    "\n",
    "for algo in algos:\n",
    "    for Game,num_players in settings:\n",
    "        for style_step_size in [\"constant step size\",\"polynomial step size\"]:\n",
    "            bag_of_results = []\n",
    "            for iteration in range(iterations):\n",
    "                print(iteration)\n",
    "                ys_initial = np.array([np.random.rand(1,2)[0] for i in range(num_players)])\n",
    "                ys_middle_initial = np.array([np.random.rand(1,2)[0] for i in range(num_players)])\n",
    "\n",
    "                results = {}\n",
    "                for reg in regularizers:\n",
    "                    for payoff,name in zip(payoffs,names_payoff):\n",
    "                        print(Game+' '+name+' '+reg+' '+algo+' '+style_step_size)\n",
    "                        regs = [reg for i in range(num_players)]\n",
    "                        ys = [ys_initial]\n",
    "                        xs = []      \n",
    "                        ys_middle = [ys_middle_initial]\n",
    "                        steps = 2000\n",
    "                        ys,xs=experiment(ys,ys_middle,xs,steps,payoff,regs,algorithm=algo)\n",
    "                        results[(name,reg,algo)]=ys,xs\n",
    "                bag_of_results.append(dict(results))\n",
    "            print('PLOT')\n",
    "            super_plot(bag_of_results,algo,'random')\n",
    "################################################################3"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "sunrise-passport",
   "metadata": {},
   "outputs": [],
   "source": [
    "names_payoff =[\n",
    "            'Imperfect Payoff with Uniform noise',\n",
    "            'Imperfect Payoff with Truncated-Gaussian noise']\n",
    "\n",
    "payoffs = [\n",
    "           imperfect_payoff,\n",
    "           truncgaussian_payoff]\n",
    "\n",
    "for algo in algos:\n",
    "    for Game,num_players in settings:\n",
    "        for style_step_size in [\"constant step size\",\"polynomial step size\"]:\n",
    "            bag_of_results = []\n",
    "            for iteration in range(iterations):\n",
    "                print(iteration)\n",
    "                ys_initial = np.array([np.random.rand(1,2)[0] for i in range(num_players)])\n",
    "                ys_middle_initial = np.array([np.random.rand(1,2)[0] for i in range(num_players)])\n",
    "\n",
    "                results = {}\n",
    "                for reg in regularizers:\n",
    "                    for payoff,name in zip(payoffs,names_payoff):\n",
    "                        print(Game+' '+name+' '+reg+' '+algo+' '+style_step_size)\n",
    "                        regs = [reg for i in range(num_players)]\n",
    "                        ys = [ys_initial]\n",
    "                        xs = []      \n",
    "                        ys_middle = [ys_middle_initial]\n",
    "                        steps = 2000\n",
    "                        ys,xs=experiment(ys,ys_middle,xs,steps,payoff,regs,algorithm=algo)\n",
    "                        results[(name,reg,algo)]=ys,xs\n",
    "                bag_of_results.append(dict(results))\n",
    "            print('PLOT')\n",
    "            super_plot(bag_of_results,algo,'random')"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.1"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
