{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Code was run on Colab"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import math\n",
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n",
    "import numpy as np\n",
    "import collections\n",
    "import torch.optim as optim\n",
    "from torch.optim import Optimizer\n",
    "import time\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "from AdamW          import AdamW\n",
    "from utils          import utility, misreportUtility, misreportOptimization, trueUtility, loss\n",
    "from networks       import AdditiveMechanism, Misreports\n",
    "from restrictedAdam import Adam "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "device = 'cuda' if torch.cuda.is_available() else 'cpu'"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Set Random Seed "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Initializing seeds\n",
    "torch.manual_seed(42)\n",
    "np.random.seed(42)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Testing Function\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "def test(nBatch, nbrInit, R, gamma=0.001, minimum=0, maximum=1):\n",
    "    \n",
    "    \"\"\" This function computes the regret and payment of mechanism on a test set of size nBatch\n",
    "        The optimal misreport is computed by optimizing the utility function (not by using the Misreport network)\n",
    "        for R gradient steps (of stepsize gamma) and starting from nbrInit initialization, we only keep the best misreport\n",
    "        To compute the regret we evaluate the mechanism at the misreport and compare to the valuation\n",
    "        minimum and maximum indicate the range of the valuations\n",
    "    \"\"\"\n",
    "    \n",
    "    true = np.random.rand(nBatch,nAgent,nObject)\n",
    "\n",
    "    localMisreports     = np.random.rand(nBatch,nbrInit,nAgent,nObject)\n",
    "    batchMisreports     = torch.tensor(localMisreports).float().to(device)\n",
    "    batchTrueValuations = torch.tensor(true).float().to(device)\n",
    "    batchMisreports.requires_grad = True\n",
    "    \n",
    "    opt = Adam([batchMisreports], lr=gamma)\n",
    "    \n",
    "    for k in range(R):\n",
    "        advU         = misreportUtility(mechanism,batchTrueValuations,batchMisreports)\n",
    "        los          =  -1*torch.mean(advU).to(device)\n",
    "        los.backward()\n",
    "        opt.step(restricted= True, min=minimum, max=maximum)\n",
    "        opt.zero_grad()\n",
    "    \n",
    "    misReportUtilityMax  = torch.max(advU, dim =1)[0]\n",
    "    mechanism.zero_grad()\n",
    "    allocation, payment = mechanism(batchTrueValuations)\n",
    "    regret = F.relu(misReportUtilityMax -utility(batchTrueValuations, allocation, payment))\n",
    "    mregret= torch.sum(torch.mean(regret, dim=0)).to(device)\n",
    "    mregret= float(mregret.cpu().detach().numpy())\n",
    "\n",
    "    with torch.no_grad():\n",
    "        l,rMean,p = loss(payment, regret)\n",
    "\n",
    "    testRegret.append(mregret)\n",
    "    testPayment.append(float(p.detach().cpu().numpy() ))\n",
    "    testOptimal.append(float((-l).detach().cpu().numpy())**2)\n",
    "    \n",
    "    print(\"Total regret: \",'{0:.5f}'.format(mregret), \"Average regret per bidder: \",'{0:.5f}'.format(mregret/nAgent), \" Optimal Revenue: \",'{0:.3f}'.format(float((-l).detach().cpu().numpy())**2), \" payment: \",'{0:.3f}'.format(float(p.detach().cpu().numpy() )))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Initializing Networks"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "nAgent   = 2\n",
    "nObject  = 2\n",
    "\n",
    "# Parameters for the mechanism (payment and allocation network)\n",
    "nLayersAllocation   = 5\n",
    "nLayersPayment      = 5\n",
    "widthAllocation     = 200\n",
    "widthPayment        = 200\n",
    "\n",
    "# Parameters for the misreport network\n",
    "nLayersMisreport    = 5\n",
    "widthMisreport      = 200\n",
    "\n",
    "gamma              = 0.001 \n",
    "testBatch          = 10000\n",
    "\n",
    "nExperiments       = 100000\n",
    "batchSize          = 500\n",
    "nbrBatches         = int(nExperiments/batchSize)\n",
    "\n",
    "\n",
    "mechanism            = AdditiveMechanism(nAgent, nObject, nLayersAllocation, widthAllocation).to(device)\n",
    "optimizerMechanism   = AdamW(mechanism.parameters(), lr=0.0005)\n",
    "\n",
    "misreport            = Misreports(nAgent,nObject,nLayersMisreport, widthMisreport).to(device)\n",
    "optimizerMisreport   = AdamW(misreport.parameters(), lr=0.0005)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "testRegret    = []\n",
    "testMaxRegret = []\n",
    "testPayment   = []\n",
    "testOptimal   = []\n",
    "testTime      = []\n",
    "testIteration = [0]\n",
    "\n",
    "# range of valuations\n",
    "minimum            = 0\n",
    "maximum            = 1"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Training"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Initial Test\n",
      "Total regret:  0.21250 Average regret per bidder:  0.10625  Optimal Revenue:  0.006  payment:  0.356\n",
      "Batch:  4\n",
      "Total regret:  0.00273 Average regret per bidder:  0.00136  Optimal Revenue:  0.785  payment:  0.885\n",
      "Batch:  8\n",
      "Total regret:  0.00122 Average regret per bidder:  0.00061  Optimal Revenue:  0.802  payment:  0.868\n",
      "Batch:  12\n",
      "Total regret:  0.00205 Average regret per bidder:  0.00103  Optimal Revenue:  0.797  payment:  0.884\n",
      "Batch:  16\n",
      "Total regret:  0.00150 Average regret per bidder:  0.00075  Optimal Revenue:  0.779  payment:  0.851\n",
      "Batch:  20\n",
      "Total regret:  0.00142 Average regret per bidder:  0.00071  Optimal Revenue:  0.752  payment:  0.822\n",
      "Batch:  24\n",
      "Total regret:  0.00227 Average regret per bidder:  0.00114  Optimal Revenue:  0.827  payment:  0.920\n",
      "Batch:  28\n",
      "Total regret:  0.00166 Average regret per bidder:  0.00083  Optimal Revenue:  0.877  payment:  0.958\n",
      "Batch:  32\n",
      "Total regret:  0.00088 Average regret per bidder:  0.00044  Optimal Revenue:  0.744  payment:  0.798\n",
      "Batch:  36\n",
      "Total regret:  0.00090 Average regret per bidder:  0.00045  Optimal Revenue:  0.857  payment:  0.915\n",
      "Batch:  40\n",
      "Total regret:  0.00087 Average regret per bidder:  0.00044  Optimal Revenue:  0.764  payment:  0.818\n",
      "Batch:  44\n",
      "Total regret:  0.00107 Average regret per bidder:  0.00053  Optimal Revenue:  0.852  payment:  0.915\n",
      "Batch:  48\n",
      "Total regret:  0.00103 Average regret per bidder:  0.00051  Optimal Revenue:  0.856  payment:  0.919\n",
      "Batch:  52\n",
      "Total regret:  0.00120 Average regret per bidder:  0.00060  Optimal Revenue:  0.814  payment:  0.880\n",
      "Batch:  56\n",
      "Total regret:  0.00129 Average regret per bidder:  0.00065  Optimal Revenue:  0.773  payment:  0.840\n",
      "Batch:  60\n",
      "Total regret:  0.00103 Average regret per bidder:  0.00052  Optimal Revenue:  0.766  payment:  0.826\n"
     ]
    }
   ],
   "source": [
    "duration   = 0\n",
    "R          = 100\n",
    "\n",
    "i=0\n",
    "\n",
    "print(\"Initial Test\")\n",
    "test(50, nbrInit=300, R=300, gamma=0.001, minimum=0, maximum=1)\n",
    "\n",
    "for t in range(1,60*nbrBatches+1):\n",
    "    \n",
    "    # Reinitialize Misreport network periodically at the beginning of training\n",
    "    if (t%(4*nbrBatches) ==1):\n",
    "      if   t< 20*nbrBatches+2 :\n",
    "    \n",
    "        misreport            = Misreports(nAgent,nObject,nLayersMisreport, widthMisreport).to(device)\n",
    "        optimizerMisreport   = AdamW(misreport.parameters(), lr=0.0005)\n",
    "\n",
    "    batchTrueValuations = torch.tensor(np.random.rand(batchSize,nAgent,nObject)).float().to(device)\n",
    "    \n",
    "    # Optimize Misreport Network for R steps\n",
    "    for k in range(R):\n",
    "  \n",
    "        misreports          = misreport(batchTrueValuations).unsqueeze(1)\n",
    "        mUtility            = misreportUtility(mechanism,batchTrueValuations,misreports).squeeze(1)\n",
    "        mLoss               = torch.sum(torch.mean(-mUtility,dim=0))\n",
    "\n",
    "        optimizerMisreport.zero_grad()\n",
    "        mLoss.backward()\n",
    "        optimizerMisreport.step()\n",
    "\n",
    "    \n",
    "    # Optimize Mechanism network for one step\n",
    "    misreports          = misreport(batchTrueValuations).unsqueeze(1)\n",
    "    mUtility            = misreportUtility(mechanism,batchTrueValuations,misreports).squeeze(1)\n",
    "\n",
    "    allocation, payment = mechanism(batchTrueValuations)\n",
    "\n",
    "    regret     = F.relu(mUtility -utility(batchTrueValuations, allocation, payment))\n",
    "    l,rMean,p = loss(payment, regret)\n",
    "        \n",
    "    optimizerMechanism.zero_grad()\n",
    "\n",
    "    l.backward()\n",
    "\n",
    "    optimizerMechanism.step()\n",
    "    \n",
    "    # Test mechanism periodically\n",
    "    if t % (4*nbrBatches)==0 :\n",
    "        print(\"Batch: \", 2*int(t/(2*nbrBatches)))\n",
    "        testTime.append(duration)\n",
    "        testIteration.append(t/nbrBatches)\n",
    "        test(100, nbrInit=300, R=300, gamma=0.001, minimum=0, maximum=1)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Testing"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Total regret:  0.00113 Average regret per bidder:  0.00057  Optimal Revenue:  0.821  payment:  0.886\n",
      "Total regret:  0.00112 Average regret per bidder:  0.00056  Optimal Revenue:  0.803  payment:  0.866\n",
      "Total regret:  0.00111 Average regret per bidder:  0.00056  Optimal Revenue:  0.841  payment:  0.905\n",
      "Total regret:  0.00113 Average regret per bidder:  0.00057  Optimal Revenue:  0.813  payment:  0.877\n",
      "Total regret:  0.00109 Average regret per bidder:  0.00055  Optimal Revenue:  0.811  payment:  0.873\n",
      "Total regret:  0.00111 Average regret per bidder:  0.00055  Optimal Revenue:  0.809  payment:  0.872\n",
      "Total regret:  0.00116 Average regret per bidder:  0.00058  Optimal Revenue:  0.820  payment:  0.885\n",
      "Total regret:  0.00106 Average regret per bidder:  0.00053  Optimal Revenue:  0.809  payment:  0.870\n",
      "Total regret:  0.00105 Average regret per bidder:  0.00052  Optimal Revenue:  0.835  payment:  0.897\n",
      "Total regret:  0.00110 Average regret per bidder:  0.00055  Optimal Revenue:  0.795  payment:  0.857\n"
     ]
    }
   ],
   "source": [
    "for i in range(10):\n",
    "  test(1000, nbrInit=300, R=300, gamma=0.001, minimum=0, maximum=1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Final Result\n",
      "Total Regret =  0.00111 Average regret per bidder:  0.00055  Optimal Revenue:  0.818  payment:  0.879\n"
     ]
    }
   ],
   "source": [
    "totalregret = np.mean(np.array(testRegret[-10:]))\n",
    "revenue     = np.mean(np.array(testPayment[-10:]))\n",
    "print(\"Final Result\")\n",
    "print(\"Total Regret = \", '{0:.5f}'.format(totalregret), \"Average regret per bidder: \",'{0:.5f}'.format(totalregret/nAgent), \" Optimal Revenue: \",'{0:.3f}'.format(float(np.sqrt(revenue)-np.sqrt(totalregret))**2), \" payment: \",'{0:.3f}'.format(revenue))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "std Regret =  0.00003 std regret per bidder:  0.00002  std payment:  0.014\n"
     ]
    }
   ],
   "source": [
    "stdregret = np.std(np.array(testRegret[-10:]))\n",
    "stdrevenue= np.std(np.array(testPayment[-10:]))\n",
    "print(\"std Regret = \", '{0:.5f}'.format(stdregret), \"std regret per bidder: \",'{0:.5f}'.format(stdregret/nAgent), \" std payment: \",'{0:.3f}'.format(stdrevenue))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
