{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Code was run on Colab"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import math\n",
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n",
    "import numpy as np\n",
    "import collections\n",
    "import torch.optim as optim\n",
    "from torch.optim import Optimizer\n",
    "import time\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "from AdamW          import AdamW\n",
    "from utils          import utility, misreportUtility, misreportOptimization, trueUtility, loss\n",
    "from networks       import AdditiveMechanism, Misreports\n",
    "from restrictedAdam import Adam "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "device = 'cuda' if torch.cuda.is_available() else 'cpu'"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Set Random Seed "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Initializing seeds\n",
    "torch.manual_seed(42)\n",
    "np.random.seed(42)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def test(nBatch, nbrInit, R, gamma=0.001, minimum=0, maximum=1):\n",
    "    \n",
    "    \"\"\" This function computes the regret and payment of mechanism on a test set of size nBatch\n",
    "        The optimal misreport is computed by optimizing the utility function (not by using the Misreport network)\n",
    "        for R gradient steps (of stepsize gamma) and starting from nbrInit initialization, we only keep the best misreport\n",
    "        To compute the regret we evaluate the mechanism at the misreport and compare to the valuation\n",
    "        minimum and maximum indicate the range of the valuations\n",
    "    \"\"\"\n",
    "    \n",
    "    true = np.random.rand(nBatch,nAgent,nObject)\n",
    "\n",
    "    localMisreports     = np.random.rand(nBatch,nbrInit,nAgent,nObject)\n",
    "    batchMisreports     = torch.tensor(localMisreports).float().to(device)\n",
    "    batchTrueValuations = torch.tensor(true).float().to(device)\n",
    "    batchMisreports.requires_grad = True\n",
    "    \n",
    "    opt = Adam([batchMisreports], lr=gamma)\n",
    "    \n",
    "    for k in range(R):\n",
    "        advU         = misreportUtility(mechanism,batchTrueValuations,batchMisreports)\n",
    "        los          =  -1*torch.mean(advU).to(device)\n",
    "        los.backward()\n",
    "        opt.step(restricted= True, min=minimum, max=maximum)\n",
    "        opt.zero_grad()\n",
    "    \n",
    "    misReportUtilityMax  = torch.max(advU, dim =1)[0]\n",
    "    mechanism.zero_grad()\n",
    "    allocation, payment = mechanism(batchTrueValuations)\n",
    "    regret = F.relu(misReportUtilityMax -utility(batchTrueValuations, allocation, payment))\n",
    "    mregret= torch.sum(torch.mean(regret, dim=0)).to(device)\n",
    "    mregret= float(mregret.cpu().detach().numpy())\n",
    "\n",
    "    with torch.no_grad():\n",
    "        l,rMean,p = loss(payment, regret)\n",
    "\n",
    "    testRegret.append(mregret)\n",
    "    testPayment.append(float(p.detach().cpu().numpy() ))\n",
    "    testOptimal.append(float((-l).detach().cpu().numpy())**2)\n",
    "    \n",
    "    print(\"Total regret: \",'{0:.5f}'.format(mregret), \"Average regret per bidder: \",'{0:.5f}'.format(mregret/nAgent), \" Optimal Revenue: \",'{0:.3f}'.format(float((-l).detach().cpu().numpy())**2), \" payment: \",'{0:.3f}'.format(float(p.detach().cpu().numpy() )))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "nAgent   = 1\n",
    "nObject  = 10\n",
    "\n",
    "# Parameters for the mechanism (payment and allocation network)\n",
    "nLayersAllocation   = 5\n",
    "nLayersPayment      = 5\n",
    "widthAllocation     = 100\n",
    "widthPayment        = 100\n",
    "\n",
    "# Parameters for the misreport network\n",
    "nLayersMisreport    = 5\n",
    "widthMisreport      = 100\n",
    "\n",
    "gamma              = 0.001 \n",
    "testBatch          = 10000\n",
    "\n",
    "nExperiments       = 100000\n",
    "batchSize          = 500\n",
    "nbrBatches         = int(nExperiments/batchSize)\n",
    "\n",
    "\n",
    "mechanism            = AdditiveMechanism(nAgent, nObject, nLayersAllocation, widthAllocation).to(device)\n",
    "optimizerMechanism   = AdamW(mechanism.parameters(), lr=0.0005)\n",
    "\n",
    "misreport            = Misreports(nAgent,nObject,nLayersMisreport, widthMisreport).to(device)\n",
    "optimizerMisreport   = AdamW(misreport.parameters(), lr=0.0005)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "testRegret    = []\n",
    "testMaxRegret = []\n",
    "testPayment   = []\n",
    "testOptimal   = []\n",
    "testTime      = []\n",
    "testIteration = [0]\n",
    "\n",
    "# range of valuations\n",
    "minimum            = 0\n",
    "maximum            = 1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Initial Test\n",
      "Total regret:  1.03706 Average regret per bidder:  1.03706  Optimal Revenue:  1.417  payment:  0.749\n",
      "Batch:  2\n",
      "Total regret:  0.01789 Average regret per bidder:  0.01789  Optimal Revenue:  2.721  payment:  3.244\n",
      "Batch:  4\n",
      "Total regret:  0.01591 Average regret per bidder:  0.01591  Optimal Revenue:  2.968  payment:  3.478\n",
      "Batch:  6\n",
      "Total regret:  0.01376 Average regret per bidder:  0.01376  Optimal Revenue:  2.906  payment:  3.370\n",
      "Batch:  8\n",
      "Total regret:  0.00946 Average regret per bidder:  0.00946  Optimal Revenue:  2.951  payment:  3.329\n",
      "Batch:  10\n",
      "Total regret:  0.01645 Average regret per bidder:  0.01645  Optimal Revenue:  2.941  payment:  3.459\n",
      "Batch:  12\n",
      "Total regret:  0.01354 Average regret per bidder:  0.01354  Optimal Revenue:  2.883  payment:  3.341\n",
      "Batch:  14\n",
      "Total regret:  0.00411 Average regret per bidder:  0.00411  Optimal Revenue:  3.203  payment:  3.452\n",
      "Batch:  16\n",
      "Total regret:  0.00478 Average regret per bidder:  0.00478  Optimal Revenue:  3.142  payment:  3.410\n",
      "Batch:  18\n",
      "Total regret:  0.00441 Average regret per bidder:  0.00441  Optimal Revenue:  3.015  payment:  3.266\n",
      "Batch:  20\n",
      "Total regret:  0.00406 Average regret per bidder:  0.00406  Optimal Revenue:  3.227  payment:  3.475\n",
      "Batch:  22\n",
      "Total regret:  0.00392 Average regret per bidder:  0.00392  Optimal Revenue:  2.970  payment:  3.204\n",
      "Batch:  24\n",
      "Total regret:  0.00296 Average regret per bidder:  0.00296  Optimal Revenue:  3.252  payment:  3.462\n",
      "Batch:  26\n",
      "Total regret:  0.00657 Average regret per bidder:  0.00657  Optimal Revenue:  2.934  payment:  3.242\n",
      "Batch:  28\n",
      "Total regret:  0.00274 Average regret per bidder:  0.00274  Optimal Revenue:  3.162  payment:  3.361\n",
      "Batch:  30\n",
      "Total regret:  0.01059 Average regret per bidder:  0.01059  Optimal Revenue:  3.175  payment:  3.593\n",
      "Batch:  32\n",
      "Total regret:  0.00377 Average regret per bidder:  0.00377  Optimal Revenue:  3.106  payment:  3.340\n",
      "Batch:  34\n",
      "Total regret:  0.00578 Average regret per bidder:  0.00578  Optimal Revenue:  3.137  payment:  3.433\n",
      "Batch:  36\n",
      "Total regret:  0.00181 Average regret per bidder:  0.00181  Optimal Revenue:  3.405  payment:  3.570\n",
      "Batch:  38\n",
      "Total regret:  0.00166 Average regret per bidder:  0.00166  Optimal Revenue:  3.300  payment:  3.455\n",
      "Batch:  40\n",
      "Total regret:  0.00278 Average regret per bidder:  0.00278  Optimal Revenue:  3.269  payment:  3.473\n",
      "Batch:  42\n",
      "Total regret:  0.00211 Average regret per bidder:  0.00211  Optimal Revenue:  3.257  payment:  3.433\n",
      "Batch:  44\n",
      "Total regret:  0.00183 Average regret per bidder:  0.00183  Optimal Revenue:  3.383  payment:  3.549\n",
      "Batch:  46\n",
      "Total regret:  0.00140 Average regret per bidder:  0.00140  Optimal Revenue:  3.357  payment:  3.500\n",
      "Batch:  48\n",
      "Total regret:  0.00100 Average regret per bidder:  0.00100  Optimal Revenue:  3.315  payment:  3.435\n",
      "Batch:  50\n",
      "Total regret:  0.00219 Average regret per bidder:  0.00219  Optimal Revenue:  3.143  payment:  3.319\n",
      "Batch:  52\n",
      "Total regret:  0.00162 Average regret per bidder:  0.00162  Optimal Revenue:  3.322  payment:  3.477\n",
      "Batch:  54\n",
      "Total regret:  0.00112 Average regret per bidder:  0.00112  Optimal Revenue:  3.500  payment:  3.630\n",
      "Batch:  56\n",
      "Total regret:  0.00271 Average regret per bidder:  0.00271  Optimal Revenue:  3.252  payment:  3.453\n",
      "Batch:  58\n",
      "Total regret:  0.00290 Average regret per bidder:  0.00290  Optimal Revenue:  3.103  payment:  3.306\n",
      "Batch:  60\n",
      "Total regret:  0.00286 Average regret per bidder:  0.00286  Optimal Revenue:  3.294  payment:  3.501\n"
     ]
    }
   ],
   "source": [
    "duration   = 0\n",
    "R          = 100\n",
    "\n",
    "i=0\n",
    "\n",
    "print(\"Initial Test\")\n",
    "test(50, nbrInit=300, R=300, gamma=0.001, minimum=0, maximum=1)\n",
    "\n",
    "for t in range(1,60*nbrBatches+1):\n",
    "    \n",
    "    # Reinitialize Misreport network periodically at the beginning of training\n",
    "    if (t%(4*nbrBatches) ==1):\n",
    "      if   t< 20*nbrBatches+2 :\n",
    "    \n",
    "        misreport            = Misreports(nAgent,nObject,nLayersMisreport, widthMisreport).to(device)\n",
    "        optimizerMisreport   = AdamW(misreport.parameters(), lr=0.0005)\n",
    "\n",
    "    batchTrueValuations = torch.tensor(np.random.rand(batchSize,nAgent,nObject)).float().to(device)\n",
    "    \n",
    "    # Optimize Misreport Network for R steps\n",
    "    for k in range(R):\n",
    "  \n",
    "        misreports          = misreport(batchTrueValuations).unsqueeze(1)\n",
    "        mUtility            = misreportUtility(mechanism,batchTrueValuations,misreports).squeeze(1)\n",
    "        mLoss               = torch.sum(torch.mean(-mUtility,dim=0))\n",
    "\n",
    "        optimizerMisreport.zero_grad()\n",
    "        mLoss.backward()\n",
    "        optimizerMisreport.step()\n",
    "\n",
    "    \n",
    "    # Optimize Mechanism network for one step\n",
    "    misreports          = misreport(batchTrueValuations).unsqueeze(1)\n",
    "    mUtility            = misreportUtility(mechanism,batchTrueValuations,misreports).squeeze(1)\n",
    "\n",
    "    allocation, payment = mechanism(batchTrueValuations)\n",
    "\n",
    "    regret     = F.relu(mUtility -utility(batchTrueValuations, allocation, payment))\n",
    "    l,rMean,p = loss(payment, regret)\n",
    "        \n",
    "    optimizerMechanism.zero_grad()\n",
    "\n",
    "    l.backward()\n",
    "\n",
    "    optimizerMechanism.step()\n",
    "    \n",
    "    # Test mechanism periodically\n",
    "    if t % (2*nbrBatches)==0 :\n",
    "        print(\"Batch: \", 2*int(t/(2*nbrBatches)))\n",
    "        testTime.append(duration)\n",
    "        testIteration.append(t/nbrBatches)\n",
    "        test(100, nbrInit=300, R=300, gamma=0.001, minimum=0, maximum=1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Total regret:  0.00194 Average regret per bidder:  0.00194  Optimal Revenue:  3.346  payment:  3.517\n",
      "Total regret:  0.00179 Average regret per bidder:  0.00179  Optimal Revenue:  3.292  payment:  3.453\n",
      "Total regret:  0.00195 Average regret per bidder:  0.00195  Optimal Revenue:  3.272  payment:  3.441\n",
      "Total regret:  0.00185 Average regret per bidder:  0.00185  Optimal Revenue:  3.262  payment:  3.426\n",
      "Total regret:  0.00202 Average regret per bidder:  0.00202  Optimal Revenue:  3.298  payment:  3.471\n",
      "Total regret:  0.00185 Average regret per bidder:  0.00185  Optimal Revenue:  3.335  payment:  3.501\n",
      "Total regret:  0.00209 Average regret per bidder:  0.00209  Optimal Revenue:  3.204  payment:  3.378\n",
      "Total regret:  0.00186 Average regret per bidder:  0.00186  Optimal Revenue:  3.288  payment:  3.453\n",
      "Total regret:  0.00196 Average regret per bidder:  0.00196  Optimal Revenue:  3.319  payment:  3.490\n",
      "Total regret:  0.00193 Average regret per bidder:  0.00193  Optimal Revenue:  3.334  payment:  3.504\n"
     ]
    }
   ],
   "source": [
    "# Final Tests\n",
    "for i in range(10):\n",
    "  test(1000, nbrInit=300, R=300, gamma=0.001, minimum=0, maximum=1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Final Result\n",
      "Total Regret =  0.00193 Average regret per bidder:  0.00193  Optimal Revenue:  3.302  payment:  3.463\n"
     ]
    }
   ],
   "source": [
    "totalregret = np.mean(np.array(testRegret[-10:]))\n",
    "revenue     = np.mean(np.array(testPayment[-10:]))\n",
    "print(\"Final Result\")\n",
    "print(\"Total Regret = \", '{0:.5f}'.format(totalregret), \"Average regret per bidder: \",'{0:.5f}'.format(totalregret/nAgent), \" Optimal Revenue: \",'{0:.3f}'.format(float(np.sqrt(revenue)-np.sqrt(totalregret))**2), \" payment: \",'{0:.3f}'.format(revenue))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "std Regret =  0.00009 std regret per bidder:  0.00009  std payment:  0.040\n"
     ]
    }
   ],
   "source": [
    "stdregret = np.std(np.array(testRegret[-10:]))\n",
    "stdrevenue= np.std(np.array(testPayment[-10:]))\n",
    "print(\"std Regret = \", '{0:.5f}'.format(stdregret), \"std regret per bidder: \",'{0:.5f}'.format(stdregret/nAgent), \" std payment: \",'{0:.3f}'.format(stdrevenue))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
