{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Code was run on Colab Pro"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import math\n",
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n",
    "import numpy as np\n",
    "import collections\n",
    "import torch.optim as optim\n",
    "from torch.optim import Optimizer\n",
    "import time\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "from AdamW          import AdamW\n",
    "from utils          import utility, misreportUtility, misreportOptimization, trueUtility, loss\n",
    "from networks       import AdditiveMechanism, Misreports\n",
    "from restrictedAdam import Adam "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "device = 'cuda' if torch.cuda.is_available() else 'cpu'"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Set Random Seed \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Initializing seeds\n",
    "torch.manual_seed(42)\n",
    "np.random.seed(42)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Testing Function\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "def test(nBatch, nbrInit, R, gamma=0.001, minimum=0, maximum=1):\n",
    "    \n",
    "    \"\"\" This function computes the regret and payment of mechanism on a test set of size nBatch\n",
    "        The optimal misreport is computed by optimizing the utility function (not by using the Misreport network)\n",
    "        for R gradient steps (of stepsize gamma) and starting from nbrInit initialization, we only keep the best misreport\n",
    "        To compute the regret we evaluate the mechanism at the misreport and compare to the valuation\n",
    "        minimum and maximum indicate the range of the valuations\n",
    "    \"\"\"\n",
    "    \n",
    "    true = np.random.rand(nBatch,nAgent,nObject)\n",
    "\n",
    "    localMisreports     = np.random.rand(nBatch,nbrInit,nAgent,nObject)\n",
    "    batchMisreports     = torch.tensor(localMisreports).float().to(device)\n",
    "    batchTrueValuations = torch.tensor(true).float().to(device)\n",
    "    batchMisreports.requires_grad = True\n",
    "    \n",
    "    opt = Adam([batchMisreports], lr=gamma)\n",
    "    \n",
    "    for k in range(R):\n",
    "        advU         = misreportUtility(mechanism,batchTrueValuations,batchMisreports)\n",
    "        los          =  -1*torch.mean(advU).to(device)\n",
    "        los.backward()\n",
    "        opt.step(restricted= True, min=minimum, max=maximum)\n",
    "        opt.zero_grad()\n",
    "    \n",
    "    misReportUtilityMax  = torch.max(advU, dim =1)[0]\n",
    "    mechanism.zero_grad()\n",
    "    allocation, payment = mechanism(batchTrueValuations)\n",
    "    regret = F.relu(misReportUtilityMax -utility(batchTrueValuations, allocation, payment))\n",
    "    mregret= torch.sum(torch.mean(regret, dim=0)).to(device)\n",
    "    mregret= float(mregret.cpu().detach().numpy())\n",
    "\n",
    "    with torch.no_grad():\n",
    "        l,rMean,p = loss(payment, regret)\n",
    "\n",
    "    testRegret.append(mregret)\n",
    "    testPayment.append(float(p.detach().cpu().numpy() ))\n",
    "    testOptimal.append(float((-l).detach().cpu().numpy())**2)\n",
    "    \n",
    "    print(\"Total regret: \",'{0:.5f}'.format(mregret), \"Average regret per bidder: \",'{0:.5f}'.format(mregret/nAgent), \" Optimal Revenue: \",'{0:.3f}'.format(float((-l).detach().cpu().numpy())**2), \" payment: \",'{0:.3f}'.format(float(p.detach().cpu().numpy() )))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Initializing Networks"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "nAgent   = 3\n",
    "nObject  = 10\n",
    "\n",
    "# Parameters for the mechanism (payment and allocation network)\n",
    "nLayersAllocation   = 7\n",
    "nLayersPayment      = 7\n",
    "widthAllocation     = 100\n",
    "widthPayment        = 100\n",
    "\n",
    "# Parameters for the misreport network\n",
    "nLayersMisreport    = 7\n",
    "widthMisreport      = 100\n",
    "\n",
    "gamma              = 0.001 \n",
    "testBatch          = 10000\n",
    "\n",
    "nExperiments       = 200000\n",
    "batchSize          = 500\n",
    "nbrBatches         = int(nExperiments/batchSize)\n",
    "\n",
    "\n",
    "mechanism            = AdditiveMechanism(nAgent, nObject, nLayersAllocation, widthAllocation).to(device)\n",
    "optimizerMechanism   = AdamW(mechanism.parameters(), lr=0.001)\n",
    "\n",
    "misreport            = Misreports(nAgent,nObject,nLayersMisreport, widthMisreport).to(device)\n",
    "optimizerMisreport   = AdamW(misreport.parameters(), lr=0.001)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "testRegret    = []\n",
    "testMaxRegret = []\n",
    "testPayment   = []\n",
    "testOptimal   = []\n",
    "testTime      = []\n",
    "testIteration = [0]\n",
    "\n",
    "# range of valuations\n",
    "minimum            = 0\n",
    "maximum            = 1"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Training"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Initial Test\n",
      "Total regret:  2.26073 Average regret per bidder:  0.75358  Optimal Revenue:  6.870  payment:  1.307\n",
      "Batch:  4\n",
      "Total regret:  0.00897 Average regret per bidder:  0.00299  Optimal Revenue:  4.478  payment:  4.928\n",
      "Batch:  8\n",
      "Total regret:  0.00419 Average regret per bidder:  0.00140  Optimal Revenue:  4.603  payment:  4.904\n",
      "Batch:  12\n",
      "Total regret:  0.00528 Average regret per bidder:  0.00176  Optimal Revenue:  4.565  payment:  4.904\n",
      "Batch:  16\n",
      "Total regret:  0.00541 Average regret per bidder:  0.00180  Optimal Revenue:  4.603  payment:  4.948\n",
      "Batch:  20\n",
      "Total regret:  0.00316 Average regret per bidder:  0.00105  Optimal Revenue:  4.698  payment:  4.959\n",
      "Batch:  24\n",
      "Total regret:  0.00282 Average regret per bidder:  0.00094  Optimal Revenue:  4.698  payment:  4.943\n",
      "Batch:  28\n",
      "Total regret:  0.00359 Average regret per bidder:  0.00120  Optimal Revenue:  4.905  payment:  5.190\n",
      "Batch:  32\n",
      "Total regret:  0.00629 Average regret per bidder:  0.00210  Optimal Revenue:  4.907  payment:  5.293\n",
      "Batch:  36\n",
      "Total regret:  0.00742 Average regret per bidder:  0.00247  Optimal Revenue:  4.616  payment:  5.027\n",
      "Batch:  40\n",
      "Total regret:  0.00686 Average regret per bidder:  0.00229  Optimal Revenue:  4.832  payment:  5.234\n",
      "Batch:  44\n",
      "Total regret:  0.00467 Average regret per bidder:  0.00156  Optimal Revenue:  4.985  payment:  5.316\n",
      "Batch:  48\n",
      "Total regret:  0.00421 Average regret per bidder:  0.00140  Optimal Revenue:  5.160  payment:  5.478\n",
      "Batch:  52\n",
      "Total regret:  0.00526 Average regret per bidder:  0.00175  Optimal Revenue:  5.046  payment:  5.401\n",
      "Batch:  56\n",
      "Total regret:  0.01147 Average regret per bidder:  0.00382  Optimal Revenue:  5.069  payment:  5.617\n",
      "Batch:  60\n",
      "Total regret:  0.00481 Average regret per bidder:  0.00160  Optimal Revenue:  5.174  payment:  5.517\n",
      "Batch:  64\n",
      "Total regret:  0.00595 Average regret per bidder:  0.00198  Optimal Revenue:  4.956  payment:  5.333\n",
      "Batch:  68\n",
      "Total regret:  0.00995 Average regret per bidder:  0.00332  Optimal Revenue:  5.163  payment:  5.674\n",
      "Batch:  72\n",
      "Total regret:  0.00728 Average regret per bidder:  0.00243  Optimal Revenue:  5.066  payment:  5.491\n",
      "Batch:  76\n",
      "Total regret:  0.00708 Average regret per bidder:  0.00236  Optimal Revenue:  5.091  payment:  5.511\n",
      "Batch:  80\n",
      "Total regret:  0.00530 Average regret per bidder:  0.00177  Optimal Revenue:  5.201  payment:  5.563\n",
      "\n"
     ]
    }
   ],
   "source": [
    "duration   = 0\n",
    "R          = 100\n",
    "\n",
    "i=0\n",
    "\n",
    "print(\"Initial Test\")\n",
    "test(50, nbrInit=300, R=300, gamma=0.001, minimum=0, maximum=1)\n",
    "\n",
    "for t in range(1,80*nbrBatches+1):\n",
    "    \n",
    "    # Reinitialize Misreport network periodically at the beginning of training\n",
    "    if (t%(4*nbrBatches) ==1):\n",
    "      if   t< 20*nbrBatches+2 :\n",
    "    \n",
    "        misreport            = Misreports(nAgent,nObject,nLayersMisreport, widthMisreport).to(device)\n",
    "        optimizerMisreport   = AdamW(misreport.parameters(), lr=0.001)\n",
    "\n",
    "    batchTrueValuations = torch.tensor(np.random.rand(batchSize,nAgent,nObject)).float().to(device)\n",
    "    \n",
    "    # Optimize Misreport Network for R steps\n",
    "    for k in range(R):\n",
    "  \n",
    "        misreports          = misreport(batchTrueValuations).unsqueeze(1)\n",
    "        mUtility            = misreportUtility(mechanism,batchTrueValuations,misreports).squeeze(1)\n",
    "        mLoss               = torch.sum(torch.mean(-mUtility,dim=0))\n",
    "\n",
    "        optimizerMisreport.zero_grad()\n",
    "        mLoss.backward()\n",
    "        optimizerMisreport.step()\n",
    "\n",
    "    \n",
    "    # Optimize Mechanism network for one step\n",
    "    misreports          = misreport(batchTrueValuations).unsqueeze(1)\n",
    "    mUtility            = misreportUtility(mechanism,batchTrueValuations,misreports).squeeze(1)\n",
    "\n",
    "    allocation, payment = mechanism(batchTrueValuations)\n",
    "\n",
    "    regret     = F.relu(mUtility -utility(batchTrueValuations, allocation, payment))\n",
    "    l,rMean,p = loss(payment, regret)\n",
    "        \n",
    "    optimizerMechanism.zero_grad()\n",
    "\n",
    "    l.backward()\n",
    "\n",
    "    optimizerMechanism.step()\n",
    "    \n",
    "    # Test mechanism periodically\n",
    "    if t % (4*nbrBatches)==0 :\n",
    "        print(\"Batch: \", 2*int(t/(2*nbrBatches)))\n",
    "        testTime.append(duration)\n",
    "        testIteration.append(t/nbrBatches)\n",
    "        test(50, nbrInit=300, R=300, gamma=0.001, minimum=0, maximum=1)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Testing"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Total regret:  0.00611 Average regret per bidder:  0.00204  Optimal Revenue:  5.194  payment:  5.586\n",
      "Total regret:  0.00570 Average regret per bidder:  0.00190  Optimal Revenue:  5.190  payment:  5.566\n",
      "Total regret:  0.00497 Average regret per bidder:  0.00166  Optimal Revenue:  5.315  payment:  5.669\n",
      "Total regret:  0.00585 Average regret per bidder:  0.00195  Optimal Revenue:  5.179  payment:  5.560\n",
      "Total regret:  0.00622 Average regret per bidder:  0.00207  Optimal Revenue:  5.118  payment:  5.510\n",
      "Total regret:  0.00661 Average regret per bidder:  0.00220  Optimal Revenue:  5.164  payment:  5.571\n",
      "Total regret:  0.00533 Average regret per bidder:  0.00178  Optimal Revenue:  5.257  payment:  5.622\n",
      "Total regret:  0.00595 Average regret per bidder:  0.00198  Optimal Revenue:  5.212  payment:  5.598\n",
      "Total regret:  0.00582 Average regret per bidder:  0.00194  Optimal Revenue:  5.210  payment:  5.592\n",
      "Total regret:  0.00587 Average regret per bidder:  0.00196  Optimal Revenue:  5.224  payment:  5.607\n",
      "Total regret:  0.00570 Average regret per bidder:  0.00190  Optimal Revenue:  5.194  payment:  5.571\n",
      "Total regret:  0.00609 Average regret per bidder:  0.00203  Optimal Revenue:  5.216  payment:  5.607\n",
      "Total regret:  0.00589 Average regret per bidder:  0.00196  Optimal Revenue:  5.204  payment:  5.588\n",
      "Total regret:  0.00675 Average regret per bidder:  0.00225  Optimal Revenue:  5.152  payment:  5.563\n",
      "Total regret:  0.00509 Average regret per bidder:  0.00170  Optimal Revenue:  5.253  payment:  5.609\n",
      "Total regret:  0.00584 Average regret per bidder:  0.00195  Optimal Revenue:  5.204  payment:  5.586\n",
      "Total regret:  0.00616 Average regret per bidder:  0.00205  Optimal Revenue:  5.127  payment:  5.518\n",
      "Total regret:  0.00697 Average regret per bidder:  0.00232  Optimal Revenue:  5.111  payment:  5.528\n",
      "Total regret:  0.00507 Average regret per bidder:  0.00169  Optimal Revenue:  5.302  payment:  5.659\n",
      "Total regret:  0.00653 Average regret per bidder:  0.00218  Optimal Revenue:  5.133  payment:  5.537\n",
      "Total regret:  0.00525 Average regret per bidder:  0.00175  Optimal Revenue:  5.237  payment:  5.599\n",
      "Total regret:  0.00645 Average regret per bidder:  0.00215  Optimal Revenue:  5.114  payment:  5.513\n",
      "Total regret:  0.00594 Average regret per bidder:  0.00198  Optimal Revenue:  5.208  payment:  5.593\n",
      "Total regret:  0.00512 Average regret per bidder:  0.00171  Optimal Revenue:  5.279  payment:  5.638\n",
      "Total regret:  0.00658 Average regret per bidder:  0.00219  Optimal Revenue:  5.139  payment:  5.545\n",
      "Total regret:  0.00601 Average regret per bidder:  0.00200  Optimal Revenue:  5.218  payment:  5.606\n",
      "Total regret:  0.00554 Average regret per bidder:  0.00185  Optimal Revenue:  5.186  payment:  5.557\n",
      "Total regret:  0.00590 Average regret per bidder:  0.00197  Optimal Revenue:  5.263  payment:  5.649\n",
      "Total regret:  0.00620 Average regret per bidder:  0.00207  Optimal Revenue:  5.215  payment:  5.610\n",
      "Total regret:  0.00542 Average regret per bidder:  0.00181  Optimal Revenue:  5.227  payment:  5.595\n",
      "Total regret:  0.00697 Average regret per bidder:  0.00232  Optimal Revenue:  5.168  payment:  5.588\n",
      "Total regret:  0.00725 Average regret per bidder:  0.00242  Optimal Revenue:  5.139  payment:  5.567\n",
      "Total regret:  0.00543 Average regret per bidder:  0.00181  Optimal Revenue:  5.198  payment:  5.566\n",
      "Total regret:  0.00614 Average regret per bidder:  0.00205  Optimal Revenue:  5.212  payment:  5.605\n",
      "Total regret:  0.00606 Average regret per bidder:  0.00202  Optimal Revenue:  5.186  payment:  5.575\n",
      "Total regret:  0.00534 Average regret per bidder:  0.00178  Optimal Revenue:  5.272  payment:  5.639\n",
      "Total regret:  0.00651 Average regret per bidder:  0.00217  Optimal Revenue:  5.170  payment:  5.574\n",
      "Total regret:  0.00591 Average regret per bidder:  0.00197  Optimal Revenue:  5.205  payment:  5.590\n",
      "Total regret:  0.00624 Average regret per bidder:  0.00208  Optimal Revenue:  5.187  payment:  5.582\n",
      "Total regret:  0.00539 Average regret per bidder:  0.00180  Optimal Revenue:  5.248  payment:  5.615\n",
      "Total regret:  0.00641 Average regret per bidder:  0.00214  Optimal Revenue:  5.166  payment:  5.566\n",
      "Total regret:  0.00537 Average regret per bidder:  0.00179  Optimal Revenue:  5.231  payment:  5.597\n",
      "Total regret:  0.00577 Average regret per bidder:  0.00192  Optimal Revenue:  5.206  payment:  5.586\n",
      "Total regret:  0.00558 Average regret per bidder:  0.00186  Optimal Revenue:  5.187  payment:  5.559\n",
      "Total regret:  0.00679 Average regret per bidder:  0.00226  Optimal Revenue:  5.175  payment:  5.588\n",
      "Total regret:  0.00590 Average regret per bidder:  0.00197  Optimal Revenue:  5.126  payment:  5.507\n",
      "Total regret:  0.00534 Average regret per bidder:  0.00178  Optimal Revenue:  5.291  payment:  5.658\n",
      "Total regret:  0.00542 Average regret per bidder:  0.00181  Optimal Revenue:  5.177  payment:  5.543\n",
      "Total regret:  0.00704 Average regret per bidder:  0.00235  Optimal Revenue:  5.144  payment:  5.565\n",
      "Total regret:  0.00547 Average regret per bidder:  0.00182  Optimal Revenue:  5.177  payment:  5.545\n"
     ]
    }
   ],
   "source": [
    "for i in range(50):\n",
    "  test(200, nbrInit=300, R=300, gamma=0.001, minimum=0, maximum=1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Final Result\n",
      "Total Regret =  0.00595 Average regret per bidder:  0.00198  Optimal Revenue:  5.225  payment:  5.583\n"
     ]
    }
   ],
   "source": [
    "totalregret = np.mean(np.array(testRegret[-50:]))\n",
    "revenue     = np.mean(np.array(testPayment[-50:]))\n",
    "print(\"Final Result\")\n",
    "print(\"Total Regret = \", '{0:.5f}'.format(totalregret), \"Average regret per bidder: \",'{0:.5f}'.format(totalregret/nAgent), \" Optimal Revenue: \",'{0:.3f}'.format(float(np.sqrt(revenue)-np.sqrt(totalregret))**2), \" payment: \",'{0:.3f}'.format(revenue))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "std Regret =  0.00056 std regret per bidder:  0.00019  std payment:  0.038\n"
     ]
    }
   ],
   "source": [
    "stdregret = np.std(np.array(testRegret[-50:]))\n",
    "stdrevenue= np.std(np.array(testPayment[-50:]))\n",
    "print(\"std Regret = \", '{0:.5f}'.format(stdregret), \"std regret per bidder: \",'{0:.5f}'.format(stdregret/nAgent), \" std payment: \",'{0:.3f}'.format(stdrevenue))"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
