{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Code was run on Colab"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import math\n",
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n",
    "import numpy as np\n",
    "import collections\n",
    "import torch.optim as optim\n",
    "from torch.optim import Optimizer\n",
    "import time\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "from AdamW          import AdamW\n",
    "from utils          import utility, misreportUtility, misreportOptimization, trueUtility, loss\n",
    "from networks       import AdditiveMechanism, Misreports\n",
    "from restrictedAdam import Adam "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "device = 'cuda' if torch.cuda.is_available() else 'cpu'"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Set Random Seed "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Initializing seeds\n",
    "torch.manual_seed(42)\n",
    "np.random.seed(42)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Testing Function\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "def test(nBatch, nbrInit, R, gamma=0.001, minimum=0, maximum=1):\n",
    "    \n",
    "    \"\"\" This function computes the regret and payment of mechanism on a test set of size nBatch\n",
    "        The optimal misreport is computed by optimizing the utility function (not by using the Misreport network)\n",
    "        for R gradient steps (of stepsize gamma) and starting from nbrInit initialization, we only keep the best misreport\n",
    "        To compute the regret we evaluate the mechanism at the misreport and compare to the valuation\n",
    "        minimum and maximum indicate the range of the valuations\n",
    "    \"\"\"\n",
    "    \n",
    "    true = np.random.rand(nBatch,nAgent,nObject)\n",
    "\n",
    "    localMisreports     = np.random.rand(nBatch,nbrInit,nAgent,nObject)\n",
    "    batchMisreports     = torch.tensor(localMisreports).float().to(device)\n",
    "    batchTrueValuations = torch.tensor(true).float().to(device)\n",
    "    batchMisreports.requires_grad = True\n",
    "    \n",
    "    opt = Adam([batchMisreports], lr=gamma)\n",
    "    \n",
    "    for k in range(R):\n",
    "        advU         = misreportUtility(mechanism,batchTrueValuations,batchMisreports)\n",
    "        los          =  -1*torch.mean(advU).to(device)\n",
    "        los.backward()\n",
    "        opt.step(restricted= True, min=minimum, max=maximum)\n",
    "        opt.zero_grad()\n",
    "    \n",
    "    misReportUtilityMax  = torch.max(advU, dim =1)[0]\n",
    "    mechanism.zero_grad()\n",
    "    allocation, payment = mechanism(batchTrueValuations)\n",
    "    regret = F.relu(misReportUtilityMax -utility(batchTrueValuations, allocation, payment))\n",
    "    mregret= torch.sum(torch.mean(regret, dim=0)).to(device)\n",
    "    mregret= float(mregret.cpu().detach().numpy())\n",
    "\n",
    "    with torch.no_grad():\n",
    "        l,rMean,p = loss(payment, regret)\n",
    "\n",
    "    testRegret.append(mregret)\n",
    "    testPayment.append(float(p.detach().cpu().numpy() ))\n",
    "    testOptimal.append(float((-l).detach().cpu().numpy())**2)\n",
    "    \n",
    "    print(\"Total regret: \",'{0:.5f}'.format(mregret), \"Average regret per bidder: \",'{0:.5f}'.format(mregret/nAgent), \" Optimal Revenue: \",'{0:.3f}'.format(float((-l).detach().cpu().numpy())**2), \" payment: \",'{0:.3f}'.format(float(p.detach().cpu().numpy() )))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Initializing Networks"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "nAgent   = 1\n",
    "nObject  = 10\n",
    "\n",
    "# Parameters for the mechanism (payment and allocation network)\n",
    "nLayersAllocation   = 4\n",
    "nLayersPayment      = 4\n",
    "widthAllocation     = 100\n",
    "widthPayment        = 100\n",
    "\n",
    "# Parameters for the misreport network\n",
    "nLayersMisreport    = 4\n",
    "widthMisreport      = 100\n",
    "\n",
    "gamma              = 0.001 \n",
    "testBatch          = 10000\n",
    "\n",
    "nExperiments       = 100000\n",
    "batchSize          = 500\n",
    "nbrBatches         = int(nExperiments/batchSize)\n",
    "\n",
    "\n",
    "mechanism            = AdditiveMechanism(nAgent, nObject, nLayersAllocation, widthAllocation).to(device)\n",
    "optimizerMechanism   = AdamW(mechanism.parameters(), lr=0.0005)\n",
    "\n",
    "misreport            = Misreports(nAgent,nObject,nLayersMisreport, widthMisreport).to(device)\n",
    "optimizerMisreport   = AdamW(misreport.parameters(), lr=0.0005)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "testRegret    = []\n",
    "testMaxRegret = []\n",
    "testPayment   = []\n",
    "testOptimal   = []\n",
    "testTime      = []\n",
    "testIteration = [0]\n",
    "\n",
    "# range of valuations\n",
    "minimum            = 0\n",
    "maximum            = 1"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Training"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Initial Test\n",
      "Total regret:  0.20760 Average regret per bidder:  0.20760  Optimal Revenue:  0.073  payment:  0.155\n",
      "Batch:  4\n",
      "Total regret:  0.00184 Average regret per bidder:  0.00184  Optimal Revenue:  0.499  payment:  0.565\n",
      "Batch:  8\n",
      "Total regret:  0.00039 Average regret per bidder:  0.00039  Optimal Revenue:  0.561  payment:  0.592\n",
      "Batch:  12\n",
      "Total regret:  0.00113 Average regret per bidder:  0.00113  Optimal Revenue:  0.422  payment:  0.468\n",
      "Batch:  16\n",
      "Total regret:  0.00069 Average regret per bidder:  0.00069  Optimal Revenue:  0.504  payment:  0.543\n",
      "Batch:  20\n",
      "Total regret:  0.00036 Average regret per bidder:  0.00036  Optimal Revenue:  0.515  payment:  0.543\n",
      "Batch:  24\n",
      "Total regret:  0.00070 Average regret per bidder:  0.00070  Optimal Revenue:  0.524  payment:  0.565\n",
      "Batch:  28\n",
      "Total regret:  0.00016 Average regret per bidder:  0.00016  Optimal Revenue:  0.522  payment:  0.541\n",
      "Batch:  32\n",
      "Total regret:  0.00050 Average regret per bidder:  0.00050  Optimal Revenue:  0.465  payment:  0.497\n",
      "Batch:  36\n",
      "Total regret:  0.00008 Average regret per bidder:  0.00008  Optimal Revenue:  0.527  payment:  0.540\n",
      "Batch:  40\n",
      "Total regret:  0.00013 Average regret per bidder:  0.00013  Optimal Revenue:  0.484  payment:  0.501\n",
      "Batch:  44\n",
      "Total regret:  0.00052 Average regret per bidder:  0.00052  Optimal Revenue:  0.548  payment:  0.583\n",
      "Batch:  48\n",
      "Total regret:  0.00011 Average regret per bidder:  0.00011  Optimal Revenue:  0.518  payment:  0.534\n",
      "Batch:  52\n",
      "Total regret:  0.00015 Average regret per bidder:  0.00015  Optimal Revenue:  0.617  payment:  0.636\n",
      "Batch:  56\n",
      "Total regret:  0.00042 Average regret per bidder:  0.00042  Optimal Revenue:  0.557  payment:  0.589\n",
      "Batch:  60\n",
      "Total regret:  0.00056 Average regret per bidder:  0.00056  Optimal Revenue:  0.531  payment:  0.567\n"
     ]
    }
   ],
   "source": [
    "duration   = 0\n",
    "R          = 100\n",
    "\n",
    "i=0\n",
    "\n",
    "print(\"Initial Test\")\n",
    "test(50, nbrInit=300, R=300, gamma=0.001, minimum=0, maximum=1)\n",
    "\n",
    "for t in range(1,60*nbrBatches+1):\n",
    "    \n",
    "    # Reinitialize Misreport network periodically at the beginning of training\n",
    "    if (t%(4*nbrBatches) ==1):\n",
    "      if   t< 20*nbrBatches+2 :\n",
    "    \n",
    "        misreport            = Misreports(nAgent,nObject,nLayersMisreport, widthMisreport).to(device)\n",
    "        optimizerMisreport   = AdamW(misreport.parameters(), lr=0.0005)\n",
    "\n",
    "    batchTrueValuations = torch.tensor(np.random.rand(batchSize,nAgent,nObject)).float().to(device)\n",
    "    \n",
    "    # Optimize Misreport Network for R steps\n",
    "    for k in range(R):\n",
    "  \n",
    "        misreports          = misreport(batchTrueValuations).unsqueeze(1)\n",
    "        mUtility            = misreportUtility(mechanism,batchTrueValuations,misreports).squeeze(1)\n",
    "        mLoss               = torch.sum(torch.mean(-mUtility,dim=0))\n",
    "\n",
    "        optimizerMisreport.zero_grad()\n",
    "        mLoss.backward()\n",
    "        optimizerMisreport.step()\n",
    "\n",
    "    \n",
    "    # Optimize Mechanism network for one step\n",
    "    misreports          = misreport(batchTrueValuations).unsqueeze(1)\n",
    "    mUtility            = misreportUtility(mechanism,batchTrueValuations,misreports).squeeze(1)\n",
    "\n",
    "    allocation, payment = mechanism(batchTrueValuations)\n",
    "\n",
    "    regret     = F.relu(mUtility -utility(batchTrueValuations, allocation, payment))\n",
    "    l,rMean,p = loss(payment, regret)\n",
    "        \n",
    "    optimizerMechanism.zero_grad()\n",
    "\n",
    "    l.backward()\n",
    "\n",
    "    optimizerMechanism.step()\n",
    "    \n",
    "    # Test mechanism periodically\n",
    "    if t % (4*nbrBatches)==0 :\n",
    "        print(\"Batch: \", 2*int(t/(2*nbrBatches)))\n",
    "        testTime.append(duration)\n",
    "        testIteration.append(t/nbrBatches)\n",
    "        test(100, nbrInit=300, R=300, gamma=0.001, minimum=0, maximum=1)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Testing"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Total regret:  0.00054 Average regret per bidder:  0.00054  Optimal Revenue:  0.531  payment:  0.566\n",
      "Total regret:  0.00054 Average regret per bidder:  0.00054  Optimal Revenue:  0.527  payment:  0.562\n",
      "Total regret:  0.00056 Average regret per bidder:  0.00056  Optimal Revenue:  0.518  payment:  0.554\n",
      "Total regret:  0.00056 Average regret per bidder:  0.00056  Optimal Revenue:  0.513  payment:  0.548\n",
      "Total regret:  0.00056 Average regret per bidder:  0.00056  Optimal Revenue:  0.534  payment:  0.571\n",
      "Total regret:  0.00056 Average regret per bidder:  0.00056  Optimal Revenue:  0.536  payment:  0.572\n",
      "Total regret:  0.00056 Average regret per bidder:  0.00056  Optimal Revenue:  0.512  payment:  0.547\n",
      "Total regret:  0.00054 Average regret per bidder:  0.00054  Optimal Revenue:  0.508  payment:  0.543\n",
      "Total regret:  0.00053 Average regret per bidder:  0.00053  Optimal Revenue:  0.504  payment:  0.538\n",
      "Total regret:  0.00056 Average regret per bidder:  0.00056  Optimal Revenue:  0.520  payment:  0.555\n"
     ]
    }
   ],
   "source": [
    "for i in range(10):\n",
    "  test(1000, nbrInit=300, R=300, gamma=0.001, minimum=0, maximum=1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Final Result\n",
      "Total Regret =  0.00055 Average regret per bidder:  0.00055  Optimal Revenue:  0.521  payment:  0.556\n"
     ]
    }
   ],
   "source": [
    "totalregret = np.mean(np.array(testRegret[-10:]))\n",
    "revenue     = np.mean(np.array(testPayment[-10:]))\n",
    "print(\"Final Result\")\n",
    "print(\"Total Regret = \", '{0:.5f}'.format(totalregret), \"Average regret per bidder: \",'{0:.5f}'.format(totalregret/nAgent), \" Optimal Revenue: \",'{0:.3f}'.format(float(np.sqrt(revenue)-np.sqrt(totalregret))**2), \" payment: \",'{0:.3f}'.format(revenue))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "std Regret =  0.00001 std regret per bidder:  0.00001  std payment:  0.011\n"
     ]
    }
   ],
   "source": [
    "stdregret = np.std(np.array(testRegret[-10:]))\n",
    "stdrevenue= np.std(np.array(testPayment[-10:]))\n",
    "print(\"std Regret = \", '{0:.5f}'.format(stdregret), \"std regret per bidder: \",'{0:.5f}'.format(stdregret/nAgent), \" std payment: \",'{0:.3f}'.format(stdrevenue))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
