{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "True\n",
      "cuda\n",
      "Files already downloaded and verified\n",
      "Files already downloaded and verified\n"
     ]
    }
   ],
   "source": [
    "# Import basic libraries\n",
    "import numpy as np # linear algebra\n",
    "import pandas as pd # data processing, CSV file I/O (e.g. pd.read_csv)\n",
    "from collections import OrderedDict\n",
    "\n",
    "# Import PyTorch\n",
    "import torch # import main library\n",
    "from torch.autograd import Variable\n",
    "import torch.nn as nn # import modules\n",
    "from torch.autograd import Function # import Function to create custom activations\n",
    "from torch.nn.parameter import Parameter # import Parameter to create custom activations with learnable parameters\n",
    "from torch import optim # import optimizers for demonstrations\n",
    "import torch.nn.functional as F # import torch functions\n",
    "from torchvision import datasets, transforms # import transformations to use for demo\n",
    "from torch.nn.parameter import Parameter # import Parameter to create custom activations with learnable parameters\n",
    "\n",
    "from models.activ_func import *\n",
    "from models.Nets import *\n",
    "from models.test import test_img\n",
    "from models.Update import *\n",
    "\n",
    "from utils.sampling import mnist_iid, mnist_noniid, cifar_iid\n",
    "from utils.options import args_parser\n",
    "\n",
    "import torchvision\n",
    "\n",
    "%load_ext autoreload\n",
    "%autoreload 2\n",
    "\n",
    "class my_argument:    \n",
    "    epochs    = 16    #\"rounds of training\"\n",
    "    num_users = 1  # \"number of users: K\"\n",
    "    frac      = 0.5 #\"the fraction of clients: C\"\n",
    "    local_ep  = 1 #\"the number of local epochs: E\"\n",
    "    local_bs  = 128  #\"local batch size: B\"\n",
    "    bs        = 128 #\"test batch size\"\n",
    "    lr        = 0.1 #\"learning rate\"\n",
    "    momentum  = 0.5 # \"SGD momentum (default: 0.5)\"\n",
    "    split     = 'user' # \"train-test split type, user or sample\"\n",
    "\n",
    "    # model arguments\n",
    "    model = 'cnn'\n",
    "    kernel_num=9 #, help='number of each kind of kernel')\n",
    "    kernel_sizes='3,4,5' #  help='comma-separated kernel size to use for convolution')\n",
    "    norm='batch_norm' #, help=\"batch_norm, layer_norm, or None\")\n",
    "    num_filters=32 #, help=\"number of filters for conv nets\")\n",
    "    max_pool='True' #help=\"Whether use max pooling rather than strided convolutions\")\n",
    "\n",
    "    # other arguments\n",
    "    dataset='cifar' #, help=\"name of dataset\")\n",
    "    iid=1\n",
    "    num_classes=10#, help=\"number of classes\")\n",
    "    num_channels=1#, help=\"number of channels of imges\")\n",
    "    gpu=1#, help=\"GPU ID, -1 for CPU\")\n",
    "    stopping_rounds=10#, help='rounds of early stopping')\n",
    "    verbose='False'#, help='verbose print')\n",
    "    seed=1#, help='random seed (default: 1)')\n",
    "    \n",
    "args = my_argument()\n",
    "\n",
    "args.device = torch.device('cuda:{}'.format(args.gpu) if torch.cuda.is_available() and args.gpu != -1 else 'cpu')\n",
    "\n",
    "use_cuda = torch.cuda.is_available()\n",
    "print(use_cuda)\n",
    "args.device = torch.device(\"cuda\" if use_cuda else \"cpu\")\n",
    "print(args.device)\n",
    "\n",
    "transform_train = transforms.Compose([\n",
    "    transforms.RandomCrop(32, padding=4),\n",
    "    transforms.RandomHorizontalFlip(),\n",
    "    transforms.ToTensor(),\n",
    "    transforms.Normalize((0.4914, 0.4822, 0.4465), (0.2023, 0.1994, 0.2010)),\n",
    "])\n",
    "\n",
    "# Normalize the test set same as training set without augmentation\n",
    "transform_test = transforms.Compose([\n",
    "    transforms.ToTensor(),\n",
    "    transforms.Normalize((0.4914, 0.4822, 0.4465), (0.2023, 0.1994, 0.2010)),\n",
    "])\n",
    "\n",
    "trainset = torchvision.datasets.CIFAR10(\n",
    "    root=\"./data/cifar\", train=True, download=True, transform=transform_train)\n",
    "trainloader = torch.utils.data.DataLoader(\n",
    "    trainset, batch_size=args.bs, shuffle=True, num_workers=2)\n",
    "\n",
    "testset = torchvision.datasets.CIFAR10(\n",
    "    root=\"./data/cifar\", train=False, download=True, transform=transform_test)\n",
    "testloader = torch.utils.data.DataLoader(\n",
    "    testset, batch_size=args.bs, shuffle=False, num_workers=2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "def validation(model, testloader, criterion):\n",
    "    test_loss = 0\n",
    "    accuracy = 0\n",
    "    for images, labels in testloader:\n",
    "\n",
    "#         images.resize_(images.shape[0], 3*32*32)\n",
    "\n",
    "        images = images.cuda()\n",
    "        labels = labels.cuda()\n",
    "\n",
    "        output = model.forward(images)\n",
    "        test_loss += criterion(output, labels).item()\n",
    "\n",
    "        ps = torch.exp(output)\n",
    "        equality = (labels.data == ps.max(dim=1)[1])\n",
    "        accuracy += equality.type(torch.FloatTensor).mean()\n",
    "\n",
    "    return test_loss, accuracy"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "VGG(\n",
       "  (features): Sequential(\n",
       "    (0): Conv2d(3, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
       "    (1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (2): ReLU(inplace=True)\n",
       "    (3): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (4): Conv2d(64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
       "    (5): BatchNorm2d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (6): ReLU(inplace=True)\n",
       "    (7): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (8): Conv2d(128, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
       "    (9): BatchNorm2d(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (10): ReLU(inplace=True)\n",
       "    (11): Conv2d(256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
       "    (12): BatchNorm2d(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (13): ReLU(inplace=True)\n",
       "    (14): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (15): Conv2d(256, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
       "    (16): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (17): ReLU(inplace=True)\n",
       "    (18): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
       "    (19): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (20): ReLU(inplace=True)\n",
       "    (21): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (22): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
       "    (23): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (24): ReLU(inplace=True)\n",
       "    (25): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
       "    (26): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (27): ReLU(inplace=True)\n",
       "    (28): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (29): AvgPool2d(kernel_size=1, stride=1, padding=0)\n",
       "  )\n",
       "  (classifier): Linear(in_features=512, out_features=10, bias=True)\n",
       ")"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from torch.nn import Module\n",
    "import torch.nn.functional as F\n",
    "import brevitas.nn as qnn\n",
    "from brevitas.core.quant import QuantType\n",
    "\n",
    "\n",
    "from models.vgg import *\n",
    "\n",
    "import math\n",
    "\n",
    "                    \n",
    "net = VGG('VGG11')\n",
    "net.cuda()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 tensor(2.2992, device='cuda:0')\n",
      "100 tensor(1.5402, device='cuda:0')\n",
      "200 tensor(1.4077, device='cuda:0')\n",
      "300 tensor(1.4371, device='cuda:0')\n",
      "Iteration: 1 | Loss: 1.5121257305145264 | Train,Test accuracy: 0.5327685475349426.3f%, 0.539655864238739.3f%\n",
      "0 tensor(1.3398, device='cuda:0')\n",
      "100 tensor(1.2915, device='cuda:0')\n",
      "200 tensor(0.9962, device='cuda:0')\n",
      "300 tensor(0.9332, device='cuda:0')\n",
      "Iteration: 2 | Loss: 1.0909663438796997 | Train,Test accuracy: 0.6628236770629883.3f%, 0.6563488841056824.3f%\n",
      "0 tensor(0.9677, device='cuda:0')\n",
      "100 tensor(0.9513, device='cuda:0')\n",
      "200 tensor(1.0188, device='cuda:0')\n",
      "300 tensor(0.9661, device='cuda:0')\n",
      "Iteration: 3 | Loss: 0.9079623818397522 | Train,Test accuracy: 0.7054027915000916.3f%, 0.7023338675498962.3f%\n",
      "0 tensor(0.8110, device='cuda:0')\n",
      "100 tensor(0.7948, device='cuda:0')\n",
      "200 tensor(0.9047, device='cuda:0')\n",
      "300 tensor(0.7853, device='cuda:0')\n",
      "Iteration: 4 | Loss: 0.8063987493515015 | Train,Test accuracy: 0.7525854706764221.3f%, 0.7200356125831604.3f%\n",
      "0 tensor(0.6756, device='cuda:0')\n",
      "100 tensor(0.8497, device='cuda:0')\n",
      "200 tensor(0.7904, device='cuda:0')\n",
      "300 tensor(0.7509, device='cuda:0')\n",
      "Iteration: 5 | Loss: 0.7354734539985657 | Train,Test accuracy: 0.7561940550804138.3f%, 0.7270569801330566.3f%\n",
      "0 tensor(0.6462, device='cuda:0')\n",
      "100 tensor(0.7655, device='cuda:0')\n",
      "200 tensor(0.6761, device='cuda:0')\n",
      "300 tensor(0.5312, device='cuda:0')\n",
      "Iteration: 6 | Loss: 0.6722784638404846 | Train,Test accuracy: 0.7854699492454529.3f%, 0.7639438509941101.3f%\n",
      "0 tensor(0.6648, device='cuda:0')\n",
      "100 tensor(0.6320, device='cuda:0')\n",
      "200 tensor(0.5943, device='cuda:0')\n",
      "300 tensor(0.6116, device='cuda:0')\n",
      "Iteration: 7 | Loss: 0.6328436732292175 | Train,Test accuracy: 0.8056905269622803.3f%, 0.769679605960846.3f%\n",
      "0 tensor(0.6618, device='cuda:0')\n",
      "100 tensor(0.6718, device='cuda:0')\n",
      "200 tensor(0.6585, device='cuda:0')\n",
      "300 tensor(0.4659, device='cuda:0')\n",
      "Iteration: 8 | Loss: 0.5862708687782288 | Train,Test accuracy: 0.7991927862167358.3f%, 0.7767009735107422.3f%\n",
      "0 tensor(0.4362, device='cuda:0')\n",
      "100 tensor(0.4253, device='cuda:0')\n",
      "200 tensor(0.4104, device='cuda:0')\n",
      "300 tensor(0.4878, device='cuda:0')\n",
      "Iteration: 9 | Loss: 0.5485372543334961 | Train,Test accuracy: 0.820252537727356.3f%, 0.7914358973503113.3f%\n",
      "0 tensor(0.4913, device='cuda:0')\n",
      "100 tensor(0.5229, device='cuda:0')\n",
      "200 tensor(0.4957, device='cuda:0')\n",
      "300 tensor(0.4596, device='cuda:0')\n",
      "Iteration: 10 | Loss: 0.5220752358436584 | Train,Test accuracy: 0.8381713628768921.3f%, 0.7972705960273743.3f%\n",
      "0 tensor(0.5025, device='cuda:0')\n",
      "100 tensor(0.5107, device='cuda:0')\n",
      "200 tensor(0.4565, device='cuda:0')\n",
      "300 tensor(0.5828, device='cuda:0')\n",
      "Iteration: 11 | Loss: 0.4923417866230011 | Train,Test accuracy: 0.8431146144866943.3f%, 0.8079509735107422.3f%\n",
      "0 tensor(0.4546, device='cuda:0')\n",
      "100 tensor(0.5259, device='cuda:0')\n",
      "200 tensor(0.4835, device='cuda:0')\n",
      "300 tensor(0.5529, device='cuda:0')\n",
      "Iteration: 12 | Loss: 0.4670410454273224 | Train,Test accuracy: 0.8518861532211304.3f%, 0.8161590099334717.3f%\n",
      "0 tensor(0.4535, device='cuda:0')\n",
      "100 tensor(0.4149, device='cuda:0')\n",
      "200 tensor(0.6105, device='cuda:0')\n",
      "300 tensor(0.5231, device='cuda:0')\n",
      "Iteration: 13 | Loss: 0.45098116993904114 | Train,Test accuracy: 0.8660725355148315.3f%, 0.8167523741722107.3f%\n",
      "0 tensor(0.3410, device='cuda:0')\n",
      "100 tensor(0.4798, device='cuda:0')\n",
      "200 tensor(0.3543, device='cuda:0')\n",
      "300 tensor(0.4360, device='cuda:0')\n",
      "Iteration: 14 | Loss: 0.42977896332740784 | Train,Test accuracy: 0.8753436803817749.3f%, 0.8270371556282043.3f%\n",
      "0 tensor(0.3067, device='cuda:0')\n",
      "100 tensor(0.3639, device='cuda:0')\n",
      "200 tensor(0.3911, device='cuda:0')\n",
      "300 tensor(0.3637, device='cuda:0')\n",
      "Iteration: 15 | Loss: 0.411542147397995 | Train,Test accuracy: 0.869025707244873.3f%, 0.8195213675498962.3f%\n",
      "0 tensor(0.3467, device='cuda:0')\n",
      "100 tensor(0.3154, device='cuda:0')\n",
      "200 tensor(0.3088, device='cuda:0')\n",
      "300 tensor(0.4124, device='cuda:0')\n",
      "Iteration: 16 | Loss: 0.399280309677124 | Train,Test accuracy: 0.8739609718322754.3f%, 0.8173457384109497.3f%\n",
      "0 tensor(0.3695, device='cuda:0')\n",
      "100 tensor(0.3779, device='cuda:0')\n",
      "200 tensor(0.3828, device='cuda:0')\n",
      "300 tensor(0.4527, device='cuda:0')\n",
      "Iteration: 17 | Loss: 0.38777101039886475 | Train,Test accuracy: 0.8814658522605896.3f%, 0.8070608973503113.3f%\n",
      "0 tensor(0.2499, device='cuda:0')\n",
      "100 tensor(0.3030, device='cuda:0')\n",
      "200 tensor(0.3650, device='cuda:0')\n",
      "300 tensor(0.4423, device='cuda:0')\n",
      "Iteration: 18 | Loss: 0.37248170375823975 | Train,Test accuracy: 0.88213711977005.3f%, 0.8221914768218994.3f%\n",
      "0 tensor(0.3288, device='cuda:0')\n",
      "100 tensor(0.3968, device='cuda:0')\n",
      "200 tensor(0.4040, device='cuda:0')\n",
      "300 tensor(0.3409, device='cuda:0')\n",
      "Iteration: 19 | Loss: 0.3639894723892212 | Train,Test accuracy: 0.8872761726379395.3f%, 0.8289161324501038.3f%\n",
      "0 tensor(0.3357, device='cuda:0')\n",
      "100 tensor(0.3625, device='cuda:0')\n",
      "200 tensor(0.4388, device='cuda:0')\n",
      "300 tensor(0.3505, device='cuda:0')\n",
      "Iteration: 20 | Loss: 0.3479176461696625 | Train,Test accuracy: 0.88620924949646.3f%, 0.8322784900665283.3f%\n",
      "0 tensor(0.4087, device='cuda:0')\n",
      "100 tensor(0.3526, device='cuda:0')\n",
      "200 tensor(0.4105, device='cuda:0')\n",
      "300 tensor(0.3966, device='cuda:0')\n",
      "Iteration: 21 | Loss: 0.3466860353946686 | Train,Test accuracy: 0.8926351070404053.3f%, 0.8200158476829529.3f%\n",
      "0 tensor(0.2377, device='cuda:0')\n",
      "100 tensor(0.2532, device='cuda:0')\n",
      "200 tensor(0.2613, device='cuda:0')\n",
      "300 tensor(0.3838, device='cuda:0')\n",
      "Iteration: 22 | Loss: 0.33038443326950073 | Train,Test accuracy: 0.8984375.3f%, 0.8330696225166321.3f%\n",
      "0 tensor(0.3947, device='cuda:0')\n",
      "100 tensor(0.4392, device='cuda:0')\n",
      "200 tensor(0.2331, device='cuda:0')\n",
      "300 tensor(0.3013, device='cuda:0')\n",
      "Iteration: 23 | Loss: 0.32873979210853577 | Train,Test accuracy: 0.8968150615692139.3f%, 0.8400909900665283.3f%\n",
      "0 tensor(0.2694, device='cuda:0')\n",
      "100 tensor(0.2824, device='cuda:0')\n",
      "200 tensor(0.3519, device='cuda:0')\n",
      "300 tensor(0.3604, device='cuda:0')\n",
      "Iteration: 24 | Loss: 0.3172850012779236 | Train,Test accuracy: 0.9022378325462341.3f%, 0.8311906456947327.3f%\n",
      "0 tensor(0.2732, device='cuda:0')\n",
      "100 tensor(0.2055, device='cuda:0')\n",
      "200 tensor(0.3877, device='cuda:0')\n",
      "300 tensor(0.3568, device='cuda:0')\n",
      "Iteration: 25 | Loss: 0.3105263113975525 | Train,Test accuracy: 0.9055386781692505.3f%, 0.843156635761261.3f%\n",
      "0 tensor(0.2542, device='cuda:0')\n",
      "100 tensor(0.3016, device='cuda:0')\n",
      "200 tensor(0.3409, device='cuda:0')\n",
      "300 tensor(0.2859, device='cuda:0')\n",
      "Iteration: 26 | Loss: 0.30628883838653564 | Train,Test accuracy: 0.8992806673049927.3f%, 0.8343552350997925.3f%\n",
      "0 tensor(0.2686, device='cuda:0')\n",
      "100 tensor(0.2295, device='cuda:0')\n",
      "200 tensor(0.2811, device='cuda:0')\n",
      "300 tensor(0.2500, device='cuda:0')\n",
      "Iteration: 27 | Loss: 0.3001580238342285 | Train,Test accuracy: 0.9128316640853882.3f%, 0.8423655033111572.3f%\n",
      "0 tensor(0.2464, device='cuda:0')\n",
      "100 tensor(0.4108, device='cuda:0')\n",
      "200 tensor(0.3106, device='cuda:0')\n",
      "300 tensor(0.3271, device='cuda:0')\n",
      "Iteration: 28 | Loss: 0.29336726665496826 | Train,Test accuracy: 0.9126158952713013.3f%, 0.8392009735107422.3f%\n",
      "0 tensor(0.2204, device='cuda:0')\n",
      "100 tensor(0.3969, device='cuda:0')\n",
      "200 tensor(0.3046, device='cuda:0')\n",
      "300 tensor(0.2591, device='cuda:0')\n",
      "Iteration: 29 | Loss: 0.29042693972587585 | Train,Test accuracy: 0.913519024848938.3f%, 0.8403876423835754.3f%\n",
      "0 tensor(0.2318, device='cuda:0')\n",
      "100 tensor(0.3116, device='cuda:0')\n",
      "200 tensor(0.3019, device='cuda:0')\n",
      "300 tensor(0.2714, device='cuda:0')\n",
      "Iteration: 30 | Loss: 0.28849416971206665 | Train,Test accuracy: 0.9092791080474854.3f%, 0.8319817781448364.3f%\n",
      "0 tensor(0.1908, device='cuda:0')\n",
      "100 tensor(0.2985, device='cuda:0')\n",
      "200 tensor(0.2765, device='cuda:0')\n",
      "300 tensor(0.2632, device='cuda:0')\n",
      "Iteration: 31 | Loss: 0.284192830324173 | Train,Test accuracy: 0.9176989793777466.3f%, 0.841969907283783.3f%\n",
      "0 tensor(0.2345, device='cuda:0')\n",
      "100 tensor(0.3357, device='cuda:0')\n",
      "200 tensor(0.3092, device='cuda:0')\n",
      "300 tensor(0.2630, device='cuda:0')\n",
      "Iteration: 32 | Loss: 0.2734920084476471 | Train,Test accuracy: 0.9150775671005249.3f%, 0.8404865264892578.3f%\n",
      "0 tensor(0.1639, device='cuda:0')\n",
      "100 tensor(0.2216, device='cuda:0')\n",
      "200 tensor(0.2911, device='cuda:0')\n",
      "300 tensor(0.1931, device='cuda:0')\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 33 | Loss: 0.27162623405456543 | Train,Test accuracy: 0.916236400604248.3f%, 0.8418710231781006.3f%\n",
      "0 tensor(0.2962, device='cuda:0')\n",
      "100 tensor(0.2962, device='cuda:0')\n",
      "200 tensor(0.2168, device='cuda:0')\n",
      "300 tensor(0.2641, device='cuda:0')\n",
      "Iteration: 34 | Loss: 0.2727038562297821 | Train,Test accuracy: 0.9206002354621887.3f%, 0.839695394039154.3f%\n",
      "0 tensor(0.2335, device='cuda:0')\n",
      "100 tensor(0.3211, device='cuda:0')\n",
      "200 tensor(0.2772, device='cuda:0')\n",
      "300 tensor(0.3389, device='cuda:0')\n",
      "Iteration: 35 | Loss: 0.26466643810272217 | Train,Test accuracy: 0.9149256348609924.3f%, 0.842563271522522.3f%\n",
      "0 tensor(0.2769, device='cuda:0')\n",
      "100 tensor(0.2872, device='cuda:0')\n",
      "200 tensor(0.2951, device='cuda:0')\n",
      "300 tensor(0.3326, device='cuda:0')\n",
      "Iteration: 36 | Loss: 0.26590314507484436 | Train,Test accuracy: 0.9133711457252502.3f%, 0.8356408476829529.3f%\n",
      "0 tensor(0.2891, device='cuda:0')\n",
      "100 tensor(0.2151, device='cuda:0')\n",
      "200 tensor(0.2956, device='cuda:0')\n",
      "300 tensor(0.2479, device='cuda:0')\n",
      "Iteration: 37 | Loss: 0.25840556621551514 | Train,Test accuracy: 0.9140345454216003.3f%, 0.8337618708610535.3f%\n",
      "0 tensor(0.3004, device='cuda:0')\n",
      "100 tensor(0.2258, device='cuda:0')\n",
      "200 tensor(0.2799, device='cuda:0')\n",
      "300 tensor(0.3702, device='cuda:0')\n",
      "Iteration: 38 | Loss: 0.25231632590293884 | Train,Test accuracy: 0.9236932396888733.3f%, 0.8348496556282043.3f%\n",
      "0 tensor(0.2615, device='cuda:0')\n",
      "100 tensor(0.2571, device='cuda:0')\n",
      "200 tensor(0.2198, device='cuda:0')\n",
      "300 tensor(0.2994, device='cuda:0')\n",
      "Iteration: 39 | Loss: 0.2556169331073761 | Train,Test accuracy: 0.9224344491958618.3f%, 0.8458267450332642.3f%\n",
      "0 tensor(0.2194, device='cuda:0')\n",
      "100 tensor(0.2802, device='cuda:0')\n",
      "200 tensor(0.3152, device='cuda:0')\n",
      "300 tensor(0.2025, device='cuda:0')\n",
      "Iteration: 40 | Loss: 0.2519080638885498 | Train,Test accuracy: 0.9207121133804321.3f%, 0.8427610993385315.3f%\n",
      "0 tensor(0.4831, device='cuda:0')\n",
      "100 tensor(0.2341, device='cuda:0')\n",
      "200 tensor(0.2846, device='cuda:0')\n",
      "300 tensor(0.2265, device='cuda:0')\n",
      "Iteration: 41 | Loss: 0.24241864681243896 | Train,Test accuracy: 0.9242127537727356.3f%, 0.8394976258277893.3f%\n",
      "0 tensor(0.2144, device='cuda:0')\n",
      "100 tensor(0.2149, device='cuda:0')\n",
      "200 tensor(0.1634, device='cuda:0')\n",
      "300 tensor(0.2338, device='cuda:0')\n",
      "Iteration: 42 | Loss: 0.24648039042949677 | Train,Test accuracy: 0.9225543737411499.3f%, 0.8438488841056824.3f%\n",
      "0 tensor(0.1898, device='cuda:0')\n",
      "100 tensor(0.1668, device='cuda:0')\n",
      "200 tensor(0.2297, device='cuda:0')\n",
      "300 tensor(0.3876, device='cuda:0')\n",
      "Iteration: 43 | Loss: 0.24566404521465302 | Train,Test accuracy: 0.9167279005050659.3f%, 0.8429588675498962.3f%\n",
      "0 tensor(0.2585, device='cuda:0')\n",
      "100 tensor(0.2764, device='cuda:0')\n",
      "200 tensor(0.1390, device='cuda:0')\n",
      "300 tensor(0.2241, device='cuda:0')\n",
      "Iteration: 44 | Loss: 0.24278980493545532 | Train,Test accuracy: 0.9289482235908508.3f%, 0.8470134735107422.3f%\n",
      "0 tensor(0.2261, device='cuda:0')\n",
      "100 tensor(0.2504, device='cuda:0')\n",
      "200 tensor(0.3859, device='cuda:0')\n",
      "300 tensor(0.2701, device='cuda:0')\n",
      "Iteration: 45 | Loss: 0.24234908819198608 | Train,Test accuracy: 0.931253969669342.3f%, 0.846914529800415.3f%\n",
      "0 tensor(0.1609, device='cuda:0')\n",
      "100 tensor(0.1797, device='cuda:0')\n",
      "200 tensor(0.1506, device='cuda:0')\n",
      "300 tensor(0.1983, device='cuda:0')\n",
      "Iteration: 46 | Loss: 0.2404252290725708 | Train,Test accuracy: 0.9234814047813416.3f%, 0.8421677350997925.3f%\n",
      "0 tensor(0.2188, device='cuda:0')\n",
      "100 tensor(0.2078, device='cuda:0')\n",
      "200 tensor(0.1840, device='cuda:0')\n",
      "300 tensor(0.2046, device='cuda:0')\n",
      "Iteration: 47 | Loss: 0.23658770322799683 | Train,Test accuracy: 0.9279491901397705.3f%, 0.8390031456947327.3f%\n",
      "0 tensor(0.1669, device='cuda:0')\n",
      "100 tensor(0.2524, device='cuda:0')\n",
      "200 tensor(0.3572, device='cuda:0')\n",
      "300 tensor(0.2591, device='cuda:0')\n",
      "Iteration: 48 | Loss: 0.23390959203243256 | Train,Test accuracy: 0.9326486587524414.3f%, 0.8479034900665283.3f%\n",
      "0 tensor(0.1904, device='cuda:0')\n",
      "100 tensor(0.1938, device='cuda:0')\n",
      "200 tensor(0.3036, device='cuda:0')\n",
      "300 tensor(0.1491, device='cuda:0')\n",
      "Iteration: 49 | Loss: 0.23300285637378693 | Train,Test accuracy: 0.9299432635307312.3f%, 0.8452333807945251.3f%\n",
      "0 tensor(0.1899, device='cuda:0')\n",
      "100 tensor(0.2961, device='cuda:0')\n",
      "200 tensor(0.2642, device='cuda:0')\n",
      "300 tensor(0.1852, device='cuda:0')\n",
      "Iteration: 50 | Loss: 0.22989439964294434 | Train,Test accuracy: 0.9298713207244873.3f%, 0.8492879867553711.3f%\n",
      "0 tensor(0.2577, device='cuda:0')\n",
      "100 tensor(0.2497, device='cuda:0')\n",
      "200 tensor(0.2272, device='cuda:0')\n",
      "300 tensor(0.2915, device='cuda:0')\n",
      "Iteration: 51 | Loss: 0.2269386351108551 | Train,Test accuracy: 0.9210757613182068.3f%, 0.846914529800415.3f%\n",
      "0 tensor(0.3487, device='cuda:0')\n",
      "100 tensor(0.2180, device='cuda:0')\n",
      "200 tensor(0.1830, device='cuda:0')\n",
      "300 tensor(0.2877, device='cuda:0')\n",
      "Iteration: 52 | Loss: 0.2296053022146225 | Train,Test accuracy: 0.9265384674072266.3f%, 0.8487935066223145.3f%\n",
      "0 tensor(0.1238, device='cuda:0')\n",
      "100 tensor(0.2181, device='cuda:0')\n",
      "200 tensor(0.2628, device='cuda:0')\n",
      "300 tensor(0.2656, device='cuda:0')\n",
      "Iteration: 53 | Loss: 0.2307257354259491 | Train,Test accuracy: 0.9310821890830994.3f%, 0.8400909900665283.3f%\n",
      "0 tensor(0.2346, device='cuda:0')\n",
      "100 tensor(0.2098, device='cuda:0')\n",
      "200 tensor(0.3062, device='cuda:0')\n",
      "300 tensor(0.3523, device='cuda:0')\n",
      "Iteration: 54 | Loss: 0.22458332777023315 | Train,Test accuracy: 0.9306066036224365.3f%, 0.8458267450332642.3f%\n",
      "0 tensor(0.2961, device='cuda:0')\n",
      "100 tensor(0.2508, device='cuda:0')\n",
      "200 tensor(0.3223, device='cuda:0')\n",
      "300 tensor(0.3155, device='cuda:0')\n",
      "Iteration: 55 | Loss: 0.2204955816268921 | Train,Test accuracy: 0.9306145906448364.3f%, 0.8501780033111572.3f%\n",
      "0 tensor(0.2841, device='cuda:0')\n",
      "100 tensor(0.2419, device='cuda:0')\n",
      "200 tensor(0.2249, device='cuda:0')\n",
      "300 tensor(0.3510, device='cuda:0')\n",
      "Iteration: 56 | Loss: 0.22180035710334778 | Train,Test accuracy: 0.9320172667503357.3f%, 0.8444422483444214.3f%\n",
      "0 tensor(0.1886, device='cuda:0')\n",
      "100 tensor(0.1382, device='cuda:0')\n",
      "200 tensor(0.1201, device='cuda:0')\n",
      "300 tensor(0.2545, device='cuda:0')\n",
      "Iteration: 57 | Loss: 0.21998712420463562 | Train,Test accuracy: 0.9304987788200378.3f%, 0.8470134735107422.3f%\n",
      "0 tensor(0.2297, device='cuda:0')\n",
      "100 tensor(0.1993, device='cuda:0')\n",
      "200 tensor(0.2307, device='cuda:0')\n",
      "300 tensor(0.3237, device='cuda:0')\n",
      "Iteration: 58 | Loss: 0.21754305064678192 | Train,Test accuracy: 0.930027186870575.3f%, 0.8410798907279968.3f%\n",
      "0 tensor(0.2444, device='cuda:0')\n",
      "100 tensor(0.2184, device='cuda:0')\n",
      "200 tensor(0.2526, device='cuda:0')\n",
      "300 tensor(0.1497, device='cuda:0')\n",
      "Iteration: 59 | Loss: 0.2133350372314453 | Train,Test accuracy: 0.9329403638839722.3f%, 0.8423655033111572.3f%\n",
      "0 tensor(0.1845, device='cuda:0')\n",
      "100 tensor(0.1649, device='cuda:0')\n",
      "200 tensor(0.2593, device='cuda:0')\n",
      "300 tensor(0.1882, device='cuda:0')\n",
      "Iteration: 60 | Loss: 0.22108164429664612 | Train,Test accuracy: 0.9296315312385559.3f%, 0.8461233973503113.3f%\n",
      "0 tensor(0.2045, device='cuda:0')\n",
      "100 tensor(0.1847, device='cuda:0')\n",
      "200 tensor(0.1311, device='cuda:0')\n",
      "300 tensor(0.1586, device='cuda:0')\n",
      "Iteration: 61 | Loss: 0.21362954378128052 | Train,Test accuracy: 0.9357936978340149.3f%, 0.8541337251663208.3f%\n",
      "0 tensor(0.1039, device='cuda:0')\n",
      "100 tensor(0.1826, device='cuda:0')\n",
      "200 tensor(0.3803, device='cuda:0')\n",
      "300 tensor(0.1591, device='cuda:0')\n",
      "Iteration: 62 | Loss: 0.21364624798297882 | Train,Test accuracy: 0.9330163598060608.3f%, 0.8507713675498962.3f%\n",
      "0 tensor(0.1541, device='cuda:0')\n",
      "100 tensor(0.2131, device='cuda:0')\n",
      "200 tensor(0.2728, device='cuda:0')\n",
      "300 tensor(0.1860, device='cuda:0')\n",
      "Iteration: 63 | Loss: 0.21356083452701569 | Train,Test accuracy: 0.9361932873725891.3f%, 0.8435522317886353.3f%\n",
      "0 tensor(0.1379, device='cuda:0')\n",
      "100 tensor(0.3170, device='cuda:0')\n",
      "200 tensor(0.1574, device='cuda:0')\n",
      "300 tensor(0.3043, device='cuda:0')\n",
      "Iteration: 64 | Loss: 0.21244795620441437 | Train,Test accuracy: 0.9282408952713013.3f%, 0.8460245132446289.3f%\n",
      "0 tensor(0.2246, device='cuda:0')\n",
      "100 tensor(0.1247, device='cuda:0')\n",
      "200 tensor(0.2254, device='cuda:0')\n",
      "300 tensor(0.2647, device='cuda:0')\n",
      "Iteration: 65 | Loss: 0.21136532723903656 | Train,Test accuracy: 0.9367207288742065.3f%, 0.8433544039726257.3f%\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 tensor(0.1856, device='cuda:0')\n",
      "100 tensor(0.2000, device='cuda:0')\n",
      "200 tensor(0.1807, device='cuda:0')\n",
      "300 tensor(0.1488, device='cuda:0')\n",
      "Iteration: 66 | Loss: 0.21145881712436676 | Train,Test accuracy: 0.9348225593566895.3f%, 0.8429588675498962.3f%\n",
      "0 tensor(0.2515, device='cuda:0')\n",
      "100 tensor(0.1717, device='cuda:0')\n",
      "200 tensor(0.2172, device='cuda:0')\n",
      "300 tensor(0.1770, device='cuda:0')\n",
      "Iteration: 67 | Loss: 0.20946188271045685 | Train,Test accuracy: 0.9364410042762756.3f%, 0.8403876423835754.3f%\n",
      "0 tensor(0.3195, device='cuda:0')\n",
      "100 tensor(0.1499, device='cuda:0')\n",
      "200 tensor(0.2319, device='cuda:0')\n",
      "300 tensor(0.1727, device='cuda:0')\n",
      "Iteration: 68 | Loss: 0.20495417714118958 | Train,Test accuracy: 0.9334718585014343.3f%, 0.8433544039726257.3f%\n",
      "0 tensor(0.1263, device='cuda:0')\n",
      "100 tensor(0.2206, device='cuda:0')\n",
      "200 tensor(0.1883, device='cuda:0')\n",
      "300 tensor(0.1144, device='cuda:0')\n",
      "Iteration: 69 | Loss: 0.2063254863023758 | Train,Test accuracy: 0.9373041987419128.3f%, 0.8532436490058899.3f%\n",
      "0 tensor(0.1729, device='cuda:0')\n",
      "100 tensor(0.3330, device='cuda:0')\n",
      "200 tensor(0.2195, device='cuda:0')\n",
      "300 tensor(0.1520, device='cuda:0')\n",
      "Iteration: 70 | Loss: 0.2054002583026886 | Train,Test accuracy: 0.9390225410461426.3f%, 0.8557159900665283.3f%\n",
      "0 tensor(0.1402, device='cuda:0')\n",
      "100 tensor(0.0904, device='cuda:0')\n",
      "200 tensor(0.2722, device='cuda:0')\n",
      "300 tensor(0.2026, device='cuda:0')\n",
      "Iteration: 71 | Loss: 0.20963627099990845 | Train,Test accuracy: 0.9289961457252502.3f%, 0.8363330960273743.3f%\n",
      "0 tensor(0.1912, device='cuda:0')\n",
      "100 tensor(0.2535, device='cuda:0')\n",
      "200 tensor(0.1872, device='cuda:0')\n",
      "300 tensor(0.1679, device='cuda:0')\n",
      "Iteration: 72 | Loss: 0.2035914659500122 | Train,Test accuracy: 0.938127338886261.3f%, 0.8511669039726257.3f%\n",
      "0 tensor(0.1275, device='cuda:0')\n",
      "100 tensor(0.1778, device='cuda:0')\n",
      "200 tensor(0.1554, device='cuda:0')\n",
      "300 tensor(0.1165, device='cuda:0')\n",
      "Iteration: 73 | Loss: 0.2028147429227829 | Train,Test accuracy: 0.9210837483406067.3f%, 0.8272349834442139.3f%\n",
      "0 tensor(0.2467, device='cuda:0')\n",
      "100 tensor(0.2286, device='cuda:0')\n",
      "200 tensor(0.3016, device='cuda:0')\n",
      "300 tensor(0.2424, device='cuda:0')\n",
      "Iteration: 74 | Loss: 0.20839855074882507 | Train,Test accuracy: 0.9374960064888.3f%, 0.8482990264892578.3f%\n",
      "0 tensor(0.1565, device='cuda:0')\n",
      "100 tensor(0.2247, device='cuda:0')\n",
      "200 tensor(0.2394, device='cuda:0')\n",
      "300 tensor(0.1296, device='cuda:0')\n",
      "Iteration: 75 | Loss: 0.2028941661119461 | Train,Test accuracy: 0.9379275441169739.3f%, 0.8568037748336792.3f%\n",
      "0 tensor(0.2337, device='cuda:0')\n",
      "100 tensor(0.1689, device='cuda:0')\n",
      "200 tensor(0.3429, device='cuda:0')\n",
      "300 tensor(0.4304, device='cuda:0')\n",
      "Iteration: 76 | Loss: 0.20429468154907227 | Train,Test accuracy: 0.9397058486938477.3f%, 0.8438488841056824.3f%\n",
      "0 tensor(0.2064, device='cuda:0')\n",
      "100 tensor(0.1539, device='cuda:0')\n",
      "200 tensor(0.1405, device='cuda:0')\n",
      "300 tensor(0.1707, device='cuda:0')\n",
      "Iteration: 77 | Loss: 0.2024412602186203 | Train,Test accuracy: 0.9381593465805054.3f%, 0.8512658476829529.3f%\n",
      "0 tensor(0.0734, device='cuda:0')\n",
      "100 tensor(0.1738, device='cuda:0')\n",
      "200 tensor(0.2172, device='cuda:0')\n",
      "300 tensor(0.1537, device='cuda:0')\n",
      "Iteration: 78 | Loss: 0.19542087614536285 | Train,Test accuracy: 0.9355778694152832.3f%, 0.8441455960273743.3f%\n",
      "0 tensor(0.2904, device='cuda:0')\n",
      "100 tensor(0.1178, device='cuda:0')\n",
      "200 tensor(0.2525, device='cuda:0')\n",
      "300 tensor(0.2875, device='cuda:0')\n",
      "Iteration: 79 | Loss: 0.1994638890028 | Train,Test accuracy: 0.9428228735923767.3f%, 0.8486946225166321.3f%\n",
      "0 tensor(0.1844, device='cuda:0')\n",
      "100 tensor(0.2621, device='cuda:0')\n",
      "200 tensor(0.2005, device='cuda:0')\n",
      "300 tensor(0.2391, device='cuda:0')\n",
      "Iteration: 80 | Loss: 0.19585677981376648 | Train,Test accuracy: 0.9408727884292603.3f%, 0.8470134735107422.3f%\n",
      "0 tensor(0.1205, device='cuda:0')\n",
      "100 tensor(0.1171, device='cuda:0')\n",
      "200 tensor(0.2278, device='cuda:0')\n",
      "300 tensor(0.2467, device='cuda:0')\n",
      "Iteration: 81 | Loss: 0.19845902919769287 | Train,Test accuracy: 0.9417918920516968.3f%, 0.8386076092720032.3f%\n",
      "0 tensor(0.1791, device='cuda:0')\n",
      "100 tensor(0.1017, device='cuda:0')\n",
      "200 tensor(0.1479, device='cuda:0')\n",
      "300 tensor(0.1457, device='cuda:0')\n",
      "Iteration: 82 | Loss: 0.1319730281829834 | Train,Test accuracy: 0.9653453230857849.3f%, 0.8661985993385315.3f%\n",
      "0 tensor(0.0496, device='cuda:0')\n",
      "100 tensor(0.0672, device='cuda:0')\n",
      "200 tensor(0.0895, device='cuda:0')\n",
      "300 tensor(0.0873, device='cuda:0')\n",
      "Iteration: 83 | Loss: 0.11477620899677277 | Train,Test accuracy: 0.9658128023147583.3f%, 0.8627373576164246.3f%\n",
      "0 tensor(0.0798, device='cuda:0')\n",
      "100 tensor(0.0895, device='cuda:0')\n",
      "200 tensor(0.0928, device='cuda:0')\n",
      "300 tensor(0.0997, device='cuda:0')\n",
      "Iteration: 84 | Loss: 0.10936139523983002 | Train,Test accuracy: 0.9661045670509338.3f%, 0.8583860993385315.3f%\n",
      "0 tensor(0.0999, device='cuda:0')\n",
      "100 tensor(0.0826, device='cuda:0')\n",
      "200 tensor(0.1777, device='cuda:0')\n",
      "300 tensor(0.1164, device='cuda:0')\n",
      "Iteration: 85 | Loss: 0.10804338753223419 | Train,Test accuracy: 0.966779887676239.3f%, 0.8531447649002075.3f%\n",
      "0 tensor(0.0768, device='cuda:0')\n",
      "100 tensor(0.0846, device='cuda:0')\n",
      "200 tensor(0.1586, device='cuda:0')\n",
      "300 tensor(0.1124, device='cuda:0')\n",
      "Iteration: 86 | Loss: 0.11015201359987259 | Train,Test accuracy: 0.9664722084999084.3f%, 0.8536392450332642.3f%\n",
      "0 tensor(0.0616, device='cuda:0')\n",
      "100 tensor(0.0744, device='cuda:0')\n",
      "200 tensor(0.0651, device='cuda:0')\n",
      "300 tensor(0.0750, device='cuda:0')\n",
      "Iteration: 87 | Loss: 0.10163959115743637 | Train,Test accuracy: 0.9620803594589233.3f%, 0.845530092716217.3f%\n",
      "0 tensor(0.0983, device='cuda:0')\n",
      "100 tensor(0.0340, device='cuda:0')\n",
      "200 tensor(0.1298, device='cuda:0')\n",
      "300 tensor(0.1316, device='cuda:0')\n",
      "Iteration: 88 | Loss: 0.10430160164833069 | Train,Test accuracy: 0.9705842733383179.3f%, 0.856210470199585.3f%\n",
      "0 tensor(0.0656, device='cuda:0')\n",
      "100 tensor(0.0564, device='cuda:0')\n",
      "200 tensor(0.0855, device='cuda:0')\n",
      "300 tensor(0.1145, device='cuda:0')\n",
      "Iteration: 89 | Loss: 0.09793151915073395 | Train,Test accuracy: 0.968122661113739.3f%, 0.8542326092720032.3f%\n",
      "0 tensor(0.1380, device='cuda:0')\n",
      "100 tensor(0.1548, device='cuda:0')\n",
      "200 tensor(0.1308, device='cuda:0')\n",
      "300 tensor(0.1241, device='cuda:0')\n",
      "Iteration: 90 | Loss: 0.10644049942493439 | Train,Test accuracy: 0.9682504534721375.3f%, 0.8569027185440063.3f%\n",
      "0 tensor(0.1019, device='cuda:0')\n",
      "100 tensor(0.0749, device='cuda:0')\n",
      "200 tensor(0.0716, device='cuda:0')\n",
      "300 tensor(0.1876, device='cuda:0')\n",
      "Iteration: 91 | Loss: 0.10094285756349564 | Train,Test accuracy: 0.969916820526123.3f%, 0.8558148741722107.3f%\n",
      "0 tensor(0.0459, device='cuda:0')\n",
      "100 tensor(0.0874, device='cuda:0')\n",
      "200 tensor(0.1054, device='cuda:0')\n",
      "300 tensor(0.1138, device='cuda:0')\n",
      "Iteration: 92 | Loss: 0.10017802566289902 | Train,Test accuracy: 0.9721787571907043.3f%, 0.8568037748336792.3f%\n",
      "0 tensor(0.0865, device='cuda:0')\n",
      "100 tensor(0.1063, device='cuda:0')\n",
      "200 tensor(0.1393, device='cuda:0')\n",
      "300 tensor(0.0928, device='cuda:0')\n",
      "Iteration: 93 | Loss: 0.09788557142019272 | Train,Test accuracy: 0.9701966047286987.3f%, 0.8507713675498962.3f%\n",
      "0 tensor(0.0863, device='cuda:0')\n",
      "100 tensor(0.1020, device='cuda:0')\n",
      "200 tensor(0.1102, device='cuda:0')\n",
      "300 tensor(0.0366, device='cuda:0')\n",
      "Iteration: 94 | Loss: 0.10404903441667557 | Train,Test accuracy: 0.9690657258033752.3f%, 0.8583860993385315.3f%\n",
      "0 tensor(0.0950, device='cuda:0')\n",
      "100 tensor(0.0563, device='cuda:0')\n",
      "200 tensor(0.1155, device='cuda:0')\n",
      "300 tensor(0.1476, device='cuda:0')\n",
      "Iteration: 95 | Loss: 0.09811404347419739 | Train,Test accuracy: 0.9701007604598999.3f%, 0.8539358973503113.3f%\n",
      "0 tensor(0.0703, device='cuda:0')\n",
      "100 tensor(0.1380, device='cuda:0')\n",
      "200 tensor(0.0820, device='cuda:0')\n",
      "300 tensor(0.0335, device='cuda:0')\n",
      "Iteration: 96 | Loss: 0.09832646697759628 | Train,Test accuracy: 0.9678348898887634.3f%, 0.8542326092720032.3f%\n",
      "0 tensor(0.1017, device='cuda:0')\n",
      "100 tensor(0.0667, device='cuda:0')\n",
      "200 tensor(0.0965, device='cuda:0')\n",
      "300 tensor(0.1034, device='cuda:0')\n",
      "Iteration: 97 | Loss: 0.09915091842412949 | Train,Test accuracy: 0.969916820526123.3f%, 0.8582871556282043.3f%\n",
      "0 tensor(0.0564, device='cuda:0')\n",
      "100 tensor(0.0873, device='cuda:0')\n",
      "200 tensor(0.0473, device='cuda:0')\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "300 tensor(0.1013, device='cuda:0')\n",
      "Iteration: 98 | Loss: 0.09381457418203354 | Train,Test accuracy: 0.9712516069412231.3f%, 0.864022970199585.3f%\n",
      "0 tensor(0.1097, device='cuda:0')\n",
      "100 tensor(0.1126, device='cuda:0')\n",
      "200 tensor(0.0699, device='cuda:0')\n",
      "300 tensor(0.1007, device='cuda:0')\n",
      "Iteration: 99 | Loss: 0.09804291278123856 | Train,Test accuracy: 0.9697051048278809.3f%, 0.856210470199585.3f%\n",
      "0 tensor(0.1252, device='cuda:0')\n",
      "100 tensor(0.0633, device='cuda:0')\n",
      "200 tensor(0.0866, device='cuda:0')\n",
      "300 tensor(0.0878, device='cuda:0')\n",
      "Iteration: 100 | Loss: 0.09924370795488358 | Train,Test accuracy: 0.9710517525672913.3f%, 0.8520569801330566.3f%\n",
      "0 tensor(0.0456, device='cuda:0')\n",
      "100 tensor(0.0987, device='cuda:0')\n",
      "200 tensor(0.1691, device='cuda:0')\n",
      "300 tensor(0.1121, device='cuda:0')\n",
      "Iteration: 101 | Loss: 0.09217723459005356 | Train,Test accuracy: 0.9729299545288086.3f%, 0.8493868708610535.3f%\n",
      "0 tensor(0.0386, device='cuda:0')\n",
      "100 tensor(0.1194, device='cuda:0')\n",
      "200 tensor(0.0610, device='cuda:0')\n",
      "300 tensor(0.1305, device='cuda:0')\n",
      "Iteration: 102 | Loss: 0.09861398488283157 | Train,Test accuracy: 0.9698968529701233.3f%, 0.8558148741722107.3f%\n",
      "0 tensor(0.0424, device='cuda:0')\n",
      "100 tensor(0.0614, device='cuda:0')\n",
      "200 tensor(0.1039, device='cuda:0')\n",
      "300 tensor(0.0598, device='cuda:0')\n",
      "Iteration: 103 | Loss: 0.09786706417798996 | Train,Test accuracy: 0.9711117148399353.3f%, 0.8595727682113647.3f%\n",
      "0 tensor(0.0866, device='cuda:0')\n",
      "100 tensor(0.0888, device='cuda:0')\n",
      "200 tensor(0.0836, device='cuda:0')\n",
      "300 tensor(0.0832, device='cuda:0')\n",
      "Iteration: 104 | Loss: 0.1003345400094986 | Train,Test accuracy: 0.9716112613677979.3f%, 0.8552215099334717.3f%\n",
      "0 tensor(0.1282, device='cuda:0')\n",
      "100 tensor(0.0979, device='cuda:0')\n",
      "200 tensor(0.0491, device='cuda:0')\n",
      "300 tensor(0.0856, device='cuda:0')\n",
      "Iteration: 105 | Loss: 0.09517528116703033 | Train,Test accuracy: 0.970240592956543.3f%, 0.8567048907279968.3f%\n",
      "0 tensor(0.0731, device='cuda:0')\n",
      "100 tensor(0.1209, device='cuda:0')\n",
      "200 tensor(0.0582, device='cuda:0')\n",
      "300 tensor(0.1081, device='cuda:0')\n",
      "Iteration: 106 | Loss: 0.09362240880727768 | Train,Test accuracy: 0.9703884124755859.3f%, 0.859375.3f%\n",
      "0 tensor(0.1129, device='cuda:0')\n",
      "100 tensor(0.0900, device='cuda:0')\n",
      "200 tensor(0.0752, device='cuda:0')\n",
      "300 tensor(0.0379, device='cuda:0')\n",
      "Iteration: 107 | Loss: 0.09233036637306213 | Train,Test accuracy: 0.9698209762573242.3f%, 0.854727029800415.3f%\n",
      "0 tensor(0.0568, device='cuda:0')\n",
      "100 tensor(0.0635, device='cuda:0')\n",
      "200 tensor(0.0999, device='cuda:0')\n",
      "300 tensor(0.1069, device='cuda:0')\n",
      "Iteration: 108 | Loss: 0.09398282319307327 | Train,Test accuracy: 0.966424286365509.3f%, 0.8555182218551636.3f%\n",
      "0 tensor(0.1229, device='cuda:0')\n",
      "100 tensor(0.1050, device='cuda:0')\n",
      "200 tensor(0.1266, device='cuda:0')\n",
      "300 tensor(0.0930, device='cuda:0')\n",
      "Iteration: 109 | Loss: 0.0975503921508789 | Train,Test accuracy: 0.9730738401412964.3f%, 0.8543314933776855.3f%\n",
      "0 tensor(0.0695, device='cuda:0')\n",
      "100 tensor(0.0806, device='cuda:0')\n",
      "200 tensor(0.1139, device='cuda:0')\n",
      "300 tensor(0.0910, device='cuda:0')\n",
      "Iteration: 110 | Loss: 0.09310371428728104 | Train,Test accuracy: 0.9696131348609924.3f%, 0.8555182218551636.3f%\n",
      "0 tensor(0.1065, device='cuda:0')\n",
      "100 tensor(0.0672, device='cuda:0')\n",
      "200 tensor(0.1082, device='cuda:0')\n",
      "300 tensor(0.0959, device='cuda:0')\n",
      "Iteration: 111 | Loss: 0.09349647164344788 | Train,Test accuracy: 0.9714834094047546.3f%, 0.8534414768218994.3f%\n",
      "0 tensor(0.0548, device='cuda:0')\n",
      "100 tensor(0.1491, device='cuda:0')\n",
      "200 tensor(0.0867, device='cuda:0')\n",
      "300 tensor(0.0632, device='cuda:0')\n",
      "Iteration: 112 | Loss: 0.09624825417995453 | Train,Test accuracy: 0.96977698802948.3f%, 0.8461233973503113.3f%\n",
      "0 tensor(0.0755, device='cuda:0')\n",
      "100 tensor(0.1177, device='cuda:0')\n",
      "200 tensor(0.1138, device='cuda:0')\n",
      "300 tensor(0.1857, device='cuda:0')\n",
      "Iteration: 113 | Loss: 0.09658562391996384 | Train,Test accuracy: 0.9708999395370483.3f%, 0.8609572649002075.3f%\n",
      "0 tensor(0.0621, device='cuda:0')\n",
      "100 tensor(0.1483, device='cuda:0')\n",
      "200 tensor(0.0963, device='cuda:0')\n",
      "300 tensor(0.0699, device='cuda:0')\n",
      "Iteration: 114 | Loss: 0.09141182154417038 | Train,Test accuracy: 0.969900906085968.3f%, 0.8586827516555786.3f%\n",
      "0 tensor(0.0584, device='cuda:0')\n",
      "100 tensor(0.0607, device='cuda:0')\n",
      "200 tensor(0.1199, device='cuda:0')\n",
      "300 tensor(0.1082, device='cuda:0')\n",
      "Iteration: 115 | Loss: 0.09701194614171982 | Train,Test accuracy: 0.9708639979362488.3f%, 0.8570016026496887.3f%\n",
      "0 tensor(0.1128, device='cuda:0')\n",
      "100 tensor(0.1049, device='cuda:0')\n",
      "200 tensor(0.1166, device='cuda:0')\n",
      "300 tensor(0.0493, device='cuda:0')\n",
      "Iteration: 116 | Loss: 0.09117225557565689 | Train,Test accuracy: 0.9746283292770386.3f%, 0.8569027185440063.3f%\n",
      "0 tensor(0.1881, device='cuda:0')\n",
      "100 tensor(0.0763, device='cuda:0')\n",
      "200 tensor(0.0402, device='cuda:0')\n",
      "300 tensor(0.1252, device='cuda:0')\n",
      "Iteration: 117 | Loss: 0.09385775774717331 | Train,Test accuracy: 0.9693094491958618.3f%, 0.8539358973503113.3f%\n",
      "0 tensor(0.0194, device='cuda:0')\n",
      "100 tensor(0.1072, device='cuda:0')\n",
      "200 tensor(0.0263, device='cuda:0')\n",
      "300 tensor(0.1189, device='cuda:0')\n",
      "Iteration: 118 | Loss: 0.09267105162143707 | Train,Test accuracy: 0.972290575504303.3f%, 0.8572982549667358.3f%\n",
      "0 tensor(0.1133, device='cuda:0')\n",
      "100 tensor(0.0700, device='cuda:0')\n",
      "200 tensor(0.1161, device='cuda:0')\n",
      "300 tensor(0.1854, device='cuda:0')\n",
      "Iteration: 119 | Loss: 0.09363407641649246 | Train,Test accuracy: 0.9726423025131226.3f%, 0.861155092716217.3f%\n",
      "0 tensor(0.0548, device='cuda:0')\n",
      "100 tensor(0.0291, device='cuda:0')\n",
      "200 tensor(0.0597, device='cuda:0')\n",
      "300 tensor(0.1547, device='cuda:0')\n",
      "Iteration: 120 | Loss: 0.09108507633209229 | Train,Test accuracy: 0.9661164879798889.3f%, 0.8579905033111572.3f%\n",
      "0 tensor(0.1758, device='cuda:0')\n",
      "100 tensor(0.0733, device='cuda:0')\n",
      "200 tensor(0.1582, device='cuda:0')\n",
      "300 tensor(0.0827, device='cuda:0')\n",
      "Iteration: 121 | Loss: 0.09629058837890625 | Train,Test accuracy: 0.9702325463294983.3f%, 0.8609572649002075.3f%\n",
      "0 tensor(0.0698, device='cuda:0')\n",
      "100 tensor(0.0942, device='cuda:0')\n",
      "200 tensor(0.1303, device='cuda:0')\n",
      "300 tensor(0.0401, device='cuda:0')\n",
      "Iteration: 122 | Loss: 0.09574016183614731 | Train,Test accuracy: 0.9729459881782532.3f%, 0.8544303774833679.3f%\n",
      "0 tensor(0.0967, device='cuda:0')\n",
      "100 tensor(0.1194, device='cuda:0')\n",
      "200 tensor(0.0461, device='cuda:0')\n",
      "300 tensor(0.0846, device='cuda:0')\n",
      "Iteration: 123 | Loss: 0.09046962112188339 | Train,Test accuracy: 0.970588207244873.3f%, 0.8520569801330566.3f%\n",
      "0 tensor(0.0978, device='cuda:0')\n",
      "100 tensor(0.0866, device='cuda:0')\n",
      "200 tensor(0.0564, device='cuda:0')\n",
      "300 tensor(0.0384, device='cuda:0')\n",
      "Iteration: 124 | Loss: 0.0919240266084671 | Train,Test accuracy: 0.9746803045272827.3f%, 0.856210470199585.3f%\n",
      "0 tensor(0.0673, device='cuda:0')\n",
      "100 tensor(0.0422, device='cuda:0')\n",
      "200 tensor(0.0546, device='cuda:0')\n",
      "300 tensor(0.0975, device='cuda:0')\n",
      "Iteration: 125 | Loss: 0.09336759150028229 | Train,Test accuracy: 0.9680427312850952.3f%, 0.8548259735107422.3f%\n",
      "0 tensor(0.0832, device='cuda:0')\n",
      "100 tensor(0.1216, device='cuda:0')\n",
      "200 tensor(0.0787, device='cuda:0')\n",
      "300 tensor(0.0919, device='cuda:0')\n",
      "Iteration: 126 | Loss: 0.09313718974590302 | Train,Test accuracy: 0.9744405746459961.3f%, 0.8590783476829529.3f%\n",
      "0 tensor(0.1218, device='cuda:0')\n",
      "100 tensor(0.0618, device='cuda:0')\n",
      "200 tensor(0.1099, device='cuda:0')\n",
      "300 tensor(0.0506, device='cuda:0')\n",
      "Iteration: 127 | Loss: 0.0916994959115982 | Train,Test accuracy: 0.9695731997489929.3f%, 0.8519580960273743.3f%\n",
      "0 tensor(0.1056, device='cuda:0')\n",
      "100 tensor(0.0974, device='cuda:0')\n",
      "200 tensor(0.0969, device='cuda:0')\n",
      "300 tensor(0.1263, device='cuda:0')\n",
      "Iteration: 128 | Loss: 0.09511663764715195 | Train,Test accuracy: 0.9744005799293518.3f%, 0.8594738841056824.3f%\n",
      "0 tensor(0.1383, device='cuda:0')\n",
      "100 tensor(0.0430, device='cuda:0')\n",
      "200 tensor(0.1019, device='cuda:0')\n",
      "300 tensor(0.0236, device='cuda:0')\n",
      "Iteration: 129 | Loss: 0.08814269304275513 | Train,Test accuracy: 0.9746922850608826.3f%, 0.8572982549667358.3f%\n",
      "0 tensor(0.1051, device='cuda:0')\n",
      "100 tensor(0.0395, device='cuda:0')\n",
      "200 tensor(0.0879, device='cuda:0')\n",
      "300 tensor(0.0962, device='cuda:0')\n",
      "Iteration: 130 | Loss: 0.09230250865221024 | Train,Test accuracy: 0.9754515290260315.3f%, 0.8603639006614685.3f%\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 tensor(0.0983, device='cuda:0')\n",
      "100 tensor(0.1070, device='cuda:0')\n",
      "200 tensor(0.1154, device='cuda:0')\n",
      "300 tensor(0.0920, device='cuda:0')\n",
      "Iteration: 131 | Loss: 0.09336642920970917 | Train,Test accuracy: 0.9708600044250488.3f%, 0.8522547483444214.3f%\n",
      "0 tensor(0.0452, device='cuda:0')\n",
      "100 tensor(0.0535, device='cuda:0')\n",
      "200 tensor(0.0592, device='cuda:0')\n",
      "300 tensor(0.1499, device='cuda:0')\n",
      "Iteration: 132 | Loss: 0.08828316628932953 | Train,Test accuracy: 0.9730898141860962.3f%, 0.8590783476829529.3f%\n",
      "0 tensor(0.1352, device='cuda:0')\n",
      "100 tensor(0.0632, device='cuda:0')\n",
      "200 tensor(0.1504, device='cuda:0')\n",
      "300 tensor(0.0329, device='cuda:0')\n",
      "Iteration: 133 | Loss: 0.09110604226589203 | Train,Test accuracy: 0.9732217192649841.3f%, 0.8579905033111572.3f%\n",
      "0 tensor(0.1055, device='cuda:0')\n",
      "100 tensor(0.1915, device='cuda:0')\n",
      "200 tensor(0.1201, device='cuda:0')\n",
      "300 tensor(0.0600, device='cuda:0')\n",
      "Iteration: 134 | Loss: 0.08905460685491562 | Train,Test accuracy: 0.9760109782218933.3f%, 0.8576938509941101.3f%\n",
      "0 tensor(0.0788, device='cuda:0')\n",
      "100 tensor(0.0634, device='cuda:0')\n",
      "200 tensor(0.0599, device='cuda:0')\n",
      "300 tensor(0.1027, device='cuda:0')\n",
      "Iteration: 135 | Loss: 0.08839637041091919 | Train,Test accuracy: 0.9725903272628784.3f%, 0.8622428774833679.3f%\n",
      "0 tensor(0.0877, device='cuda:0')\n",
      "100 tensor(0.0790, device='cuda:0')\n",
      "200 tensor(0.1048, device='cuda:0')\n",
      "300 tensor(0.1010, device='cuda:0')\n",
      "Iteration: 136 | Loss: 0.09240934252738953 | Train,Test accuracy: 0.9730179309844971.3f%, 0.8627373576164246.3f%\n",
      "0 tensor(0.1275, device='cuda:0')\n",
      "100 tensor(0.0765, device='cuda:0')\n",
      "200 tensor(0.0822, device='cuda:0')\n",
      "300 tensor(0.0623, device='cuda:0')\n",
      "Iteration: 137 | Loss: 0.08912904560565948 | Train,Test accuracy: 0.9747322201728821.3f%, 0.8571993708610535.3f%\n",
      "0 tensor(0.0339, device='cuda:0')\n",
      "100 tensor(0.0877, device='cuda:0')\n",
      "200 tensor(0.0631, device='cuda:0')\n",
      "300 tensor(0.0436, device='cuda:0')\n",
      "Iteration: 138 | Loss: 0.0937429741024971 | Train,Test accuracy: 0.9736332893371582.3f%, 0.860561728477478.3f%\n",
      "0 tensor(0.0387, device='cuda:0')\n",
      "100 tensor(0.0476, device='cuda:0')\n",
      "200 tensor(0.1021, device='cuda:0')\n",
      "300 tensor(0.0473, device='cuda:0')\n",
      "Iteration: 139 | Loss: 0.09048768132925034 | Train,Test accuracy: 0.9714953303337097.3f%, 0.8566060066223145.3f%\n",
      "0 tensor(0.0897, device='cuda:0')\n",
      "100 tensor(0.0757, device='cuda:0')\n",
      "200 tensor(0.0583, device='cuda:0')\n",
      "300 tensor(0.0658, device='cuda:0')\n",
      "Iteration: 140 | Loss: 0.08922422677278519 | Train,Test accuracy: 0.9741288423538208.3f%, 0.8544303774833679.3f%\n",
      "0 tensor(0.0258, device='cuda:0')\n",
      "100 tensor(0.0638, device='cuda:0')\n",
      "200 tensor(0.0485, device='cuda:0')\n",
      "300 tensor(0.1470, device='cuda:0')\n",
      "Iteration: 141 | Loss: 0.09096837043762207 | Train,Test accuracy: 0.9745844006538391.3f%, 0.8604628443717957.3f%\n",
      "0 tensor(0.1029, device='cuda:0')\n",
      "100 tensor(0.0374, device='cuda:0')\n",
      "200 tensor(0.0785, device='cuda:0')\n",
      "300 tensor(0.0331, device='cuda:0')\n",
      "Iteration: 142 | Loss: 0.05066622793674469 | Train,Test accuracy: 0.9870204329490662.3f%, 0.8682753443717957.3f%\n",
      "0 tensor(0.0334, device='cuda:0')\n",
      "100 tensor(0.0195, device='cuda:0')\n",
      "200 tensor(0.0311, device='cuda:0')\n",
      "300 tensor(0.0419, device='cuda:0')\n",
      "Iteration: 143 | Loss: 0.03689252585172653 | Train,Test accuracy: 0.9897778034210205.3f%, 0.8721321225166321.3f%\n",
      "0 tensor(0.0174, device='cuda:0')\n",
      "100 tensor(0.0079, device='cuda:0')\n",
      "200 tensor(0.0300, device='cuda:0')\n",
      "300 tensor(0.0152, device='cuda:0')\n",
      "Iteration: 144 | Loss: 0.02989381179213524 | Train,Test accuracy: 0.9908367395401001.3f%, 0.8723298907279968.3f%\n",
      "0 tensor(0.0099, device='cuda:0')\n",
      "100 tensor(0.0276, device='cuda:0')\n",
      "200 tensor(0.0174, device='cuda:0')\n",
      "300 tensor(0.0082, device='cuda:0')\n",
      "Iteration: 145 | Loss: 0.028117908164858818 | Train,Test accuracy: 0.9923194050788879.3f%, 0.8702531456947327.3f%\n",
      "0 tensor(0.0428, device='cuda:0')\n",
      "100 tensor(0.0460, device='cuda:0')\n",
      "200 tensor(0.0249, device='cuda:0')\n",
      "300 tensor(0.0171, device='cuda:0')\n",
      "Iteration: 146 | Loss: 0.02721189148724079 | Train,Test accuracy: 0.9929267764091492.3f%, 0.8713409900665283.3f%\n",
      "0 tensor(0.0287, device='cuda:0')\n",
      "100 tensor(0.0099, device='cuda:0')\n",
      "200 tensor(0.0186, device='cuda:0')\n",
      "300 tensor(0.0315, device='cuda:0')\n",
      "Iteration: 147 | Loss: 0.025375550612807274 | Train,Test accuracy: 0.9936660528182983.3f%, 0.8697587251663208.3f%\n",
      "0 tensor(0.0288, device='cuda:0')\n",
      "100 tensor(0.0031, device='cuda:0')\n",
      "200 tensor(0.0201, device='cuda:0')\n",
      "300 tensor(0.0251, device='cuda:0')\n",
      "Iteration: 148 | Loss: 0.023688744753599167 | Train,Test accuracy: 0.9941815733909607.3f%, 0.871835470199585.3f%\n",
      "0 tensor(0.0129, device='cuda:0')\n",
      "100 tensor(0.0050, device='cuda:0')\n",
      "200 tensor(0.0152, device='cuda:0')\n",
      "300 tensor(0.0352, device='cuda:0')\n",
      "Iteration: 149 | Loss: 0.0215652696788311 | Train,Test accuracy: 0.9941256642341614.3f%, 0.8726266026496887.3f%\n",
      "0 tensor(0.0152, device='cuda:0')\n",
      "100 tensor(0.0270, device='cuda:0')\n",
      "200 tensor(0.0352, device='cuda:0')\n",
      "300 tensor(0.0079, device='cuda:0')\n",
      "Iteration: 150 | Loss: 0.019195718690752983 | Train,Test accuracy: 0.9935062527656555.3f%, 0.8751977682113647.3f%\n",
      "0 tensor(0.0085, device='cuda:0')\n",
      "100 tensor(0.0073, device='cuda:0')\n",
      "200 tensor(0.0246, device='cuda:0')\n",
      "300 tensor(0.0079, device='cuda:0')\n",
      "Iteration: 151 | Loss: 0.020532656461000443 | Train,Test accuracy: 0.9946851134300232.3f%, 0.8714398741722107.3f%\n",
      "0 tensor(0.0069, device='cuda:0')\n",
      "100 tensor(0.0397, device='cuda:0')\n",
      "200 tensor(0.0038, device='cuda:0')\n",
      "300 tensor(0.0162, device='cuda:0')\n",
      "Iteration: 152 | Loss: 0.018381968140602112 | Train,Test accuracy: 0.9949527978897095.3f%, 0.875.3f%\n",
      "0 tensor(0.0148, device='cuda:0')\n",
      "100 tensor(0.0083, device='cuda:0')\n",
      "200 tensor(0.0445, device='cuda:0')\n",
      "300 tensor(0.0160, device='cuda:0')\n",
      "Iteration: 153 | Loss: 0.01727008819580078 | Train,Test accuracy: 0.993486225605011.3f%, 0.8717365264892578.3f%\n",
      "0 tensor(0.0030, device='cuda:0')\n",
      "100 tensor(0.0113, device='cuda:0')\n",
      "200 tensor(0.0460, device='cuda:0')\n",
      "300 tensor(0.0329, device='cuda:0')\n",
      "Iteration: 154 | Loss: 0.01829918660223484 | Train,Test accuracy: 0.9946011900901794.3f%, 0.8736155033111572.3f%\n",
      "0 tensor(0.0060, device='cuda:0')\n",
      "100 tensor(0.0355, device='cuda:0')\n",
      "200 tensor(0.0165, device='cuda:0')\n",
      "300 tensor(0.0205, device='cuda:0')\n",
      "Iteration: 155 | Loss: 0.018387220799922943 | Train,Test accuracy: 0.9946730732917786.3f%, 0.8729232549667358.3f%\n",
      "0 tensor(0.0069, device='cuda:0')\n",
      "100 tensor(0.0280, device='cuda:0')\n",
      "200 tensor(0.0042, device='cuda:0')\n",
      "300 tensor(0.0172, device='cuda:0')\n",
      "Iteration: 156 | Loss: 0.016886521130800247 | Train,Test accuracy: 0.9947130680084229.3f%, 0.8737143874168396.3f%\n",
      "0 tensor(0.0215, device='cuda:0')\n",
      "100 tensor(0.0030, device='cuda:0')\n",
      "200 tensor(0.0189, device='cuda:0')\n",
      "300 tensor(0.0050, device='cuda:0')\n",
      "Iteration: 157 | Loss: 0.016337424516677856 | Train,Test accuracy: 0.9950447678565979.3f%, 0.8710442781448364.3f%\n",
      "0 tensor(0.0068, device='cuda:0')\n",
      "100 tensor(0.0079, device='cuda:0')\n",
      "200 tensor(0.0082, device='cuda:0')\n",
      "300 tensor(0.0124, device='cuda:0')\n",
      "Iteration: 158 | Loss: 0.016905061900615692 | Train,Test accuracy: 0.9952046275138855.3f%, 0.8728243708610535.3f%\n",
      "0 tensor(0.0060, device='cuda:0')\n",
      "100 tensor(0.0043, device='cuda:0')\n",
      "200 tensor(0.0087, device='cuda:0')\n",
      "300 tensor(0.0323, device='cuda:0')\n",
      "Iteration: 159 | Loss: 0.015912555158138275 | Train,Test accuracy: 0.995304524898529.3f%, 0.8751977682113647.3f%\n",
      "0 tensor(0.0118, device='cuda:0')\n",
      "100 tensor(0.0109, device='cuda:0')\n",
      "200 tensor(0.0058, device='cuda:0')\n",
      "300 tensor(0.0081, device='cuda:0')\n",
      "Iteration: 160 | Loss: 0.01725439354777336 | Train,Test accuracy: 0.9948449730873108.3f%, 0.8754944801330566.3f%\n",
      "0 tensor(0.0181, device='cuda:0')\n",
      "100 tensor(0.0087, device='cuda:0')\n",
      "200 tensor(0.0180, device='cuda:0')\n",
      "300 tensor(0.0055, device='cuda:0')\n",
      "Iteration: 161 | Loss: 0.014808150939643383 | Train,Test accuracy: 0.9949248433113098.3f%, 0.8704509735107422.3f%\n",
      "0 tensor(0.0096, device='cuda:0')\n",
      "100 tensor(0.0113, device='cuda:0')\n",
      "200 tensor(0.0199, device='cuda:0')\n",
      "300 tensor(0.0117, device='cuda:0')\n",
      "Iteration: 162 | Loss: 0.01602157950401306 | Train,Test accuracy: 0.9952645301818848.3f%, 0.871835470199585.3f%\n",
      "0 tensor(0.0472, device='cuda:0')\n",
      "100 tensor(0.0062, device='cuda:0')\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "200 tensor(0.0109, device='cuda:0')\n",
      "300 tensor(0.0061, device='cuda:0')\n",
      "Iteration: 163 | Loss: 0.014909118413925171 | Train,Test accuracy: 0.9956042170524597.3f%, 0.8740110993385315.3f%\n",
      "0 tensor(0.0160, device='cuda:0')\n",
      "100 tensor(0.0383, device='cuda:0')\n",
      "200 tensor(0.0041, device='cuda:0')\n",
      "300 tensor(0.0055, device='cuda:0')\n",
      "Iteration: 164 | Loss: 0.014852884225547314 | Train,Test accuracy: 0.9958919286727905.3f%, 0.8731210231781006.3f%\n",
      "0 tensor(0.0054, device='cuda:0')\n",
      "100 tensor(0.0077, device='cuda:0')\n",
      "200 tensor(0.0206, device='cuda:0')\n",
      "300 tensor(0.0517, device='cuda:0')\n",
      "Iteration: 165 | Loss: 0.01570245437324047 | Train,Test accuracy: 0.9950447678565979.3f%, 0.8737143874168396.3f%\n",
      "0 tensor(0.0069, device='cuda:0')\n",
      "100 tensor(0.0057, device='cuda:0')\n",
      "200 tensor(0.0199, device='cuda:0')\n",
      "300 tensor(0.0037, device='cuda:0')\n",
      "Iteration: 166 | Loss: 0.015115943737328053 | Train,Test accuracy: 0.9944652915000916.3f%, 0.8691653609275818.3f%\n",
      "0 tensor(0.0070, device='cuda:0')\n",
      "100 tensor(0.0062, device='cuda:0')\n",
      "200 tensor(0.0037, device='cuda:0')\n",
      "300 tensor(0.0179, device='cuda:0')\n",
      "Iteration: 167 | Loss: 0.015615621581673622 | Train,Test accuracy: 0.9956521391868591.3f%, 0.8736155033111572.3f%\n",
      "0 tensor(0.0040, device='cuda:0')\n",
      "100 tensor(0.0210, device='cuda:0')\n",
      "200 tensor(0.0480, device='cuda:0')\n",
      "300 tensor(0.0070, device='cuda:0')\n",
      "Iteration: 168 | Loss: 0.016224326565861702 | Train,Test accuracy: 0.9946811199188232.3f%, 0.8727254867553711.3f%\n",
      "0 tensor(0.0053, device='cuda:0')\n",
      "100 tensor(0.0037, device='cuda:0')\n",
      "200 tensor(0.0076, device='cuda:0')\n",
      "300 tensor(0.0073, device='cuda:0')\n",
      "Iteration: 169 | Loss: 0.015425147488713264 | Train,Test accuracy: 0.9959718585014343.3f%, 0.8711432218551636.3f%\n",
      "0 tensor(0.0057, device='cuda:0')\n",
      "100 tensor(0.0273, device='cuda:0')\n",
      "200 tensor(0.0021, device='cuda:0')\n",
      "300 tensor(0.0097, device='cuda:0')\n",
      "Iteration: 170 | Loss: 0.014576112851500511 | Train,Test accuracy: 0.9954004287719727.3f%, 0.8695608973503113.3f%\n",
      "0 tensor(0.0515, device='cuda:0')\n",
      "100 tensor(0.0069, device='cuda:0')\n",
      "200 tensor(0.0195, device='cuda:0')\n",
      "300 tensor(0.0019, device='cuda:0')\n",
      "Iteration: 171 | Loss: 0.015138426795601845 | Train,Test accuracy: 0.9962835907936096.3f%, 0.873219907283783.3f%\n",
      "0 tensor(0.0049, device='cuda:0')\n",
      "100 tensor(0.0068, device='cuda:0')\n",
      "200 tensor(0.0163, device='cuda:0')\n",
      "300 tensor(0.0058, device='cuda:0')\n",
      "Iteration: 172 | Loss: 0.015220520086586475 | Train,Test accuracy: 0.9959239363670349.3f%, 0.8698576092720032.3f%\n",
      "0 tensor(0.0275, device='cuda:0')\n",
      "100 tensor(0.0138, device='cuda:0')\n",
      "200 tensor(0.0128, device='cuda:0')\n",
      "300 tensor(0.0259, device='cuda:0')\n",
      "Iteration: 173 | Loss: 0.01486316416412592 | Train,Test accuracy: 0.9952046275138855.3f%, 0.8711432218551636.3f%\n",
      "0 tensor(0.0064, device='cuda:0')\n",
      "100 tensor(0.0042, device='cuda:0')\n",
      "200 tensor(0.0084, device='cuda:0')\n",
      "300 tensor(0.0058, device='cuda:0')\n",
      "Iteration: 174 | Loss: 0.014271658845245838 | Train,Test accuracy: 0.9957121014595032.3f%, 0.8720332384109497.3f%\n",
      "0 tensor(0.0165, device='cuda:0')\n",
      "100 tensor(0.0295, device='cuda:0')\n",
      "200 tensor(0.0212, device='cuda:0')\n",
      "300 tensor(0.0179, device='cuda:0')\n",
      "Iteration: 175 | Loss: 0.014669666066765785 | Train,Test accuracy: 0.9953724145889282.3f%, 0.873813271522522.3f%\n",
      "0 tensor(0.0039, device='cuda:0')\n",
      "100 tensor(0.0229, device='cuda:0')\n",
      "200 tensor(0.0264, device='cuda:0')\n",
      "300 tensor(0.0071, device='cuda:0')\n",
      "Iteration: 176 | Loss: 0.014223548583686352 | Train,Test accuracy: 0.9958639740943909.3f%, 0.8768789768218994.3f%\n",
      "0 tensor(0.0089, device='cuda:0')\n",
      "100 tensor(0.0550, device='cuda:0')\n",
      "200 tensor(0.0197, device='cuda:0')\n",
      "300 tensor(0.0060, device='cuda:0')\n",
      "Iteration: 177 | Loss: 0.015241190791130066 | Train,Test accuracy: 0.99593186378479.3f%, 0.8704509735107422.3f%\n",
      "0 tensor(0.0139, device='cuda:0')\n",
      "100 tensor(0.0041, device='cuda:0')\n",
      "200 tensor(0.0019, device='cuda:0')\n",
      "300 tensor(0.0035, device='cuda:0')\n",
      "Iteration: 178 | Loss: 0.013556019403040409 | Train,Test accuracy: 0.9958839416503906.3f%, 0.8700553774833679.3f%\n",
      "0 tensor(0.0040, device='cuda:0')\n",
      "100 tensor(0.0405, device='cuda:0')\n",
      "200 tensor(0.0284, device='cuda:0')\n",
      "300 tensor(0.0219, device='cuda:0')\n",
      "Iteration: 179 | Loss: 0.015128077007830143 | Train,Test accuracy: 0.9958839416503906.3f%, 0.8715387582778931.3f%\n",
      "0 tensor(0.0133, device='cuda:0')\n",
      "100 tensor(0.0026, device='cuda:0')\n",
      "200 tensor(0.0083, device='cuda:0')\n",
      "300 tensor(0.0049, device='cuda:0')\n",
      "Iteration: 180 | Loss: 0.01372524630278349 | Train,Test accuracy: 0.9961836934089661.3f%, 0.873813271522522.3f%\n",
      "0 tensor(0.0059, device='cuda:0')\n",
      "100 tensor(0.0027, device='cuda:0')\n",
      "200 tensor(0.0020, device='cuda:0')\n",
      "300 tensor(0.0413, device='cuda:0')\n",
      "Iteration: 181 | Loss: 0.015315906144678593 | Train,Test accuracy: 0.9954203963279724.3f%, 0.8662974834442139.3f%\n",
      "0 tensor(0.0070, device='cuda:0')\n",
      "100 tensor(0.0135, device='cuda:0')\n",
      "200 tensor(0.0109, device='cuda:0')\n",
      "300 tensor(0.0314, device='cuda:0')\n",
      "Iteration: 182 | Loss: 0.014143798500299454 | Train,Test accuracy: 0.9958999752998352.3f%, 0.8702531456947327.3f%\n",
      "0 tensor(0.0193, device='cuda:0')\n",
      "100 tensor(0.0188, device='cuda:0')\n",
      "200 tensor(0.0130, device='cuda:0')\n",
      "300 tensor(0.0136, device='cuda:0')\n",
      "Iteration: 183 | Loss: 0.015756068751215935 | Train,Test accuracy: 0.996063768863678.3f%, 0.8724287748336792.3f%\n",
      "0 tensor(0.0167, device='cuda:0')\n",
      "100 tensor(0.0168, device='cuda:0')\n",
      "200 tensor(0.0154, device='cuda:0')\n",
      "300 tensor(0.0050, device='cuda:0')\n",
      "Iteration: 184 | Loss: 0.014767035841941833 | Train,Test accuracy: 0.9951046705245972.3f%, 0.8669897317886353.3f%\n",
      "0 tensor(0.0156, device='cuda:0')\n",
      "100 tensor(0.0085, device='cuda:0')\n",
      "200 tensor(0.0087, device='cuda:0')\n",
      "300 tensor(0.0040, device='cuda:0')\n",
      "Iteration: 185 | Loss: 0.01236747857183218 | Train,Test accuracy: 0.995184600353241.3f%, 0.8676819801330566.3f%\n",
      "0 tensor(0.0032, device='cuda:0')\n",
      "100 tensor(0.0053, device='cuda:0')\n",
      "200 tensor(0.0042, device='cuda:0')\n",
      "300 tensor(0.0284, device='cuda:0')\n",
      "Iteration: 186 | Loss: 0.013975048437714577 | Train,Test accuracy: 0.9957441091537476.3f%, 0.8679786324501038.3f%\n",
      "0 tensor(0.0050, device='cuda:0')\n",
      "100 tensor(0.0091, device='cuda:0')\n",
      "200 tensor(0.0058, device='cuda:0')\n",
      "300 tensor(0.0061, device='cuda:0')\n",
      "Iteration: 187 | Loss: 0.01497459877282381 | Train,Test accuracy: 0.99593186378479.3f%, 0.871242105960846.3f%\n",
      "0 tensor(0.0172, device='cuda:0')\n",
      "100 tensor(0.0053, device='cuda:0')\n",
      "200 tensor(0.0048, device='cuda:0')\n",
      "300 tensor(0.0348, device='cuda:0')\n",
      "Iteration: 188 | Loss: 0.015119063667953014 | Train,Test accuracy: 0.9968590140342712.3f%, 0.8664952516555786.3f%\n",
      "0 tensor(0.0035, device='cuda:0')\n",
      "100 tensor(0.0160, device='cuda:0')\n",
      "200 tensor(0.0182, device='cuda:0')\n",
      "300 tensor(0.0025, device='cuda:0')\n",
      "Iteration: 189 | Loss: 0.015391780063509941 | Train,Test accuracy: 0.9955043196678162.3f%, 0.868967592716217.3f%\n",
      "0 tensor(0.0050, device='cuda:0')\n",
      "100 tensor(0.0229, device='cuda:0')\n",
      "200 tensor(0.0765, device='cuda:0')\n",
      "300 tensor(0.0067, device='cuda:0')\n",
      "Iteration: 190 | Loss: 0.012863758020102978 | Train,Test accuracy: 0.9965832829475403.3f%, 0.8669897317886353.3f%\n",
      "0 tensor(0.0141, device='cuda:0')\n",
      "100 tensor(0.0095, device='cuda:0')\n",
      "200 tensor(0.0298, device='cuda:0')\n",
      "300 tensor(0.0059, device='cuda:0')\n",
      "Iteration: 191 | Loss: 0.013255833648145199 | Train,Test accuracy: 0.9958719611167908.3f%, 0.8687697649002075.3f%\n",
      "0 tensor(0.0373, device='cuda:0')\n",
      "100 tensor(0.0040, device='cuda:0')\n",
      "200 tensor(0.0064, device='cuda:0')\n",
      "300 tensor(0.0049, device='cuda:0')\n",
      "Iteration: 192 | Loss: 0.014051003381609917 | Train,Test accuracy: 0.9958319664001465.3f%, 0.8676819801330566.3f%\n",
      "0 tensor(0.0026, device='cuda:0')\n",
      "100 tensor(0.0164, device='cuda:0')\n",
      "200 tensor(0.0078, device='cuda:0')\n",
      "300 tensor(0.0106, device='cuda:0')\n",
      "Iteration: 193 | Loss: 0.014454562216997147 | Train,Test accuracy: 0.9960238337516785.3f%, 0.8671875.3f%\n",
      "0 tensor(0.0106, device='cuda:0')\n",
      "100 tensor(0.0185, device='cuda:0')\n",
      "200 tensor(0.0246, device='cuda:0')\n",
      "300 tensor(0.0196, device='cuda:0')\n",
      "Iteration: 194 | Loss: 0.013991517014801502 | Train,Test accuracy: 0.9962435960769653.3f%, 0.8661985993385315.3f%\n",
      "0 tensor(0.0235, device='cuda:0')\n",
      "100 tensor(0.0040, device='cuda:0')\n",
      "200 tensor(0.0111, device='cuda:0')\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "300 tensor(0.0060, device='cuda:0')\n",
      "Iteration: 195 | Loss: 0.012667253613471985 | Train,Test accuracy: 0.9968230724334717.3f%, 0.8671875.3f%\n",
      "0 tensor(0.0027, device='cuda:0')\n",
      "100 tensor(0.0175, device='cuda:0')\n",
      "200 tensor(0.0015, device='cuda:0')\n",
      "300 tensor(0.0026, device='cuda:0')\n",
      "Iteration: 196 | Loss: 0.013943570666015148 | Train,Test accuracy: 0.9961037635803223.3f%, 0.8682753443717957.3f%\n",
      "0 tensor(0.0094, device='cuda:0')\n",
      "100 tensor(0.0016, device='cuda:0')\n",
      "200 tensor(0.0077, device='cuda:0')\n",
      "300 tensor(0.0162, device='cuda:0')\n",
      "Iteration: 197 | Loss: 0.013696941547095776 | Train,Test accuracy: 0.9950248003005981.3f%, 0.870352029800415.3f%\n",
      "0 tensor(0.0125, device='cuda:0')\n",
      "100 tensor(0.0256, device='cuda:0')\n",
      "200 tensor(0.0121, device='cuda:0')\n",
      "300 tensor(0.0070, device='cuda:0')\n",
      "Iteration: 198 | Loss: 0.013309923000633717 | Train,Test accuracy: 0.9964433908462524.3f%, 0.8722310066223145.3f%\n",
      "0 tensor(0.0096, device='cuda:0')\n",
      "100 tensor(0.0048, device='cuda:0')\n",
      "200 tensor(0.0292, device='cuda:0')\n",
      "300 tensor(0.0243, device='cuda:0')\n",
      "Iteration: 199 | Loss: 0.012944845482707024 | Train,Test accuracy: 0.9956042170524597.3f%, 0.8692642450332642.3f%\n",
      "0 tensor(0.0310, device='cuda:0')\n",
      "100 tensor(0.0255, device='cuda:0')\n",
      "200 tensor(0.0114, device='cuda:0')\n",
      "300 tensor(0.0045, device='cuda:0')\n",
      "Iteration: 200 | Loss: 0.014494632370769978 | Train,Test accuracy: 0.9960438013076782.3f%, 0.871242105960846.3f%\n"
     ]
    }
   ],
   "source": [
    "criterion = nn.CrossEntropyLoss()\n",
    "# optimizer = optim.Adam(net.parameters(), lr=0.001, weight_decay=0.0001)\n",
    "\n",
    "optimizer = optim.Adam(net.parameters(), lr=0.001, weight_decay=3e-4)\n",
    "\n",
    "# optimizer = optim.SGD(net.parameters(), lr=0.05, momentum=0.9, weight_decay=0.0002, nesterov=True)\n",
    "\n",
    "train_accuracy_Relu = []\n",
    "train_loss_Relu = []\n",
    "test_accuracy_Relu  = []\n",
    "test_loss_Relu  = []\n",
    "\n",
    "\n",
    "for epoch in range(200):\n",
    "    \n",
    "    if epoch <= 80:\n",
    "        cur_lr = 0.001\n",
    "    elif epoch <= 140:\n",
    "        cur_lr = 0.0005\n",
    "    else:    \n",
    "        cur_lr = 0.0001\n",
    "\n",
    "#     if epoch <= 60:\n",
    "#         cur_lr = 0.05\n",
    "#     elif epoch <= 120:\n",
    "#         cur_lr = 0.01\n",
    "#     elif epoch <= 160:    \n",
    "#         cur_lr = 0.002\n",
    "#     else:\n",
    "#         cur_lr = 0.0004\n",
    "#     optimizer = optim.SGD(net.parameters(), lr=cur_lr, momentum=0.9, weight_decay=0.0001)\n",
    "    \n",
    "    for g in optimizer.param_groups:\n",
    "        g['lr'] = cur_lr\n",
    "#     optimizer = optim.Adam(net.parameters(), lr=cur_lr, weight_decay=0.0001)\n",
    "    \n",
    "    running_loss = 0.0\n",
    "    for i, data in enumerate(trainloader, 0):\n",
    "        # get the inputs\n",
    "        inputs, labels = data\n",
    "\n",
    "        if args.gpu:\n",
    "            inputs = inputs.cuda()\n",
    "            labels = labels.cuda()\n",
    "\n",
    "        # wrap them in Variable\n",
    "        inputs, labels = Variable(inputs), Variable(labels)\n",
    "\n",
    "        # zero the parameter gradients\n",
    "        optimizer.zero_grad()\n",
    "\n",
    "        # forward + backward + optimize\n",
    "        outputs = net(inputs)\n",
    "        loss = criterion(outputs, labels)\n",
    "        loss.backward()\n",
    "\n",
    "#         if epoch > 16:\n",
    "#             for group in optimizer.param_groups:\n",
    "#                 for p in group['params']:\n",
    "#                     state = optimizer.state[p]\n",
    "#                     if state['step'] >= 1024:\n",
    "#                         state['step'] = 1000\n",
    "        optimizer.step()\n",
    "\n",
    "\n",
    "        # print statistics\n",
    "        if i % 100 == 0:\n",
    "            print(i,loss.data)\n",
    "        running_loss += loss.data\n",
    "\n",
    "    # Normalizing the loss by the total number of train batches\n",
    "    running_loss /= len(trainloader)\n",
    "\n",
    "    # Calculate training/test set accuracy of the existing model\n",
    "    test_loss, test_accuracy = validation(net, testloader, criterion)\n",
    "    train_loss, train_accuracy = validation(net, trainloader, criterion)\n",
    "\n",
    "    print(\"Iteration: {0} | Loss: {1} |\".format(epoch+1, running_loss),\n",
    "          \"Train,Test accuracy: {0}.3f%, {1}.3f%\".format(train_accuracy/len(trainloader), test_accuracy/len(testloader)) )\n",
    "    \n",
    "    train_accuracy_Relu.append(train_accuracy/len(trainloader))\n",
    "    train_loss_Relu.append(train_loss)\n",
    "    \n",
    "    test_accuracy_Relu.append(test_accuracy/len(testloader))\n",
    "    test_loss_Relu.append(test_loss)\n",
    "    \n",
    "    # Specify a path\n",
    "    PATH = \"./save_models/CIFAR10_VGG11_relu_E200_iter\"+str(epoch)+\".pt\"\n",
    "    torch.save(net.state_dict(), PATH)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "qVGG_xsquare2(\n",
       "  (features): Sequential(\n",
       "    (0): QuantConv2d(\n",
       "      3, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (2): QuantXsquare2(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare2)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (3): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (4): QuantConv2d(\n",
       "      64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (5): BatchNorm2d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (6): QuantXsquare2(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare2)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (7): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (8): QuantConv2d(\n",
       "      128, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (9): BatchNorm2d(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (10): QuantXsquare2(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare2)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (11): QuantConv2d(\n",
       "      256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (12): BatchNorm2d(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (13): QuantXsquare2(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare2)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (14): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (15): QuantConv2d(\n",
       "      256, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (16): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (17): QuantXsquare2(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare2)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (18): QuantConv2d(\n",
       "      512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (19): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (20): QuantXsquare2(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare2)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (21): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (22): QuantConv2d(\n",
       "      512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (23): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (24): QuantXsquare2(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare2)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (25): QuantConv2d(\n",
       "      512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (26): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (27): QuantXsquare2(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare2)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (28): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (29): AvgPool2d(kernel_size=1, stride=1, padding=0)\n",
       "  )\n",
       "  (classifier): Linear(in_features=512, out_features=10, bias=True)\n",
       ")"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from torch.nn import Module\n",
    "import torch.nn.functional as F\n",
    "import brevitas.nn as qnn\n",
    "from brevitas.core.quant import QuantType\n",
    "\n",
    "bit_width_sel = 8\n",
    "\n",
    "class qVGG_xsquare2(nn.Module):\n",
    "    def __init__(self, vgg_name):\n",
    "        super(qVGG_xsquare2, self).__init__()\n",
    "        self.features = self._make_layers(cfg[vgg_name])\n",
    "        self.classifier = nn.Linear(512, 10)\n",
    "\n",
    "    def forward(self, x):\n",
    "        out = self.features(x)\n",
    "        out = out.view(out.size(0), -1)\n",
    "        out = self.classifier(out)\n",
    "        return out\n",
    "\n",
    "    def _make_layers(self, cfg):\n",
    "        layers = []\n",
    "        in_channels = 3\n",
    "        for x in cfg:\n",
    "            if x == 'M':\n",
    "                #layers += [nn.MaxPool2d(kernel_size=2, stride=2)]\n",
    "                layers += [nn.AvgPool2d(kernel_size=2, stride=2)]\n",
    "            else:\n",
    "                layers += [qnn.QuantConv2d(in_channels, out_channels=x, kernel_size=3, padding=1, weight_quant_type=QuantType.INT, \n",
    "                                     weight_bit_width=bit_width_sel),\n",
    "                           nn.BatchNorm2d(x),\n",
    "                           qnn.QuantXsquare2(quant_type=QuantType.INT, bit_width=8, max_val=6)]\n",
    "                in_channels = x\n",
    "        layers += [nn.AvgPool2d(kernel_size=1, stride=1)]\n",
    "        return nn.Sequential(*layers)\n",
    "    \n",
    "    \n",
    "                    \n",
    "net = qVGG_xsquare2('VGG11')\n",
    "net.cuda()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 tensor(2.4069, device='cuda:0')\n",
      "100 tensor(2.1011, device='cuda:0')\n",
      "200 tensor(1.9429, device='cuda:0')\n",
      "300 tensor(1.6888, device='cuda:0')\n",
      "Iteration: 1 | Loss: 1.8848611116409302 | Train,Test accuracy: 0.45572251081466675.3f%, 0.42850080132484436.3f%\n",
      "0 tensor(1.3843, device='cuda:0')\n",
      "100 tensor(1.4497, device='cuda:0')\n",
      "200 tensor(1.4741, device='cuda:0')\n",
      "300 tensor(1.1314, device='cuda:0')\n",
      "Iteration: 2 | Loss: 1.286672592163086 | Train,Test accuracy: 0.6202325820922852.3f%, 0.5982990264892578.3f%\n",
      "0 tensor(1.0478, device='cuda:0')\n",
      "100 tensor(1.1821, device='cuda:0')\n",
      "200 tensor(0.9913, device='cuda:0')\n",
      "300 tensor(0.9234, device='cuda:0')\n",
      "Iteration: 3 | Loss: 0.9837508797645569 | Train,Test accuracy: 0.6982736587524414.3f%, 0.6641613841056824.3f%\n",
      "0 tensor(0.7789, device='cuda:0')\n",
      "100 tensor(0.8581, device='cuda:0')\n",
      "200 tensor(0.9102, device='cuda:0')\n",
      "300 tensor(0.7074, device='cuda:0')\n",
      "Iteration: 4 | Loss: 0.8097448348999023 | Train,Test accuracy: 0.7561261653900146.3f%, 0.7234968543052673.3f%\n",
      "0 tensor(0.8926, device='cuda:0')\n",
      "100 tensor(0.7229, device='cuda:0')\n",
      "200 tensor(0.6168, device='cuda:0')\n",
      "300 tensor(0.5998, device='cuda:0')\n",
      "Iteration: 5 | Loss: 0.6872779130935669 | Train,Test accuracy: 0.8036245107650757.3f%, 0.7670094966888428.3f%\n",
      "0 tensor(0.5555, device='cuda:0')\n",
      "100 tensor(0.5562, device='cuda:0')\n",
      "200 tensor(0.5542, device='cuda:0')\n",
      "300 tensor(0.6037, device='cuda:0')\n",
      "Iteration: 6 | Loss: 0.6053870916366577 | Train,Test accuracy: 0.8250040411949158.3f%, 0.7786787748336792.3f%\n",
      "0 tensor(0.4283, device='cuda:0')\n",
      "100 tensor(0.4928, device='cuda:0')\n",
      "200 tensor(0.4913, device='cuda:0')\n",
      "300 tensor(0.5053, device='cuda:0')\n",
      "Iteration: 7 | Loss: 0.545445442199707 | Train,Test accuracy: 0.8330522775650024.3f%, 0.7809533476829529.3f%\n",
      "0 tensor(0.4156, device='cuda:0')\n",
      "100 tensor(0.3450, device='cuda:0')\n",
      "200 tensor(0.6364, device='cuda:0')\n",
      "300 tensor(0.3975, device='cuda:0')\n",
      "Iteration: 8 | Loss: 0.5021517872810364 | Train,Test accuracy: 0.8464953303337097.3f%, 0.7871835231781006.3f%\n",
      "0 tensor(0.3738, device='cuda:0')\n",
      "100 tensor(0.3963, device='cuda:0')\n",
      "200 tensor(0.6270, device='cuda:0')\n",
      "300 tensor(0.3724, device='cuda:0')\n",
      "Iteration: 9 | Loss: 0.45945942401885986 | Train,Test accuracy: 0.872762143611908.3f%, 0.8159612417221069.3f%\n",
      "0 tensor(0.4240, device='cuda:0')\n",
      "100 tensor(0.4388, device='cuda:0')\n",
      "200 tensor(0.3801, device='cuda:0')\n",
      "300 tensor(0.3538, device='cuda:0')\n",
      "Iteration: 10 | Loss: 0.426238477230072 | Train,Test accuracy: 0.8701966404914856.3f%, 0.8057753443717957.3f%\n",
      "0 tensor(0.4302, device='cuda:0')\n",
      "100 tensor(0.4442, device='cuda:0')\n",
      "200 tensor(0.3182, device='cuda:0')\n",
      "300 tensor(0.4431, device='cuda:0')\n",
      "Iteration: 11 | Loss: 0.39845791459083557 | Train,Test accuracy: 0.8740088939666748.3f%, 0.8111155033111572.3f%\n",
      "0 tensor(0.4297, device='cuda:0')\n",
      "100 tensor(0.3387, device='cuda:0')\n",
      "200 tensor(0.4764, device='cuda:0')\n",
      "300 tensor(0.2540, device='cuda:0')\n",
      "Iteration: 12 | Loss: 0.37755918502807617 | Train,Test accuracy: 0.8888146877288818.3f%, 0.8282238841056824.3f%\n",
      "0 tensor(0.4704, device='cuda:0')\n",
      "100 tensor(0.4266, device='cuda:0')\n",
      "200 tensor(0.2488, device='cuda:0')\n",
      "300 tensor(0.3493, device='cuda:0')\n",
      "Iteration: 13 | Loss: 0.35317742824554443 | Train,Test accuracy: 0.8985893726348877.3f%, 0.8294106125831604.3f%\n",
      "0 tensor(0.3015, device='cuda:0')\n",
      "100 tensor(0.2315, device='cuda:0')\n",
      "200 tensor(0.3526, device='cuda:0')\n",
      "300 tensor(0.2909, device='cuda:0')\n",
      "Iteration: 14 | Loss: 0.33729088306427 | Train,Test accuracy: 0.904887318611145.3f%, 0.8315862417221069.3f%\n",
      "0 tensor(0.3926, device='cuda:0')\n",
      "100 tensor(0.3972, device='cuda:0')\n",
      "200 tensor(0.3921, device='cuda:0')\n",
      "300 tensor(0.2412, device='cuda:0')\n",
      "Iteration: 15 | Loss: 0.31817612051963806 | Train,Test accuracy: 0.8978540897369385.3f%, 0.8292128443717957.3f%\n",
      "0 tensor(0.3598, device='cuda:0')\n",
      "100 tensor(0.2567, device='cuda:0')\n",
      "200 tensor(0.2917, device='cuda:0')\n",
      "300 tensor(0.2746, device='cuda:0')\n",
      "Iteration: 16 | Loss: 0.3050515353679657 | Train,Test accuracy: 0.9135389924049377.3f%, 0.8367286324501038.3f%\n",
      "0 tensor(0.2608, device='cuda:0')\n",
      "100 tensor(0.3271, device='cuda:0')\n",
      "200 tensor(0.1792, device='cuda:0')\n",
      "300 tensor(0.3996, device='cuda:0')\n",
      "Iteration: 17 | Loss: 0.2911114990711212 | Train,Test accuracy: 0.9099065065383911.3f%, 0.8203125.3f%\n",
      "0 tensor(0.1347, device='cuda:0')\n",
      "100 tensor(0.2630, device='cuda:0')\n",
      "200 tensor(0.2774, device='cuda:0')\n",
      "300 tensor(0.1638, device='cuda:0')\n",
      "Iteration: 18 | Loss: 0.2443903684616089 | Train,Test accuracy: 0.9307544231414795.3f%, 0.8416732549667358.3f%\n",
      "0 tensor(0.2177, device='cuda:0')\n",
      "100 tensor(0.1547, device='cuda:0')\n",
      "200 tensor(0.2278, device='cuda:0')\n",
      "300 tensor(0.3373, device='cuda:0')\n",
      "Iteration: 19 | Loss: 0.23657144606113434 | Train,Test accuracy: 0.9321611523628235.3f%, 0.8373219966888428.3f%\n",
      "0 tensor(0.3075, device='cuda:0')\n",
      "100 tensor(0.2689, device='cuda:0')\n",
      "200 tensor(0.1442, device='cuda:0')\n",
      "300 tensor(0.2359, device='cuda:0')\n",
      "Iteration: 20 | Loss: 0.22819779813289642 | Train,Test accuracy: 0.9318094253540039.3f%, 0.8364319801330566.3f%\n",
      "0 tensor(0.1515, device='cuda:0')\n",
      "100 tensor(0.2334, device='cuda:0')\n",
      "200 tensor(0.2322, device='cuda:0')\n",
      "300 tensor(0.2698, device='cuda:0')\n",
      "Iteration: 21 | Loss: 0.2195974439382553 | Train,Test accuracy: 0.9374920129776001.3f%, 0.8451344966888428.3f%\n",
      "0 tensor(0.2090, device='cuda:0')\n",
      "100 tensor(0.2746, device='cuda:0')\n",
      "200 tensor(0.1576, device='cuda:0')\n",
      "300 tensor(0.2561, device='cuda:0')\n",
      "Iteration: 22 | Loss: 0.2093697488307953 | Train,Test accuracy: 0.9392662644386292.3f%, 0.8383108973503113.3f%\n",
      "0 tensor(0.2440, device='cuda:0')\n",
      "100 tensor(0.1675, device='cuda:0')\n",
      "200 tensor(0.1466, device='cuda:0')\n",
      "300 tensor(0.2142, device='cuda:0')\n",
      "Iteration: 23 | Loss: 0.2009860724210739 | Train,Test accuracy: 0.9377477169036865.3f%, 0.8346518874168396.3f%\n",
      "0 tensor(0.1834, device='cuda:0')\n",
      "100 tensor(0.1274, device='cuda:0')\n",
      "200 tensor(0.1597, device='cuda:0')\n",
      "300 tensor(0.1559, device='cuda:0')\n",
      "Iteration: 24 | Loss: 0.19684571027755737 | Train,Test accuracy: 0.9415640830993652.3f%, 0.8452333807945251.3f%\n",
      "0 tensor(0.1237, device='cuda:0')\n",
      "100 tensor(0.1258, device='cuda:0')\n",
      "200 tensor(0.1925, device='cuda:0')\n",
      "300 tensor(0.2674, device='cuda:0')\n",
      "Iteration: 25 | Loss: 0.19071780145168304 | Train,Test accuracy: 0.9396899342536926.3f%, 0.8433544039726257.3f%\n",
      "0 tensor(0.1135, device='cuda:0')\n",
      "100 tensor(0.2500, device='cuda:0')\n",
      "200 tensor(0.2422, device='cuda:0')\n",
      "300 tensor(0.2308, device='cuda:0')\n",
      "Iteration: 26 | Loss: 0.19014757871627808 | Train,Test accuracy: 0.9471746683120728.3f%, 0.8414754867553711.3f%\n",
      "0 tensor(0.1576, device='cuda:0')\n",
      "100 tensor(0.1197, device='cuda:0')\n",
      "200 tensor(0.2375, device='cuda:0')\n",
      "300 tensor(0.1642, device='cuda:0')\n",
      "Iteration: 27 | Loss: 0.17677703499794006 | Train,Test accuracy: 0.9474704265594482.3f%, 0.8343552350997925.3f%\n",
      "0 tensor(0.2064, device='cuda:0')\n",
      "100 tensor(0.1138, device='cuda:0')\n",
      "200 tensor(0.1775, device='cuda:0')\n",
      "300 tensor(0.1110, device='cuda:0')\n",
      "Iteration: 28 | Loss: 0.17754721641540527 | Train,Test accuracy: 0.9505195617675781.3f%, 0.8421677350997925.3f%\n",
      "0 tensor(0.1910, device='cuda:0')\n",
      "100 tensor(0.3196, device='cuda:0')\n",
      "200 tensor(0.3200, device='cuda:0')\n",
      "300 tensor(0.1857, device='cuda:0')\n",
      "Iteration: 29 | Loss: 0.16647911071777344 | Train,Test accuracy: 0.9481737613677979.3f%, 0.8515625.3f%\n",
      "0 tensor(0.0687, device='cuda:0')\n",
      "100 tensor(0.1351, device='cuda:0')\n",
      "200 tensor(0.0774, device='cuda:0')\n",
      "300 tensor(0.1794, device='cuda:0')\n",
      "Iteration: 30 | Loss: 0.17166511714458466 | Train,Test accuracy: 0.9512547850608826.3f%, 0.8482990264892578.3f%\n",
      "0 tensor(0.1207, device='cuda:0')\n",
      "100 tensor(0.1159, device='cuda:0')\n",
      "200 tensor(0.1473, device='cuda:0')\n",
      "300 tensor(0.1817, device='cuda:0')\n",
      "Iteration: 31 | Loss: 0.16413168609142303 | Train,Test accuracy: 0.9531409740447998.3f%, 0.844343364238739.3f%\n",
      "0 tensor(0.1623, device='cuda:0')\n",
      "100 tensor(0.1726, device='cuda:0')\n",
      "200 tensor(0.2546, device='cuda:0')\n",
      "300 tensor(0.1969, device='cuda:0')\n",
      "Iteration: 32 | Loss: 0.16477252542972565 | Train,Test accuracy: 0.9487132430076599.3f%, 0.847507894039154.3f%\n",
      "0 tensor(0.1134, device='cuda:0')\n",
      "100 tensor(0.1237, device='cuda:0')\n",
      "200 tensor(0.2707, device='cuda:0')\n",
      "300 tensor(0.0977, device='cuda:0')\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 33 | Loss: 0.16055287420749664 | Train,Test accuracy: 0.9517542719841003.3f%, 0.8473101258277893.3f%\n",
      "0 tensor(0.2019, device='cuda:0')\n",
      "100 tensor(0.1058, device='cuda:0')\n",
      "200 tensor(0.1747, device='cuda:0')\n",
      "300 tensor(0.1181, device='cuda:0')\n",
      "Iteration: 34 | Loss: 0.15610459446907043 | Train,Test accuracy: 0.9515065550804138.3f%, 0.8468156456947327.3f%\n",
      "0 tensor(0.1056, device='cuda:0')\n",
      "100 tensor(0.1104, device='cuda:0')\n",
      "200 tensor(0.2101, device='cuda:0')\n",
      "300 tensor(0.1156, device='cuda:0')\n",
      "Iteration: 35 | Loss: 0.15624983608722687 | Train,Test accuracy: 0.953940212726593.3f%, 0.8418710231781006.3f%\n",
      "0 tensor(0.0903, device='cuda:0')\n",
      "100 tensor(0.0776, device='cuda:0')\n",
      "200 tensor(0.1325, device='cuda:0')\n",
      "300 tensor(0.1895, device='cuda:0')\n",
      "Iteration: 36 | Loss: 0.15538841485977173 | Train,Test accuracy: 0.9540161490440369.3f%, 0.8349485993385315.3f%\n",
      "0 tensor(0.2148, device='cuda:0')\n",
      "100 tensor(0.1614, device='cuda:0')\n",
      "200 tensor(0.2330, device='cuda:0')\n",
      "300 tensor(0.1213, device='cuda:0')\n",
      "Iteration: 37 | Loss: 0.1470533311367035 | Train,Test accuracy: 0.9530410766601562.3f%, 0.8381131291389465.3f%\n",
      "0 tensor(0.1604, device='cuda:0')\n",
      "100 tensor(0.0717, device='cuda:0')\n",
      "200 tensor(0.1516, device='cuda:0')\n",
      "300 tensor(0.2230, device='cuda:0')\n",
      "Iteration: 38 | Loss: 0.15074382722377777 | Train,Test accuracy: 0.9527653455734253.3f%, 0.8472112417221069.3f%\n",
      "0 tensor(0.0870, device='cuda:0')\n",
      "100 tensor(0.1498, device='cuda:0')\n",
      "200 tensor(0.1970, device='cuda:0')\n",
      "300 tensor(0.2335, device='cuda:0')\n",
      "Iteration: 39 | Loss: 0.1474580615758896 | Train,Test accuracy: 0.9565417170524597.3f%, 0.8385087251663208.3f%\n",
      "0 tensor(0.0749, device='cuda:0')\n",
      "100 tensor(0.1393, device='cuda:0')\n",
      "200 tensor(0.1964, device='cuda:0')\n",
      "300 tensor(0.1294, device='cuda:0')\n",
      "Iteration: 40 | Loss: 0.1460440456867218 | Train,Test accuracy: 0.9536924362182617.3f%, 0.8433544039726257.3f%\n",
      "0 tensor(0.1880, device='cuda:0')\n",
      "100 tensor(0.0721, device='cuda:0')\n",
      "200 tensor(0.1091, device='cuda:0')\n",
      "300 tensor(0.1222, device='cuda:0')\n",
      "Iteration: 41 | Loss: 0.14393097162246704 | Train,Test accuracy: 0.9593790173530579.3f%, 0.8505735993385315.3f%\n",
      "0 tensor(0.0857, device='cuda:0')\n",
      "100 tensor(0.1888, device='cuda:0')\n",
      "200 tensor(0.1097, device='cuda:0')\n",
      "300 tensor(0.1951, device='cuda:0')\n",
      "Iteration: 42 | Loss: 0.14510740339756012 | Train,Test accuracy: 0.958907425403595.3f%, 0.8528481125831604.3f%\n",
      "0 tensor(0.1146, device='cuda:0')\n",
      "100 tensor(0.1237, device='cuda:0')\n",
      "200 tensor(0.1432, device='cuda:0')\n",
      "300 tensor(0.1238, device='cuda:0')\n",
      "Iteration: 43 | Loss: 0.14185000956058502 | Train,Test accuracy: 0.9598905444145203.3f%, 0.8444422483444214.3f%\n",
      "0 tensor(0.1591, device='cuda:0')\n",
      "100 tensor(0.1073, device='cuda:0')\n",
      "200 tensor(0.1919, device='cuda:0')\n",
      "300 tensor(0.1023, device='cuda:0')\n",
      "Iteration: 44 | Loss: 0.14084693789482117 | Train,Test accuracy: 0.9555866122245789.3f%, 0.8432555198669434.3f%\n",
      "0 tensor(0.1609, device='cuda:0')\n",
      "100 tensor(0.1114, device='cuda:0')\n",
      "200 tensor(0.1206, device='cuda:0')\n",
      "300 tensor(0.1213, device='cuda:0')\n",
      "Iteration: 45 | Loss: 0.13842535018920898 | Train,Test accuracy: 0.9601662158966064.3f%, 0.853342592716217.3f%\n",
      "0 tensor(0.1592, device='cuda:0')\n",
      "100 tensor(0.1372, device='cuda:0')\n",
      "200 tensor(0.1676, device='cuda:0')\n",
      "300 tensor(0.0800, device='cuda:0')\n",
      "Iteration: 46 | Loss: 0.13469737768173218 | Train,Test accuracy: 0.9573529958724976.3f%, 0.8461233973503113.3f%\n",
      "0 tensor(0.0690, device='cuda:0')\n",
      "100 tensor(0.0486, device='cuda:0')\n",
      "200 tensor(0.2179, device='cuda:0')\n",
      "300 tensor(0.1720, device='cuda:0')\n",
      "Iteration: 47 | Loss: 0.13842342793941498 | Train,Test accuracy: 0.9603500962257385.3f%, 0.8525514006614685.3f%\n",
      "0 tensor(0.0684, device='cuda:0')\n",
      "100 tensor(0.0899, device='cuda:0')\n",
      "200 tensor(0.2152, device='cuda:0')\n",
      "300 tensor(0.1612, device='cuda:0')\n",
      "Iteration: 48 | Loss: 0.14116446673870087 | Train,Test accuracy: 0.9545316100120544.3f%, 0.8434533476829529.3f%\n",
      "0 tensor(0.0790, device='cuda:0')\n",
      "100 tensor(0.0463, device='cuda:0')\n",
      "200 tensor(0.1621, device='cuda:0')\n",
      "300 tensor(0.1201, device='cuda:0')\n",
      "Iteration: 49 | Loss: 0.13548992574214935 | Train,Test accuracy: 0.9616008400917053.3f%, 0.8528481125831604.3f%\n",
      "0 tensor(0.2038, device='cuda:0')\n",
      "100 tensor(0.1449, device='cuda:0')\n",
      "200 tensor(0.1405, device='cuda:0')\n",
      "300 tensor(0.2509, device='cuda:0')\n",
      "Iteration: 50 | Loss: 0.13247880339622498 | Train,Test accuracy: 0.962503969669342.3f%, 0.8461233973503113.3f%\n",
      "0 tensor(0.1141, device='cuda:0')\n",
      "100 tensor(0.2516, device='cuda:0')\n",
      "200 tensor(0.1804, device='cuda:0')\n",
      "300 tensor(0.0832, device='cuda:0')\n",
      "Iteration: 51 | Loss: 0.13457755744457245 | Train,Test accuracy: 0.9643981456756592.3f%, 0.8453322649002075.3f%\n",
      "0 tensor(0.0966, device='cuda:0')\n",
      "100 tensor(0.0941, device='cuda:0')\n",
      "200 tensor(0.1445, device='cuda:0')\n",
      "300 tensor(0.1775, device='cuda:0')\n",
      "Iteration: 52 | Loss: 0.13057716190814972 | Train,Test accuracy: 0.9614929556846619.3f%, 0.840585470199585.3f%\n",
      "0 tensor(0.1189, device='cuda:0')\n",
      "100 tensor(0.1007, device='cuda:0')\n",
      "200 tensor(0.2029, device='cuda:0')\n",
      "300 tensor(0.1124, device='cuda:0')\n",
      "Iteration: 53 | Loss: 0.130208820104599 | Train,Test accuracy: 0.9649856686592102.3f%, 0.848397970199585.3f%\n",
      "0 tensor(0.0905, device='cuda:0')\n",
      "100 tensor(0.0997, device='cuda:0')\n",
      "200 tensor(0.1109, device='cuda:0')\n",
      "300 tensor(0.1385, device='cuda:0')\n",
      "Iteration: 54 | Loss: 0.13372154533863068 | Train,Test accuracy: 0.9600743651390076.3f%, 0.8446400165557861.3f%\n",
      "0 tensor(0.1258, device='cuda:0')\n",
      "100 tensor(0.1539, device='cuda:0')\n",
      "200 tensor(0.1498, device='cuda:0')\n",
      "300 tensor(0.0688, device='cuda:0')\n",
      "Iteration: 55 | Loss: 0.1302415430545807 | Train,Test accuracy: 0.9583359956741333.3f%, 0.8411787748336792.3f%\n",
      "0 tensor(0.1880, device='cuda:0')\n",
      "100 tensor(0.0961, device='cuda:0')\n",
      "200 tensor(0.1165, device='cuda:0')\n",
      "300 tensor(0.0588, device='cuda:0')\n",
      "Iteration: 56 | Loss: 0.13346171379089355 | Train,Test accuracy: 0.9589154720306396.3f%, 0.8501780033111572.3f%\n",
      "0 tensor(0.0725, device='cuda:0')\n",
      "100 tensor(0.0648, device='cuda:0')\n",
      "200 tensor(0.2450, device='cuda:0')\n",
      "300 tensor(0.0417, device='cuda:0')\n",
      "Iteration: 57 | Loss: 0.1288796365261078 | Train,Test accuracy: 0.9635310173034668.3f%, 0.8464201092720032.3f%\n",
      "0 tensor(0.0381, device='cuda:0')\n",
      "100 tensor(0.0890, device='cuda:0')\n",
      "200 tensor(0.1419, device='cuda:0')\n",
      "300 tensor(0.1255, device='cuda:0')\n",
      "Iteration: 58 | Loss: 0.12535056471824646 | Train,Test accuracy: 0.9613491296768188.3f%, 0.8438488841056824.3f%\n",
      "0 tensor(0.1119, device='cuda:0')\n",
      "100 tensor(0.0883, device='cuda:0')\n",
      "200 tensor(0.1055, device='cuda:0')\n",
      "300 tensor(0.1119, device='cuda:0')\n",
      "Iteration: 59 | Loss: 0.1258462518453598 | Train,Test accuracy: 0.9601022601127625.3f%, 0.844936728477478.3f%\n",
      "0 tensor(0.1853, device='cuda:0')\n",
      "100 tensor(0.1586, device='cuda:0')\n",
      "200 tensor(0.0861, device='cuda:0')\n",
      "300 tensor(0.1478, device='cuda:0')\n",
      "Iteration: 60 | Loss: 0.12144709378480911 | Train,Test accuracy: 0.9618526101112366.3f%, 0.8501780033111572.3f%\n",
      "0 tensor(0.1114, device='cuda:0')\n",
      "100 tensor(0.0614, device='cuda:0')\n",
      "200 tensor(0.1086, device='cuda:0')\n",
      "300 tensor(0.1560, device='cuda:0')\n",
      "Iteration: 61 | Loss: 0.1262463480234146 | Train,Test accuracy: 0.9591312408447266.3f%, 0.8415743708610535.3f%\n",
      "0 tensor(0.1198, device='cuda:0')\n",
      "100 tensor(0.0851, device='cuda:0')\n",
      "200 tensor(0.1082, device='cuda:0')\n",
      "300 tensor(0.0800, device='cuda:0')\n",
      "Iteration: 62 | Loss: 0.12700249254703522 | Train,Test accuracy: 0.9603341221809387.3f%, 0.848397970199585.3f%\n",
      "0 tensor(0.1238, device='cuda:0')\n",
      "100 tensor(0.1441, device='cuda:0')\n",
      "200 tensor(0.1516, device='cuda:0')\n",
      "300 tensor(0.1025, device='cuda:0')\n",
      "Iteration: 63 | Loss: 0.12375813722610474 | Train,Test accuracy: 0.9610334038734436.3f%, 0.8435522317886353.3f%\n",
      "0 tensor(0.1790, device='cuda:0')\n",
      "100 tensor(0.1024, device='cuda:0')\n",
      "200 tensor(0.1411, device='cuda:0')\n",
      "300 tensor(0.1384, device='cuda:0')\n",
      "Iteration: 64 | Loss: 0.12429774552583694 | Train,Test accuracy: 0.9654651880264282.3f%, 0.8446400165557861.3f%\n",
      "0 tensor(0.1407, device='cuda:0')\n",
      "100 tensor(0.2445, device='cuda:0')\n",
      "200 tensor(0.0644, device='cuda:0')\n",
      "300 tensor(0.0807, device='cuda:0')\n",
      "Iteration: 65 | Loss: 0.12703070044517517 | Train,Test accuracy: 0.9668917655944824.3f%, 0.8554192781448364.3f%\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 tensor(0.1622, device='cuda:0')\n",
      "100 tensor(0.1899, device='cuda:0')\n",
      "200 tensor(0.1317, device='cuda:0')\n",
      "300 tensor(0.1208, device='cuda:0')\n",
      "Iteration: 66 | Loss: 0.12479391694068909 | Train,Test accuracy: 0.96535325050354.3f%, 0.8543314933776855.3f%\n",
      "0 tensor(0.0862, device='cuda:0')\n",
      "100 tensor(0.0834, device='cuda:0')\n",
      "200 tensor(0.2288, device='cuda:0')\n",
      "300 tensor(0.1107, device='cuda:0')\n",
      "Iteration: 67 | Loss: 0.12204067409038544 | Train,Test accuracy: 0.9609215259552002.3f%, 0.8492879867553711.3f%\n",
      "0 tensor(0.0723, device='cuda:0')\n",
      "100 tensor(0.2395, device='cuda:0')\n",
      "200 tensor(0.1095, device='cuda:0')\n",
      "300 tensor(0.1455, device='cuda:0')\n",
      "Iteration: 68 | Loss: 0.12264156341552734 | Train,Test accuracy: 0.9657408595085144.3f%, 0.8446400165557861.3f%\n",
      "0 tensor(0.0849, device='cuda:0')\n",
      "100 tensor(0.1060, device='cuda:0')\n",
      "200 tensor(0.1574, device='cuda:0')\n",
      "300 tensor(0.1541, device='cuda:0')\n",
      "Iteration: 69 | Loss: 0.11853756010532379 | Train,Test accuracy: 0.9636149406433105.3f%, 0.8410798907279968.3f%\n",
      "0 tensor(0.0905, device='cuda:0')\n",
      "100 tensor(0.1464, device='cuda:0')\n",
      "200 tensor(0.1320, device='cuda:0')\n",
      "300 tensor(0.2325, device='cuda:0')\n",
      "Iteration: 70 | Loss: 0.12383599579334259 | Train,Test accuracy: 0.9635670185089111.3f%, 0.8490902185440063.3f%\n",
      "0 tensor(0.1191, device='cuda:0')\n",
      "100 tensor(0.1010, device='cuda:0')\n",
      "200 tensor(0.1348, device='cuda:0')\n",
      "300 tensor(0.0535, device='cuda:0')\n",
      "Iteration: 71 | Loss: 0.11630094051361084 | Train,Test accuracy: 0.9636309146881104.3f%, 0.8421677350997925.3f%\n",
      "0 tensor(0.0292, device='cuda:0')\n",
      "100 tensor(0.1602, device='cuda:0')\n",
      "200 tensor(0.1151, device='cuda:0')\n",
      "300 tensor(0.1586, device='cuda:0')\n",
      "Iteration: 72 | Loss: 0.12370520830154419 | Train,Test accuracy: 0.9662164449691772.3f%, 0.8526503443717957.3f%\n",
      "0 tensor(0.0324, device='cuda:0')\n",
      "100 tensor(0.1233, device='cuda:0')\n",
      "200 tensor(0.1731, device='cuda:0')\n",
      "300 tensor(0.1041, device='cuda:0')\n",
      "Iteration: 73 | Loss: 0.11739139258861542 | Train,Test accuracy: 0.9645700454711914.3f%, 0.8460245132446289.3f%\n",
      "0 tensor(0.0840, device='cuda:0')\n",
      "100 tensor(0.0765, device='cuda:0')\n",
      "200 tensor(0.0800, device='cuda:0')\n",
      "300 tensor(0.2422, device='cuda:0')\n",
      "Iteration: 74 | Loss: 0.11317441612482071 | Train,Test accuracy: 0.9624480605125427.3f%, 0.8490902185440063.3f%\n",
      "0 tensor(0.0710, device='cuda:0')\n",
      "100 tensor(0.1083, device='cuda:0')\n",
      "200 tensor(0.0920, device='cuda:0')\n",
      "300 tensor(0.1234, device='cuda:0')\n",
      "Iteration: 75 | Loss: 0.12348592281341553 | Train,Test accuracy: 0.9657408595085144.3f%, 0.850969135761261.3f%\n",
      "0 tensor(0.1090, device='cuda:0')\n",
      "100 tensor(0.2270, device='cuda:0')\n",
      "200 tensor(0.1558, device='cuda:0')\n",
      "300 tensor(0.1413, device='cuda:0')\n",
      "Iteration: 76 | Loss: 0.11858150362968445 | Train,Test accuracy: 0.9668917655944824.3f%, 0.8461233973503113.3f%\n",
      "0 tensor(0.0487, device='cuda:0')\n",
      "100 tensor(0.1618, device='cuda:0')\n",
      "200 tensor(0.1385, device='cuda:0')\n",
      "300 tensor(0.2904, device='cuda:0')\n",
      "Iteration: 77 | Loss: 0.12375326454639435 | Train,Test accuracy: 0.9667080044746399.3f%, 0.8470134735107422.3f%\n",
      "0 tensor(0.0830, device='cuda:0')\n",
      "100 tensor(0.1458, device='cuda:0')\n",
      "200 tensor(0.1027, device='cuda:0')\n",
      "300 tensor(0.1460, device='cuda:0')\n",
      "Iteration: 78 | Loss: 0.11595525592565536 | Train,Test accuracy: 0.9627118110656738.3f%, 0.8498813509941101.3f%\n",
      "0 tensor(0.1172, device='cuda:0')\n",
      "100 tensor(0.1964, device='cuda:0')\n",
      "200 tensor(0.0964, device='cuda:0')\n",
      "300 tensor(0.1754, device='cuda:0')\n",
      "Iteration: 79 | Loss: 0.11992514133453369 | Train,Test accuracy: 0.9650256037712097.3f%, 0.8510680198669434.3f%\n",
      "0 tensor(0.0685, device='cuda:0')\n",
      "100 tensor(0.1443, device='cuda:0')\n",
      "200 tensor(0.1056, device='cuda:0')\n",
      "300 tensor(0.2590, device='cuda:0')\n",
      "Iteration: 80 | Loss: 0.11896566301584244 | Train,Test accuracy: 0.9638986587524414.3f%, 0.8479034900665283.3f%\n",
      "0 tensor(0.0469, device='cuda:0')\n",
      "100 tensor(0.1064, device='cuda:0')\n",
      "200 tensor(0.0816, device='cuda:0')\n",
      "300 tensor(0.2120, device='cuda:0')\n",
      "Iteration: 81 | Loss: 0.1173216700553894 | Train,Test accuracy: 0.965688943862915.3f%, 0.8506724834442139.3f%\n",
      "0 tensor(0.1227, device='cuda:0')\n",
      "100 tensor(0.0988, device='cuda:0')\n",
      "200 tensor(0.0658, device='cuda:0')\n",
      "300 tensor(0.0288, device='cuda:0')\n",
      "Iteration: 82 | Loss: 0.06848204880952835 | Train,Test accuracy: 0.9827645421028137.3f%, 0.8667919039726257.3f%\n",
      "0 tensor(0.0382, device='cuda:0')\n",
      "100 tensor(0.0941, device='cuda:0')\n",
      "200 tensor(0.1134, device='cuda:0')\n",
      "300 tensor(0.0490, device='cuda:0')\n",
      "Iteration: 83 | Loss: 0.048626985400915146 | Train,Test accuracy: 0.9856937527656555.3f%, 0.860561728477478.3f%\n",
      "0 tensor(0.0095, device='cuda:0')\n",
      "100 tensor(0.0367, device='cuda:0')\n",
      "200 tensor(0.0497, device='cuda:0')\n",
      "300 tensor(0.0635, device='cuda:0')\n",
      "Iteration: 84 | Loss: 0.047739703208208084 | Train,Test accuracy: 0.9837356209754944.3f%, 0.8541337251663208.3f%\n",
      "0 tensor(0.0197, device='cuda:0')\n",
      "100 tensor(0.0521, device='cuda:0')\n",
      "200 tensor(0.0345, device='cuda:0')\n",
      "300 tensor(0.0213, device='cuda:0')\n",
      "Iteration: 85 | Loss: 0.05519765987992287 | Train,Test accuracy: 0.9834838509559631.3f%, 0.859968364238739.3f%\n",
      "0 tensor(0.0270, device='cuda:0')\n",
      "100 tensor(0.0140, device='cuda:0')\n",
      "200 tensor(0.0191, device='cuda:0')\n",
      "300 tensor(0.0354, device='cuda:0')\n",
      "Iteration: 86 | Loss: 0.05186282470822334 | Train,Test accuracy: 0.9835358262062073.3f%, 0.8584849834442139.3f%\n",
      "0 tensor(0.0495, device='cuda:0')\n",
      "100 tensor(0.0420, device='cuda:0')\n",
      "200 tensor(0.0293, device='cuda:0')\n",
      "300 tensor(0.0491, device='cuda:0')\n",
      "Iteration: 87 | Loss: 0.05219743028283119 | Train,Test accuracy: 0.9850223660469055.3f%, 0.8633307218551636.3f%\n",
      "0 tensor(0.0520, device='cuda:0')\n",
      "100 tensor(0.0442, device='cuda:0')\n",
      "200 tensor(0.0320, device='cuda:0')\n",
      "300 tensor(0.0675, device='cuda:0')\n",
      "Iteration: 88 | Loss: 0.05359550565481186 | Train,Test accuracy: 0.9850743412971497.3f%, 0.8618472814559937.3f%\n",
      "0 tensor(0.0660, device='cuda:0')\n",
      "100 tensor(0.0483, device='cuda:0')\n",
      "200 tensor(0.0786, device='cuda:0')\n",
      "300 tensor(0.0215, device='cuda:0')\n",
      "Iteration: 89 | Loss: 0.04810281842947006 | Train,Test accuracy: 0.984315037727356.3f%, 0.8588805198669434.3f%\n",
      "0 tensor(0.0866, device='cuda:0')\n",
      "100 tensor(0.0256, device='cuda:0')\n",
      "200 tensor(0.0571, device='cuda:0')\n",
      "300 tensor(0.0689, device='cuda:0')\n",
      "Iteration: 90 | Loss: 0.05052487552165985 | Train,Test accuracy: 0.9845388531684875.3f%, 0.8564082384109497.3f%\n",
      "0 tensor(0.0155, device='cuda:0')\n",
      "100 tensor(0.0582, device='cuda:0')\n",
      "200 tensor(0.0348, device='cuda:0')\n",
      "300 tensor(0.0351, device='cuda:0')\n",
      "Iteration: 91 | Loss: 0.055014919489622116 | Train,Test accuracy: 0.9863331317901611.3f%, 0.8588805198669434.3f%\n",
      "0 tensor(0.0404, device='cuda:0')\n",
      "100 tensor(0.0261, device='cuda:0')\n",
      "200 tensor(0.0981, device='cuda:0')\n",
      "300 tensor(0.0835, device='cuda:0')\n",
      "Iteration: 92 | Loss: 0.04600795730948448 | Train,Test accuracy: 0.9826127290725708.3f%, 0.8515625.3f%\n",
      "0 tensor(0.0866, device='cuda:0')\n",
      "100 tensor(0.0422, device='cuda:0')\n",
      "200 tensor(0.1481, device='cuda:0')\n",
      "300 tensor(0.0337, device='cuda:0')\n",
      "Iteration: 93 | Loss: 0.05034120753407478 | Train,Test accuracy: 0.9854300022125244.3f%, 0.8571004867553711.3f%\n",
      "0 tensor(0.0428, device='cuda:0')\n",
      "100 tensor(0.0154, device='cuda:0')\n",
      "200 tensor(0.0220, device='cuda:0')\n",
      "300 tensor(0.0206, device='cuda:0')\n",
      "Iteration: 94 | Loss: 0.053695280104875565 | Train,Test accuracy: 0.9838715195655823.3f%, 0.855617105960846.3f%\n",
      "0 tensor(0.0506, device='cuda:0')\n",
      "100 tensor(0.0758, device='cuda:0')\n",
      "200 tensor(0.0840, device='cuda:0')\n",
      "300 tensor(0.0274, device='cuda:0')\n",
      "Iteration: 95 | Loss: 0.0526147335767746 | Train,Test accuracy: 0.9857016801834106.3f%, 0.8552215099334717.3f%\n",
      "0 tensor(0.0123, device='cuda:0')\n",
      "100 tensor(0.0581, device='cuda:0')\n",
      "200 tensor(0.0389, device='cuda:0')\n",
      "300 tensor(0.0663, device='cuda:0')\n",
      "Iteration: 96 | Loss: 0.049745626747608185 | Train,Test accuracy: 0.9834438562393188.3f%, 0.8512658476829529.3f%\n",
      "0 tensor(0.0624, device='cuda:0')\n",
      "100 tensor(0.0316, device='cuda:0')\n",
      "200 tensor(0.1441, device='cuda:0')\n",
      "300 tensor(0.0173, device='cuda:0')\n",
      "Iteration: 97 | Loss: 0.04868887737393379 | Train,Test accuracy: 0.9833040237426758.3f%, 0.8597705960273743.3f%\n",
      "0 tensor(0.0172, device='cuda:0')\n",
      "100 tensor(0.0783, device='cuda:0')\n",
      "200 tensor(0.0102, device='cuda:0')\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "300 tensor(0.0225, device='cuda:0')\n",
      "Iteration: 98 | Loss: 0.05276075378060341 | Train,Test accuracy: 0.9845628142356873.3f%, 0.8580893874168396.3f%\n",
      "0 tensor(0.0573, device='cuda:0')\n",
      "100 tensor(0.0347, device='cuda:0')\n",
      "200 tensor(0.0754, device='cuda:0')\n",
      "300 tensor(0.0304, device='cuda:0')\n",
      "Iteration: 99 | Loss: 0.05254628509283066 | Train,Test accuracy: 0.9838155508041382.3f%, 0.8546281456947327.3f%\n",
      "0 tensor(0.0249, device='cuda:0')\n",
      "100 tensor(0.0274, device='cuda:0')\n",
      "200 tensor(0.0277, device='cuda:0')\n",
      "300 tensor(0.0280, device='cuda:0')\n",
      "Iteration: 100 | Loss: 0.052360910922288895 | Train,Test accuracy: 0.9824248552322388.3f%, 0.8542326092720032.3f%\n",
      "0 tensor(0.0355, device='cuda:0')\n",
      "100 tensor(0.0206, device='cuda:0')\n",
      "200 tensor(0.0129, device='cuda:0')\n",
      "300 tensor(0.0590, device='cuda:0')\n",
      "Iteration: 101 | Loss: 0.051820430904626846 | Train,Test accuracy: 0.9851303100585938.3f%, 0.8532436490058899.3f%\n",
      "0 tensor(0.0166, device='cuda:0')\n",
      "100 tensor(0.0190, device='cuda:0')\n",
      "200 tensor(0.0180, device='cuda:0')\n",
      "300 tensor(0.0357, device='cuda:0')\n",
      "Iteration: 102 | Loss: 0.05093114823102951 | Train,Test accuracy: 0.9848025441169739.3f%, 0.8564082384109497.3f%\n",
      "0 tensor(0.0455, device='cuda:0')\n",
      "100 tensor(0.0188, device='cuda:0')\n",
      "200 tensor(0.0267, device='cuda:0')\n",
      "300 tensor(0.0196, device='cuda:0')\n",
      "Iteration: 103 | Loss: 0.055741481482982635 | Train,Test accuracy: 0.9827445149421692.3f%, 0.854727029800415.3f%\n",
      "0 tensor(0.0458, device='cuda:0')\n",
      "100 tensor(0.0201, device='cuda:0')\n",
      "200 tensor(0.0303, device='cuda:0')\n",
      "300 tensor(0.0208, device='cuda:0')\n",
      "Iteration: 104 | Loss: 0.0495804138481617 | Train,Test accuracy: 0.9843710064888.3f%, 0.8559137582778931.3f%\n",
      "0 tensor(0.0457, device='cuda:0')\n",
      "100 tensor(0.0326, device='cuda:0')\n",
      "200 tensor(0.0292, device='cuda:0')\n",
      "300 tensor(0.0754, device='cuda:0')\n",
      "Iteration: 105 | Loss: 0.051849812269210815 | Train,Test accuracy: 0.9845947623252869.3f%, 0.8610561490058899.3f%\n",
      "0 tensor(0.0569, device='cuda:0')\n",
      "100 tensor(0.0391, device='cuda:0')\n",
      "200 tensor(0.0346, device='cuda:0')\n",
      "300 tensor(0.1545, device='cuda:0')\n",
      "Iteration: 106 | Loss: 0.05456412211060524 | Train,Test accuracy: 0.9853820204734802.3f%, 0.8601661324501038.3f%\n",
      "0 tensor(0.0383, device='cuda:0')\n",
      "100 tensor(0.0181, device='cuda:0')\n",
      "200 tensor(0.0185, device='cuda:0')\n",
      "300 tensor(0.1169, device='cuda:0')\n",
      "Iteration: 107 | Loss: 0.052458688616752625 | Train,Test accuracy: 0.9816336631774902.3f%, 0.8517602682113647.3f%\n",
      "0 tensor(0.0480, device='cuda:0')\n",
      "100 tensor(0.0085, device='cuda:0')\n",
      "200 tensor(0.0335, device='cuda:0')\n",
      "300 tensor(0.0110, device='cuda:0')\n",
      "Iteration: 108 | Loss: 0.05314749479293823 | Train,Test accuracy: 0.986820638179779.3f%, 0.8661985993385315.3f%\n",
      "0 tensor(0.0063, device='cuda:0')\n",
      "100 tensor(0.0379, device='cuda:0')\n",
      "200 tensor(0.0466, device='cuda:0')\n",
      "300 tensor(0.1659, device='cuda:0')\n",
      "Iteration: 109 | Loss: 0.050469860434532166 | Train,Test accuracy: 0.9858136177062988.3f%, 0.8549248576164246.3f%\n",
      "0 tensor(0.0710, device='cuda:0')\n",
      "100 tensor(0.0107, device='cuda:0')\n",
      "200 tensor(0.0453, device='cuda:0')\n",
      "300 tensor(0.0314, device='cuda:0')\n",
      "Iteration: 110 | Loss: 0.05011303350329399 | Train,Test accuracy: 0.9836516976356506.3f%, 0.8524525165557861.3f%\n",
      "0 tensor(0.1307, device='cuda:0')\n",
      "100 tensor(0.0148, device='cuda:0')\n",
      "200 tensor(0.0315, device='cuda:0')\n",
      "300 tensor(0.0910, device='cuda:0')\n",
      "Iteration: 111 | Loss: 0.05082453414797783 | Train,Test accuracy: 0.9851342439651489.3f%, 0.8588805198669434.3f%\n",
      "0 tensor(0.1440, device='cuda:0')\n",
      "100 tensor(0.0374, device='cuda:0')\n",
      "200 tensor(0.0881, device='cuda:0')\n",
      "300 tensor(0.0179, device='cuda:0')\n",
      "Iteration: 112 | Loss: 0.05382862687110901 | Train,Test accuracy: 0.9833320379257202.3f%, 0.861155092716217.3f%\n",
      "0 tensor(0.0438, device='cuda:0')\n",
      "100 tensor(0.0662, device='cuda:0')\n",
      "200 tensor(0.0595, device='cuda:0')\n",
      "300 tensor(0.0322, device='cuda:0')\n",
      "Iteration: 113 | Loss: 0.05396992713212967 | Train,Test accuracy: 0.9857016801834106.3f%, 0.856210470199585.3f%\n",
      "0 tensor(0.0381, device='cuda:0')\n",
      "100 tensor(0.0811, device='cuda:0')\n",
      "200 tensor(0.0420, device='cuda:0')\n",
      "300 tensor(0.0917, device='cuda:0')\n",
      "Iteration: 114 | Loss: 0.053994711488485336 | Train,Test accuracy: 0.983555793762207.3f%, 0.8594738841056824.3f%\n",
      "0 tensor(0.0320, device='cuda:0')\n",
      "100 tensor(0.0333, device='cuda:0')\n",
      "200 tensor(0.0438, device='cuda:0')\n",
      "300 tensor(0.0779, device='cuda:0')\n",
      "Iteration: 115 | Loss: 0.0499132014811039 | Train,Test accuracy: 0.9837235808372498.3f%, 0.8584849834442139.3f%\n",
      "0 tensor(0.1074, device='cuda:0')\n",
      "100 tensor(0.0726, device='cuda:0')\n",
      "200 tensor(0.0289, device='cuda:0')\n",
      "300 tensor(0.0306, device='cuda:0')\n",
      "Iteration: 116 | Loss: 0.05305192247033119 | Train,Test accuracy: 0.9836956262588501.3f%, 0.8514636158943176.3f%\n",
      "0 tensor(0.0654, device='cuda:0')\n",
      "100 tensor(0.0650, device='cuda:0')\n",
      "200 tensor(0.0162, device='cuda:0')\n",
      "300 tensor(0.0577, device='cuda:0')\n",
      "Iteration: 117 | Loss: 0.0527903214097023 | Train,Test accuracy: 0.9849984049797058.3f%, 0.8626384735107422.3f%\n",
      "0 tensor(0.0335, device='cuda:0')\n",
      "100 tensor(0.0727, device='cuda:0')\n",
      "200 tensor(0.0389, device='cuda:0')\n",
      "300 tensor(0.0961, device='cuda:0')\n",
      "Iteration: 118 | Loss: 0.05290709808468819 | Train,Test accuracy: 0.9848025441169739.3f%, 0.8551226258277893.3f%\n",
      "0 tensor(0.0509, device='cuda:0')\n",
      "100 tensor(0.0633, device='cuda:0')\n",
      "200 tensor(0.0537, device='cuda:0')\n",
      "300 tensor(0.0702, device='cuda:0')\n",
      "Iteration: 119 | Loss: 0.05336315184831619 | Train,Test accuracy: 0.985529899597168.3f%, 0.8563093543052673.3f%\n",
      "0 tensor(0.0769, device='cuda:0')\n",
      "100 tensor(0.0625, device='cuda:0')\n",
      "200 tensor(0.0294, device='cuda:0')\n",
      "300 tensor(0.0244, device='cuda:0')\n",
      "Iteration: 120 | Loss: 0.05315898731350899 | Train,Test accuracy: 0.9839514493942261.3f%, 0.8585838675498962.3f%\n",
      "0 tensor(0.0617, device='cuda:0')\n",
      "100 tensor(0.0766, device='cuda:0')\n",
      "200 tensor(0.0197, device='cuda:0')\n",
      "300 tensor(0.0331, device='cuda:0')\n",
      "Iteration: 121 | Loss: 0.05250406265258789 | Train,Test accuracy: 0.9846027493476868.3f%, 0.8569027185440063.3f%\n",
      "0 tensor(0.0744, device='cuda:0')\n",
      "100 tensor(0.1527, device='cuda:0')\n",
      "200 tensor(0.0382, device='cuda:0')\n",
      "300 tensor(0.0428, device='cuda:0')\n",
      "Iteration: 122 | Loss: 0.05565039813518524 | Train,Test accuracy: 0.9830322861671448.3f%, 0.853342592716217.3f%\n",
      "0 tensor(0.0847, device='cuda:0')\n",
      "100 tensor(0.0346, device='cuda:0')\n",
      "200 tensor(0.0949, device='cuda:0')\n",
      "300 tensor(0.0870, device='cuda:0')\n",
      "Iteration: 123 | Loss: 0.04979327693581581 | Train,Test accuracy: 0.9859694838523865.3f%, 0.8535403609275818.3f%\n",
      "0 tensor(0.0177, device='cuda:0')\n",
      "100 tensor(0.0373, device='cuda:0')\n",
      "200 tensor(0.0166, device='cuda:0')\n",
      "300 tensor(0.0503, device='cuda:0')\n",
      "Iteration: 124 | Loss: 0.056142523884773254 | Train,Test accuracy: 0.9832839965820312.3f%, 0.8529469966888428.3f%\n",
      "0 tensor(0.0909, device='cuda:0')\n",
      "100 tensor(0.0817, device='cuda:0')\n",
      "200 tensor(0.0489, device='cuda:0')\n",
      "300 tensor(0.0182, device='cuda:0')\n",
      "Iteration: 125 | Loss: 0.051277678459882736 | Train,Test accuracy: 0.9842551350593567.3f%, 0.8580893874168396.3f%\n",
      "0 tensor(0.0396, device='cuda:0')\n",
      "100 tensor(0.0669, device='cuda:0')\n",
      "200 tensor(0.0835, device='cuda:0')\n",
      "300 tensor(0.0473, device='cuda:0')\n",
      "Iteration: 126 | Loss: 0.05626244097948074 | Train,Test accuracy: 0.9849424362182617.3f%, 0.8535403609275818.3f%\n",
      "0 tensor(0.0216, device='cuda:0')\n",
      "100 tensor(0.0625, device='cuda:0')\n",
      "200 tensor(0.0284, device='cuda:0')\n",
      "300 tensor(0.0079, device='cuda:0')\n",
      "Iteration: 127 | Loss: 0.05444957688450813 | Train,Test accuracy: 0.9840033054351807.3f%, 0.8559137582778931.3f%\n",
      "0 tensor(0.0746, device='cuda:0')\n",
      "100 tensor(0.0593, device='cuda:0')\n",
      "200 tensor(0.0132, device='cuda:0')\n",
      "300 tensor(0.0367, device='cuda:0')\n",
      "Iteration: 128 | Loss: 0.04916450008749962 | Train,Test accuracy: 0.981801450252533.3f%, 0.8534414768218994.3f%\n",
      "0 tensor(0.0274, device='cuda:0')\n",
      "100 tensor(0.0460, device='cuda:0')\n",
      "200 tensor(0.0549, device='cuda:0')\n",
      "300 tensor(0.0235, device='cuda:0')\n",
      "Iteration: 129 | Loss: 0.051128704100847244 | Train,Test accuracy: 0.9827086329460144.3f%, 0.8505735993385315.3f%\n",
      "0 tensor(0.0834, device='cuda:0')\n",
      "100 tensor(0.0122, device='cuda:0')\n",
      "200 tensor(0.0785, device='cuda:0')\n",
      "300 tensor(0.0676, device='cuda:0')\n",
      "Iteration: 130 | Loss: 0.053153250366449356 | Train,Test accuracy: 0.9849984049797058.3f%, 0.8522547483444214.3f%\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 tensor(0.0637, device='cuda:0')\n",
      "100 tensor(0.0369, device='cuda:0')\n",
      "200 tensor(0.0419, device='cuda:0')\n",
      "300 tensor(0.0944, device='cuda:0')\n",
      "Iteration: 131 | Loss: 0.05280294641852379 | Train,Test accuracy: 0.9838834404945374.3f%, 0.8534414768218994.3f%\n",
      "0 tensor(0.0162, device='cuda:0')\n",
      "100 tensor(0.0623, device='cuda:0')\n",
      "200 tensor(0.0662, device='cuda:0')\n",
      "300 tensor(0.0136, device='cuda:0')\n",
      "Iteration: 132 | Loss: 0.05186932161450386 | Train,Test accuracy: 0.9833439588546753.3f%, 0.8544303774833679.3f%\n",
      "0 tensor(0.0685, device='cuda:0')\n",
      "100 tensor(0.0403, device='cuda:0')\n",
      "200 tensor(0.0969, device='cuda:0')\n",
      "300 tensor(0.0717, device='cuda:0')\n",
      "Iteration: 133 | Loss: 0.053128719329833984 | Train,Test accuracy: 0.9852342009544373.3f%, 0.853342592716217.3f%\n",
      "0 tensor(0.0313, device='cuda:0')\n",
      "100 tensor(0.0407, device='cuda:0')\n",
      "200 tensor(0.0236, device='cuda:0')\n",
      "300 tensor(0.0771, device='cuda:0')\n",
      "Iteration: 134 | Loss: 0.048060342669487 | Train,Test accuracy: 0.984043300151825.3f%, 0.8546281456947327.3f%\n",
      "0 tensor(0.0232, device='cuda:0')\n",
      "100 tensor(0.0408, device='cuda:0')\n",
      "200 tensor(0.0349, device='cuda:0')\n",
      "300 tensor(0.0425, device='cuda:0')\n",
      "Iteration: 135 | Loss: 0.051847051829099655 | Train,Test accuracy: 0.9814578294754028.3f%, 0.8499802350997925.3f%\n",
      "0 tensor(0.1156, device='cuda:0')\n",
      "100 tensor(0.0795, device='cuda:0')\n",
      "200 tensor(0.0111, device='cuda:0')\n",
      "300 tensor(0.0388, device='cuda:0')\n",
      "Iteration: 136 | Loss: 0.05324248597025871 | Train,Test accuracy: 0.9840033054351807.3f%, 0.8551226258277893.3f%\n",
      "0 tensor(0.0737, device='cuda:0')\n",
      "100 tensor(0.0670, device='cuda:0')\n",
      "200 tensor(0.0577, device='cuda:0')\n",
      "300 tensor(0.1040, device='cuda:0')\n",
      "Iteration: 137 | Loss: 0.05240204185247421 | Train,Test accuracy: 0.984522819519043.3f%, 0.8582871556282043.3f%\n",
      "0 tensor(0.0795, device='cuda:0')\n",
      "100 tensor(0.0741, device='cuda:0')\n",
      "200 tensor(0.0547, device='cuda:0')\n",
      "300 tensor(0.0475, device='cuda:0')\n",
      "Iteration: 138 | Loss: 0.05275028198957443 | Train,Test accuracy: 0.9850423336029053.3f%, 0.8568037748336792.3f%\n",
      "0 tensor(0.0486, device='cuda:0')\n",
      "100 tensor(0.0807, device='cuda:0')\n",
      "200 tensor(0.0679, device='cuda:0')\n",
      "300 tensor(0.0949, device='cuda:0')\n",
      "Iteration: 139 | Loss: 0.05395760014653206 | Train,Test accuracy: 0.984043300151825.3f%, 0.8597705960273743.3f%\n",
      "0 tensor(0.0577, device='cuda:0')\n",
      "100 tensor(0.0368, device='cuda:0')\n",
      "200 tensor(0.0461, device='cuda:0')\n",
      "300 tensor(0.0622, device='cuda:0')\n",
      "Iteration: 140 | Loss: 0.05133286491036415 | Train,Test accuracy: 0.9830842018127441.3f%, 0.8529469966888428.3f%\n",
      "0 tensor(0.1445, device='cuda:0')\n",
      "100 tensor(0.0458, device='cuda:0')\n",
      "200 tensor(0.0461, device='cuda:0')\n",
      "300 tensor(0.0583, device='cuda:0')\n",
      "Iteration: 141 | Loss: 0.051673728972673416 | Train,Test accuracy: 0.9837316274642944.3f%, 0.8544303774833679.3f%\n",
      "0 tensor(0.0557, device='cuda:0')\n",
      "100 tensor(0.0490, device='cuda:0')\n",
      "200 tensor(0.0340, device='cuda:0')\n",
      "300 tensor(0.0272, device='cuda:0')\n",
      "Iteration: 142 | Loss: 0.029841676354408264 | Train,Test accuracy: 0.9933623671531677.3f%, 0.866594135761261.3f%\n",
      "0 tensor(0.0052, device='cuda:0')\n",
      "100 tensor(0.0212, device='cuda:0')\n",
      "200 tensor(0.0212, device='cuda:0')\n",
      "300 tensor(0.0218, device='cuda:0')\n",
      "Iteration: 143 | Loss: 0.018711339682340622 | Train,Test accuracy: 0.9952046275138855.3f%, 0.8676819801330566.3f%\n",
      "0 tensor(0.0140, device='cuda:0')\n",
      "100 tensor(0.0515, device='cuda:0')\n",
      "200 tensor(0.0322, device='cuda:0')\n",
      "300 tensor(0.0030, device='cuda:0')\n",
      "Iteration: 144 | Loss: 0.015201980248093605 | Train,Test accuracy: 0.9966192841529846.3f%, 0.868374228477478.3f%\n",
      "0 tensor(0.0045, device='cuda:0')\n",
      "100 tensor(0.0338, device='cuda:0')\n",
      "200 tensor(0.0040, device='cuda:0')\n",
      "300 tensor(0.0088, device='cuda:0')\n",
      "Iteration: 145 | Loss: 0.013038501143455505 | Train,Test accuracy: 0.9968630075454712.3f%, 0.8716376423835754.3f%\n",
      "0 tensor(0.0009, device='cuda:0')\n",
      "100 tensor(0.0050, device='cuda:0')\n",
      "200 tensor(0.0053, device='cuda:0')\n",
      "300 tensor(0.0060, device='cuda:0')\n",
      "Iteration: 146 | Loss: 0.011461419053375721 | Train,Test accuracy: 0.9968630075454712.3f%, 0.8728243708610535.3f%\n",
      "0 tensor(0.0089, device='cuda:0')\n",
      "100 tensor(0.0035, device='cuda:0')\n",
      "200 tensor(0.0074, device='cuda:0')\n",
      "300 tensor(0.0084, device='cuda:0')\n",
      "Iteration: 147 | Loss: 0.010813015513122082 | Train,Test accuracy: 0.9970628023147583.3f%, 0.8729232549667358.3f%\n",
      "0 tensor(0.0091, device='cuda:0')\n",
      "100 tensor(0.0046, device='cuda:0')\n",
      "200 tensor(0.0108, device='cuda:0')\n",
      "300 tensor(0.0034, device='cuda:0')\n",
      "Iteration: 148 | Loss: 0.009931707754731178 | Train,Test accuracy: 0.9973185658454895.3f%, 0.8751977682113647.3f%\n",
      "0 tensor(0.0109, device='cuda:0')\n",
      "100 tensor(0.0030, device='cuda:0')\n",
      "200 tensor(0.0046, device='cuda:0')\n",
      "300 tensor(0.0050, device='cuda:0')\n",
      "Iteration: 149 | Loss: 0.009989509359002113 | Train,Test accuracy: 0.9976223111152649.3f%, 0.8723298907279968.3f%\n",
      "0 tensor(0.0012, device='cuda:0')\n",
      "100 tensor(0.0160, device='cuda:0')\n",
      "200 tensor(0.0025, device='cuda:0')\n",
      "300 tensor(0.0018, device='cuda:0')\n",
      "Iteration: 150 | Loss: 0.009514286182820797 | Train,Test accuracy: 0.9979020357131958.3f%, 0.8708465099334717.3f%\n",
      "0 tensor(0.0044, device='cuda:0')\n",
      "100 tensor(0.0056, device='cuda:0')\n",
      "200 tensor(0.0481, device='cuda:0')\n",
      "300 tensor(0.0033, device='cuda:0')\n",
      "Iteration: 151 | Loss: 0.008989457972347736 | Train,Test accuracy: 0.9975223541259766.3f%, 0.8717365264892578.3f%\n",
      "0 tensor(0.0017, device='cuda:0')\n",
      "100 tensor(0.0076, device='cuda:0')\n",
      "200 tensor(0.0055, device='cuda:0')\n",
      "300 tensor(0.0016, device='cuda:0')\n",
      "Iteration: 152 | Loss: 0.008200379088521004 | Train,Test accuracy: 0.9972026944160461.3f%, 0.875.3f%\n",
      "0 tensor(0.0099, device='cuda:0')\n",
      "100 tensor(0.0088, device='cuda:0')\n",
      "200 tensor(0.0254, device='cuda:0')\n",
      "300 tensor(0.0049, device='cuda:0')\n",
      "Iteration: 153 | Loss: 0.008581436239182949 | Train,Test accuracy: 0.9975423812866211.3f%, 0.8660996556282043.3f%\n",
      "0 tensor(0.0080, device='cuda:0')\n",
      "100 tensor(0.0093, device='cuda:0')\n",
      "200 tensor(0.0074, device='cuda:0')\n",
      "300 tensor(0.0054, device='cuda:0')\n",
      "Iteration: 154 | Loss: 0.009070077911019325 | Train,Test accuracy: 0.9979419708251953.3f%, 0.8699564933776855.3f%\n",
      "0 tensor(0.0078, device='cuda:0')\n",
      "100 tensor(0.0023, device='cuda:0')\n",
      "200 tensor(0.0030, device='cuda:0')\n",
      "300 tensor(0.0008, device='cuda:0')\n",
      "Iteration: 155 | Loss: 0.008486218750476837 | Train,Test accuracy: 0.9981297850608826.3f%, 0.8697587251663208.3f%\n",
      "0 tensor(0.0011, device='cuda:0')\n",
      "100 tensor(0.0279, device='cuda:0')\n",
      "200 tensor(0.0051, device='cuda:0')\n",
      "300 tensor(0.0084, device='cuda:0')\n",
      "Iteration: 156 | Loss: 0.008010569028556347 | Train,Test accuracy: 0.9980378746986389.3f%, 0.8726266026496887.3f%\n",
      "0 tensor(0.0092, device='cuda:0')\n",
      "100 tensor(0.0045, device='cuda:0')\n",
      "200 tensor(0.0219, device='cuda:0')\n",
      "300 tensor(0.0190, device='cuda:0')\n",
      "Iteration: 157 | Loss: 0.007090769708156586 | Train,Test accuracy: 0.9980019330978394.3f%, 0.8741099834442139.3f%\n",
      "0 tensor(0.0027, device='cuda:0')\n",
      "100 tensor(0.0019, device='cuda:0')\n",
      "200 tensor(0.0032, device='cuda:0')\n",
      "300 tensor(0.0050, device='cuda:0')\n",
      "Iteration: 158 | Loss: 0.00753862364217639 | Train,Test accuracy: 0.9978620409965515.3f%, 0.8742088675498962.3f%\n",
      "0 tensor(0.0007, device='cuda:0')\n",
      "100 tensor(0.0077, device='cuda:0')\n",
      "200 tensor(0.0049, device='cuda:0')\n",
      "300 tensor(0.0118, device='cuda:0')\n",
      "Iteration: 159 | Loss: 0.0075094024650752544 | Train,Test accuracy: 0.9977222084999084.3f%, 0.8695608973503113.3f%\n",
      "0 tensor(0.0111, device='cuda:0')\n",
      "100 tensor(0.0031, device='cuda:0')\n",
      "200 tensor(0.0024, device='cuda:0')\n",
      "300 tensor(0.0010, device='cuda:0')\n",
      "Iteration: 160 | Loss: 0.007094698958098888 | Train,Test accuracy: 0.9980418682098389.3f%, 0.8716376423835754.3f%\n",
      "0 tensor(0.0022, device='cuda:0')\n",
      "100 tensor(0.0022, device='cuda:0')\n",
      "200 tensor(0.0005, device='cuda:0')\n",
      "300 tensor(0.0081, device='cuda:0')\n",
      "Iteration: 161 | Loss: 0.006802024785429239 | Train,Test accuracy: 0.9981817603111267.3f%, 0.8739121556282043.3f%\n",
      "0 tensor(0.0013, device='cuda:0')\n",
      "100 tensor(0.0016, device='cuda:0')\n",
      "200 tensor(0.0011, device='cuda:0')\n",
      "300 tensor(0.0015, device='cuda:0')\n",
      "Iteration: 162 | Loss: 0.007102069910615683 | Train,Test accuracy: 0.9981817603111267.3f%, 0.8713409900665283.3f%\n",
      "0 tensor(0.0033, device='cuda:0')\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "100 tensor(0.0172, device='cuda:0')\n",
      "200 tensor(0.0011, device='cuda:0')\n",
      "300 tensor(0.0057, device='cuda:0')\n",
      "Iteration: 163 | Loss: 0.007399177644401789 | Train,Test accuracy: 0.9979619383811951.3f%, 0.8727254867553711.3f%\n",
      "0 tensor(0.0011, device='cuda:0')\n",
      "100 tensor(0.0102, device='cuda:0')\n",
      "200 tensor(0.0010, device='cuda:0')\n",
      "300 tensor(0.0025, device='cuda:0')\n",
      "Iteration: 164 | Loss: 0.006926909554749727 | Train,Test accuracy: 0.9976822137832642.3f%, 0.8729232549667358.3f%\n",
      "0 tensor(0.0013, device='cuda:0')\n",
      "100 tensor(0.0198, device='cuda:0')\n",
      "200 tensor(0.0004, device='cuda:0')\n",
      "300 tensor(0.0285, device='cuda:0')\n",
      "Iteration: 165 | Loss: 0.007756717968732119 | Train,Test accuracy: 0.9981817603111267.3f%, 0.8710442781448364.3f%\n",
      "0 tensor(0.0014, device='cuda:0')\n",
      "100 tensor(0.0141, device='cuda:0')\n",
      "200 tensor(0.0070, device='cuda:0')\n",
      "300 tensor(0.0051, device='cuda:0')\n",
      "Iteration: 166 | Loss: 0.007576040457934141 | Train,Test accuracy: 0.997482419013977.3f%, 0.8688686490058899.3f%\n",
      "0 tensor(0.0090, device='cuda:0')\n",
      "100 tensor(0.0016, device='cuda:0')\n",
      "200 tensor(0.0010, device='cuda:0')\n",
      "300 tensor(0.0013, device='cuda:0')\n",
      "Iteration: 167 | Loss: 0.006242012605071068 | Train,Test accuracy: 0.9980818629264832.3f%, 0.8728243708610535.3f%\n",
      "0 tensor(0.0014, device='cuda:0')\n",
      "100 tensor(0.0177, device='cuda:0')\n",
      "200 tensor(0.0038, device='cuda:0')\n",
      "300 tensor(0.0012, device='cuda:0')\n",
      "Iteration: 168 | Loss: 0.006438688840717077 | Train,Test accuracy: 0.9982017278671265.3f%, 0.8697587251663208.3f%\n",
      "0 tensor(0.0455, device='cuda:0')\n",
      "100 tensor(0.0084, device='cuda:0')\n",
      "200 tensor(0.0018, device='cuda:0')\n",
      "300 tensor(0.0008, device='cuda:0')\n",
      "Iteration: 169 | Loss: 0.007695586886256933 | Train,Test accuracy: 0.9976102709770203.3f%, 0.8690664768218994.3f%\n",
      "0 tensor(0.0112, device='cuda:0')\n",
      "100 tensor(0.0012, device='cuda:0')\n",
      "200 tensor(0.0233, device='cuda:0')\n",
      "300 tensor(0.0301, device='cuda:0')\n",
      "Iteration: 170 | Loss: 0.00767182745039463 | Train,Test accuracy: 0.9980618357658386.3f%, 0.8699564933776855.3f%\n",
      "0 tensor(0.0016, device='cuda:0')\n",
      "100 tensor(0.0030, device='cuda:0')\n",
      "200 tensor(0.0037, device='cuda:0')\n",
      "300 tensor(0.0069, device='cuda:0')\n",
      "Iteration: 171 | Loss: 0.006897815503180027 | Train,Test accuracy: 0.9981217980384827.3f%, 0.8748022317886353.3f%\n",
      "0 tensor(0.0021, device='cuda:0')\n",
      "100 tensor(0.0053, device='cuda:0')\n",
      "200 tensor(0.0041, device='cuda:0')\n",
      "300 tensor(0.0044, device='cuda:0')\n",
      "Iteration: 172 | Loss: 0.006569176912307739 | Train,Test accuracy: 0.9981018304824829.3f%, 0.8742088675498962.3f%\n",
      "0 tensor(0.0302, device='cuda:0')\n",
      "100 tensor(0.0125, device='cuda:0')\n",
      "200 tensor(0.0011, device='cuda:0')\n",
      "300 tensor(0.0009, device='cuda:0')\n",
      "Iteration: 173 | Loss: 0.007396455388516188 | Train,Test accuracy: 0.9983215928077698.3f%, 0.8690664768218994.3f%\n",
      "0 tensor(0.0045, device='cuda:0')\n",
      "100 tensor(0.0182, device='cuda:0')\n",
      "200 tensor(0.0007, device='cuda:0')\n",
      "300 tensor(0.0109, device='cuda:0')\n",
      "Iteration: 174 | Loss: 0.006542656570672989 | Train,Test accuracy: 0.9979819655418396.3f%, 0.8752966523170471.3f%\n",
      "0 tensor(0.0013, device='cuda:0')\n",
      "100 tensor(0.0022, device='cuda:0')\n",
      "200 tensor(0.0021, device='cuda:0')\n",
      "300 tensor(0.0112, device='cuda:0')\n",
      "Iteration: 175 | Loss: 0.006709451321512461 | Train,Test accuracy: 0.9981018304824829.3f%, 0.870945394039154.3f%\n",
      "0 tensor(0.0020, device='cuda:0')\n",
      "100 tensor(0.0012, device='cuda:0')\n",
      "200 tensor(0.0006, device='cuda:0')\n",
      "300 tensor(0.0035, device='cuda:0')\n",
      "Iteration: 176 | Loss: 0.007354232482612133 | Train,Test accuracy: 0.9984814524650574.3f%, 0.8717365264892578.3f%\n",
      "0 tensor(0.0019, device='cuda:0')\n",
      "100 tensor(0.0010, device='cuda:0')\n",
      "200 tensor(0.0049, device='cuda:0')\n",
      "300 tensor(0.0093, device='cuda:0')\n",
      "Iteration: 177 | Loss: 0.0056660473346710205 | Train,Test accuracy: 0.9980818629264832.3f%, 0.8702531456947327.3f%\n",
      "0 tensor(0.0271, device='cuda:0')\n",
      "100 tensor(0.0018, device='cuda:0')\n",
      "200 tensor(0.0011, device='cuda:0')\n",
      "300 tensor(0.0012, device='cuda:0')\n",
      "Iteration: 178 | Loss: 0.007982213981449604 | Train,Test accuracy: 0.9980897903442383.3f%, 0.8696597814559937.3f%\n",
      "0 tensor(0.0039, device='cuda:0')\n",
      "100 tensor(0.0054, device='cuda:0')\n",
      "200 tensor(0.0087, device='cuda:0')\n",
      "300 tensor(0.0020, device='cuda:0')\n",
      "Iteration: 179 | Loss: 0.007246931549161673 | Train,Test accuracy: 0.9977821111679077.3f%, 0.870945394039154.3f%\n",
      "0 tensor(0.0492, device='cuda:0')\n",
      "100 tensor(0.0004, device='cuda:0')\n",
      "200 tensor(0.0009, device='cuda:0')\n",
      "300 tensor(0.0006, device='cuda:0')\n",
      "Iteration: 180 | Loss: 0.006443744525313377 | Train,Test accuracy: 0.998161792755127.3f%, 0.8701542615890503.3f%\n",
      "0 tensor(0.0019, device='cuda:0')\n",
      "100 tensor(0.0021, device='cuda:0')\n",
      "200 tensor(0.0008, device='cuda:0')\n",
      "300 tensor(0.0020, device='cuda:0')\n",
      "Iteration: 181 | Loss: 0.006047403439879417 | Train,Test accuracy: 0.9982097148895264.3f%, 0.8714398741722107.3f%\n",
      "0 tensor(0.0084, device='cuda:0')\n",
      "100 tensor(0.0126, device='cuda:0')\n",
      "200 tensor(0.0044, device='cuda:0')\n",
      "300 tensor(0.0012, device='cuda:0')\n",
      "Iteration: 182 | Loss: 0.007436038926243782 | Train,Test accuracy: 0.9980579018592834.3f%, 0.8711432218551636.3f%\n",
      "0 tensor(0.0245, device='cuda:0')\n",
      "100 tensor(0.0225, device='cuda:0')\n",
      "200 tensor(0.0076, device='cuda:0')\n",
      "300 tensor(0.0040, device='cuda:0')\n",
      "Iteration: 183 | Loss: 0.007027592975646257 | Train,Test accuracy: 0.9981817603111267.3f%, 0.8708465099334717.3f%\n",
      "0 tensor(0.0146, device='cuda:0')\n",
      "100 tensor(0.0074, device='cuda:0')\n",
      "200 tensor(0.0070, device='cuda:0')\n",
      "300 tensor(0.0009, device='cuda:0')\n",
      "Iteration: 184 | Loss: 0.00760949170216918 | Train,Test accuracy: 0.9982017278671265.3f%, 0.8729232549667358.3f%\n",
      "0 tensor(0.0013, device='cuda:0')\n",
      "100 tensor(0.0054, device='cuda:0')\n",
      "200 tensor(0.0060, device='cuda:0')\n",
      "300 tensor(0.0010, device='cuda:0')\n",
      "Iteration: 185 | Loss: 0.007806888781487942 | Train,Test accuracy: 0.9983416199684143.3f%, 0.8748022317886353.3f%\n",
      "0 tensor(0.0012, device='cuda:0')\n",
      "100 tensor(0.0010, device='cuda:0')\n",
      "200 tensor(0.0026, device='cuda:0')\n",
      "300 tensor(0.0082, device='cuda:0')\n",
      "Iteration: 186 | Loss: 0.0069940718822181225 | Train,Test accuracy: 0.9978021383285522.3f%, 0.8705498576164246.3f%\n",
      "0 tensor(0.0051, device='cuda:0')\n",
      "100 tensor(0.0178, device='cuda:0')\n",
      "200 tensor(0.0180, device='cuda:0')\n",
      "300 tensor(0.0086, device='cuda:0')\n",
      "Iteration: 187 | Loss: 0.007060096599161625 | Train,Test accuracy: 0.997762143611908.3f%, 0.868374228477478.3f%\n",
      "0 tensor(0.0246, device='cuda:0')\n",
      "100 tensor(0.0245, device='cuda:0')\n",
      "200 tensor(0.0018, device='cuda:0')\n",
      "300 tensor(0.0308, device='cuda:0')\n",
      "Iteration: 188 | Loss: 0.00687339948490262 | Train,Test accuracy: 0.9986612796783447.3f%, 0.8719343543052673.3f%\n",
      "0 tensor(0.0027, device='cuda:0')\n",
      "100 tensor(0.0047, device='cuda:0')\n",
      "200 tensor(0.0179, device='cuda:0')\n",
      "300 tensor(0.0069, device='cuda:0')\n",
      "Iteration: 189 | Loss: 0.0065715317614376545 | Train,Test accuracy: 0.9980418682098389.3f%, 0.871835470199585.3f%\n",
      "0 tensor(0.0017, device='cuda:0')\n",
      "100 tensor(0.0165, device='cuda:0')\n",
      "200 tensor(0.0017, device='cuda:0')\n",
      "300 tensor(0.0010, device='cuda:0')\n",
      "Iteration: 190 | Loss: 0.007950118742883205 | Train,Test accuracy: 0.9979020357131958.3f%, 0.8724287748336792.3f%\n",
      "0 tensor(0.0009, device='cuda:0')\n",
      "100 tensor(0.0031, device='cuda:0')\n",
      "200 tensor(0.0040, device='cuda:0')\n",
      "300 tensor(0.0295, device='cuda:0')\n",
      "Iteration: 191 | Loss: 0.007499221712350845 | Train,Test accuracy: 0.9977421760559082.3f%, 0.871242105960846.3f%\n",
      "0 tensor(0.0088, device='cuda:0')\n",
      "100 tensor(0.0013, device='cuda:0')\n",
      "200 tensor(0.0014, device='cuda:0')\n",
      "300 tensor(0.0093, device='cuda:0')\n",
      "Iteration: 192 | Loss: 0.006277809850871563 | Train,Test accuracy: 0.9981018304824829.3f%, 0.870352029800415.3f%\n",
      "0 tensor(0.0017, device='cuda:0')\n",
      "100 tensor(0.0108, device='cuda:0')\n",
      "200 tensor(0.0009, device='cuda:0')\n",
      "300 tensor(0.0106, device='cuda:0')\n",
      "Iteration: 193 | Loss: 0.005901625845581293 | Train,Test accuracy: 0.9980618357658386.3f%, 0.8671875.3f%\n",
      "0 tensor(0.0034, device='cuda:0')\n",
      "100 tensor(0.0083, device='cuda:0')\n",
      "200 tensor(0.0015, device='cuda:0')\n",
      "300 tensor(0.0007, device='cuda:0')\n",
      "Iteration: 194 | Loss: 0.00697740213945508 | Train,Test accuracy: 0.9985414147377014.3f%, 0.8710442781448364.3f%\n",
      "0 tensor(0.0026, device='cuda:0')\n",
      "100 tensor(0.0023, device='cuda:0')\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "200 tensor(0.0005, device='cuda:0')\n",
      "300 tensor(0.0050, device='cuda:0')\n",
      "Iteration: 195 | Loss: 0.006790527608245611 | Train,Test accuracy: 0.9985813498497009.3f%, 0.8700553774833679.3f%\n",
      "0 tensor(0.0242, device='cuda:0')\n",
      "100 tensor(0.0012, device='cuda:0')\n",
      "200 tensor(0.0189, device='cuda:0')\n",
      "300 tensor(0.0102, device='cuda:0')\n",
      "Iteration: 196 | Loss: 0.006438868585973978 | Train,Test accuracy: 0.9985613822937012.3f%, 0.8728243708610535.3f%\n",
      "0 tensor(0.0034, device='cuda:0')\n",
      "100 tensor(0.0029, device='cuda:0')\n",
      "200 tensor(0.0153, device='cuda:0')\n",
      "300 tensor(0.0175, device='cuda:0')\n",
      "Iteration: 197 | Loss: 0.007481008302420378 | Train,Test accuracy: 0.9976622462272644.3f%, 0.8717365264892578.3f%\n",
      "0 tensor(0.0025, device='cuda:0')\n",
      "100 tensor(0.0072, device='cuda:0')\n",
      "200 tensor(0.0120, device='cuda:0')\n",
      "300 tensor(0.0039, device='cuda:0')\n",
      "Iteration: 198 | Loss: 0.007488665170967579 | Train,Test accuracy: 0.9978820085525513.3f%, 0.8746044039726257.3f%\n",
      "0 tensor(0.0013, device='cuda:0')\n",
      "100 tensor(0.0025, device='cuda:0')\n",
      "200 tensor(0.0013, device='cuda:0')\n",
      "300 tensor(0.0688, device='cuda:0')\n",
      "Iteration: 199 | Loss: 0.00675368495285511 | Train,Test accuracy: 0.9981417655944824.3f%, 0.8713409900665283.3f%\n",
      "0 tensor(0.0016, device='cuda:0')\n",
      "100 tensor(0.0007, device='cuda:0')\n",
      "200 tensor(0.0173, device='cuda:0')\n",
      "300 tensor(0.0021, device='cuda:0')\n",
      "Iteration: 200 | Loss: 0.007075566332787275 | Train,Test accuracy: 0.9978820085525513.3f%, 0.8652096390724182.3f%\n",
      "==> Finished Training ...\n"
     ]
    }
   ],
   "source": [
    "# net = DNNCifar(args=args).to(args.device)\n",
    "\n",
    "criterion = nn.CrossEntropyLoss()\n",
    "optimizer = optim.Adam(net.parameters(), lr=0.001, weight_decay=3e-4)\n",
    "\n",
    "# optimizer = optim.SGD(net.parameters(), lr=0.05, momentum=0.9, weight_decay=0.0001)\n",
    "\n",
    "train_accuracy_qXsquare2 = []\n",
    "train_loss_qXsquare2 = []\n",
    "test_accuracy_qXsquare2  = []\n",
    "test_loss_qXsquare2  = []\n",
    "\n",
    "\n",
    "for epoch in range(200):\n",
    "    \n",
    "    if epoch <= 80:\n",
    "        cur_lr = 0.001\n",
    "    elif epoch <= 140:\n",
    "        cur_lr = 0.0005\n",
    "    else:    \n",
    "        cur_lr = 0.0001\n",
    "#     else:\n",
    "#         cur_lr = 0.0004\n",
    "    \n",
    "    for g in optimizer.param_groups:\n",
    "        g['lr'] = cur_lr\n",
    "        \n",
    "    running_loss = 0.0\n",
    "    for i, data in enumerate(trainloader, 0):\n",
    "        # get the inputs\n",
    "        inputs, labels = data\n",
    "\n",
    "        if args.gpu:\n",
    "            inputs = inputs.cuda()\n",
    "            labels = labels.cuda()\n",
    "\n",
    "        # wrap them in Variable\n",
    "        inputs, labels = Variable(inputs), Variable(labels)\n",
    "\n",
    "        # zero the parameter gradients\n",
    "        optimizer.zero_grad()\n",
    "\n",
    "        # forward + backward + optimize\n",
    "        outputs = net(inputs)\n",
    "        loss = criterion(outputs, labels)\n",
    "        loss.backward()\n",
    "\n",
    "        if epoch > 16:\n",
    "            for group in optimizer.param_groups:\n",
    "                for p in group['params']:\n",
    "                    state = optimizer.state[p]\n",
    "                    if state['step'] >= 1024:\n",
    "                        state['step'] = 1000\n",
    "        optimizer.step()\n",
    "\n",
    "\n",
    "        # print statistics\n",
    "        if i % 100 == 0:\n",
    "            print(i,loss.data)\n",
    "        running_loss += loss.data\n",
    "\n",
    "    # Normalizing the loss by the total number of train batches\n",
    "    running_loss /= len(trainloader)\n",
    "\n",
    "    # Calculate training/test set accuracy of the existing model\n",
    "    test_loss, test_accuracy = validation(net, testloader, criterion)\n",
    "    train_loss, train_accuracy = validation(net, trainloader, criterion)\n",
    "\n",
    "    print(\"Iteration: {0} | Loss: {1} |\".format(epoch+1, running_loss),\n",
    "          \"Train,Test accuracy: {0}.3f%, {1}.3f%\".format(train_accuracy/len(trainloader), test_accuracy/len(testloader)) )\n",
    "    \n",
    "    train_accuracy_qXsquare2.append(train_accuracy/len(trainloader))\n",
    "    train_loss_qXsquare2.append(train_loss)\n",
    "    \n",
    "    test_accuracy_qXsquare2.append(test_accuracy/len(testloader))\n",
    "    test_loss_qXsquare2.append(test_loss)\n",
    "    \n",
    "    # Specify a path\n",
    "    PATH = \"./save_models/CIFAR10_VGG11_xsq2_E200_iter\"+str(epoch)+\"_v1.pt\"\n",
    "    torch.save(net.state_dict(), PATH)\n",
    "\n",
    "    # save model\n",
    "#     if epoch % 50 == 0:\n",
    "#         print('==> Saving model ...')\n",
    "#         state = {\n",
    "#             'net': net.module if opt.is_gpu else net,\n",
    "#             'epoch': epoch,\n",
    "#         }\n",
    "#         if not os.path.isdir('checkpoint'):\n",
    "#             os.mkdir('checkpoint')\n",
    "#         torch.save(state, '../checkpoint/ckpt.t7')\n",
    "\n",
    "print('==> Finished Training ...')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "qVGG_xsquare(\n",
       "  (features): Sequential(\n",
       "    (0): QuantConv2d(\n",
       "      3, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (2): QuantXsquare(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (3): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (4): QuantConv2d(\n",
       "      64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (5): BatchNorm2d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (6): QuantXsquare(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (7): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (8): QuantConv2d(\n",
       "      128, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (9): BatchNorm2d(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (10): QuantXsquare(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (11): QuantConv2d(\n",
       "      256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (12): BatchNorm2d(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (13): QuantXsquare(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (14): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (15): QuantConv2d(\n",
       "      256, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (16): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (17): QuantXsquare(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (18): QuantConv2d(\n",
       "      512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (19): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (20): QuantXsquare(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (21): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (22): QuantConv2d(\n",
       "      512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (23): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (24): QuantXsquare(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (25): QuantConv2d(\n",
       "      512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (26): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
       "    (27): QuantXsquare(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (28): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (29): AvgPool2d(kernel_size=1, stride=1, padding=0)\n",
       "  )\n",
       "  (classifier): Linear(in_features=512, out_features=10, bias=True)\n",
       ")"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from torch.nn import Module\n",
    "import torch.nn.functional as F\n",
    "import brevitas.nn as qnn\n",
    "from brevitas.core.quant import QuantType\n",
    "\n",
    "bit_width_sel = 8\n",
    "\n",
    "class qVGG_xsquare(nn.Module):\n",
    "    def __init__(self, vgg_name):\n",
    "        super(qVGG_xsquare, self).__init__()\n",
    "        self.features = self._make_layers(cfg[vgg_name])\n",
    "        self.classifier = nn.Linear(512, 10)\n",
    "\n",
    "    def forward(self, x):\n",
    "        out = self.features(x)\n",
    "        out = out.view(out.size(0), -1)\n",
    "        out = self.classifier(out)\n",
    "        return out\n",
    "\n",
    "    def _make_layers(self, cfg):\n",
    "        layers = []\n",
    "        in_channels = 3\n",
    "        for x in cfg:\n",
    "            if x == 'M':\n",
    "                #layers += [nn.MaxPool2d(kernel_size=2, stride=2)]\n",
    "                layers += [nn.AvgPool2d(kernel_size=2, stride=2)]\n",
    "            else:\n",
    "                layers += [qnn.QuantConv2d(in_channels, out_channels=x, kernel_size=3, padding=1, weight_quant_type=QuantType.INT, \n",
    "                                     weight_bit_width=bit_width_sel),\n",
    "                           nn.BatchNorm2d(x),\n",
    "                           qnn.QuantXsquare(quant_type=QuantType.INT, bit_width=8, max_val=6)]\n",
    "                in_channels = x\n",
    "        layers += [nn.AvgPool2d(kernel_size=1, stride=1)]\n",
    "        return nn.Sequential(*layers)\n",
    "    \n",
    "    \n",
    "                    \n",
    "net = qVGG_xsquare('VGG11')\n",
    "net.cuda()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 tensor(2.4825, device='cuda:0')\n",
      "100 tensor(2.3049, device='cuda:0')\n",
      "200 tensor(2.1837, device='cuda:0')\n",
      "300 tensor(2.0935, device='cuda:0')\n",
      "Iteration: 1 | Loss: 2.2176079750061035 | Train,Test accuracy: 0.2139306217432022.3f%, 0.20065268874168396.3f%\n",
      "0 tensor(2.1044, device='cuda:0')\n",
      "100 tensor(2.0587, device='cuda:0')\n",
      "200 tensor(1.9165, device='cuda:0')\n",
      "300 tensor(1.7028, device='cuda:0')\n",
      "Iteration: 2 | Loss: 1.8930039405822754 | Train,Test accuracy: 0.35620203614234924.3f%, 0.36085838079452515.3f%\n",
      "0 tensor(1.8674, device='cuda:0')\n",
      "100 tensor(1.5362, device='cuda:0')\n",
      "200 tensor(1.5074, device='cuda:0')\n",
      "300 tensor(1.4186, device='cuda:0')\n",
      "Iteration: 3 | Loss: 1.5230740308761597 | Train,Test accuracy: 0.5346307158470154.3f%, 0.5048457384109497.3f%\n",
      "0 tensor(1.3298, device='cuda:0')\n",
      "100 tensor(1.3659, device='cuda:0')\n",
      "200 tensor(1.0783, device='cuda:0')\n",
      "300 tensor(1.0243, device='cuda:0')\n",
      "Iteration: 4 | Loss: 1.1532636880874634 | Train,Test accuracy: 0.6573768854141235.3f%, 0.6210442781448364.3f%\n",
      "0 tensor(0.9366, device='cuda:0')\n",
      "100 tensor(1.0661, device='cuda:0')\n",
      "200 tensor(1.0054, device='cuda:0')\n",
      "300 tensor(0.9187, device='cuda:0')\n",
      "Iteration: 5 | Loss: 0.9291924834251404 | Train,Test accuracy: 0.7213115096092224.3f%, 0.6776107549667358.3f%\n",
      "0 tensor(0.7550, device='cuda:0')\n",
      "100 tensor(0.8169, device='cuda:0')\n",
      "200 tensor(0.7120, device='cuda:0')\n",
      "300 tensor(0.7717, device='cuda:0')\n",
      "Iteration: 6 | Loss: 0.7598826885223389 | Train,Test accuracy: 0.7760030031204224.3f%, 0.736155092716217.3f%\n",
      "0 tensor(0.5350, device='cuda:0')\n",
      "100 tensor(0.7239, device='cuda:0')\n",
      "200 tensor(0.6021, device='cuda:0')\n",
      "300 tensor(0.5322, device='cuda:0')\n",
      "Iteration: 7 | Loss: 0.6460302472114563 | Train,Test accuracy: 0.8144261240959167.3f%, 0.761867105960846.3f%\n",
      "0 tensor(0.4907, device='cuda:0')\n",
      "100 tensor(0.5601, device='cuda:0')\n",
      "200 tensor(0.5749, device='cuda:0')\n",
      "300 tensor(0.4458, device='cuda:0')\n",
      "Iteration: 8 | Loss: 0.5705034136772156 | Train,Test accuracy: 0.8323888778686523.3f%, 0.7787777185440063.3f%\n",
      "0 tensor(0.4483, device='cuda:0')\n",
      "100 tensor(0.5061, device='cuda:0')\n",
      "200 tensor(0.4942, device='cuda:0')\n",
      "300 tensor(0.3955, device='cuda:0')\n",
      "Iteration: 9 | Loss: 0.5093491673469543 | Train,Test accuracy: 0.8500199913978577.3f%, 0.7996439933776855.3f%\n",
      "0 tensor(0.3178, device='cuda:0')\n",
      "100 tensor(0.3564, device='cuda:0')\n",
      "200 tensor(0.4029, device='cuda:0')\n",
      "300 tensor(0.5631, device='cuda:0')\n",
      "Iteration: 10 | Loss: 0.4694652557373047 | Train,Test accuracy: 0.860190212726593.3f%, 0.7879746556282043.3f%\n",
      "0 tensor(0.3597, device='cuda:0')\n",
      "100 tensor(0.4066, device='cuda:0')\n",
      "200 tensor(0.3024, device='cuda:0')\n",
      "300 tensor(0.5301, device='cuda:0')\n",
      "Iteration: 11 | Loss: 0.43443623185157776 | Train,Test accuracy: 0.8647778034210205.3f%, 0.801522970199585.3f%\n",
      "0 tensor(0.3582, device='cuda:0')\n",
      "100 tensor(0.4398, device='cuda:0')\n",
      "200 tensor(0.3355, device='cuda:0')\n",
      "300 tensor(0.3444, device='cuda:0')\n",
      "Iteration: 12 | Loss: 0.4089670777320862 | Train,Test accuracy: 0.8844988346099854.3f%, 0.8164557218551636.3f%\n",
      "0 tensor(0.1887, device='cuda:0')\n",
      "100 tensor(0.3967, device='cuda:0')\n",
      "200 tensor(0.4094, device='cuda:0')\n",
      "300 tensor(0.2918, device='cuda:0')\n",
      "Iteration: 13 | Loss: 0.3776015341281891 | Train,Test accuracy: 0.8823889493942261.3f%, 0.8179391026496887.3f%\n",
      "0 tensor(0.3333, device='cuda:0')\n",
      "100 tensor(0.3356, device='cuda:0')\n",
      "200 tensor(0.3610, device='cuda:0')\n",
      "300 tensor(0.3133, device='cuda:0')\n",
      "Iteration: 14 | Loss: 0.35693225264549255 | Train,Test accuracy: 0.8886309266090393.3f%, 0.805280864238739.3f%\n",
      "0 tensor(0.2936, device='cuda:0')\n",
      "100 tensor(0.3938, device='cuda:0')\n",
      "200 tensor(0.3054, device='cuda:0')\n",
      "300 tensor(0.3269, device='cuda:0')\n",
      "Iteration: 15 | Loss: 0.3365142345428467 | Train,Test accuracy: 0.9000759124755859.3f%, 0.8303995132446289.3f%\n",
      "0 tensor(0.2586, device='cuda:0')\n",
      "100 tensor(0.3546, device='cuda:0')\n",
      "200 tensor(0.3645, device='cuda:0')\n",
      "300 tensor(0.5015, device='cuda:0')\n",
      "Iteration: 16 | Loss: 0.32334259152412415 | Train,Test accuracy: 0.9042679071426392.3f%, 0.8295094966888428.3f%\n",
      "0 tensor(0.3299, device='cuda:0')\n",
      "100 tensor(0.3217, device='cuda:0')\n",
      "200 tensor(0.3684, device='cuda:0')\n",
      "300 tensor(0.2546, device='cuda:0')\n",
      "Iteration: 17 | Loss: 0.30644726753234863 | Train,Test accuracy: 0.9131313562393188.3f%, 0.8296083807945251.3f%\n",
      "0 tensor(0.2720, device='cuda:0')\n",
      "100 tensor(0.1717, device='cuda:0')\n",
      "200 tensor(0.1643, device='cuda:0')\n",
      "300 tensor(0.2206, device='cuda:0')\n",
      "Iteration: 18 | Loss: 0.25851941108703613 | Train,Test accuracy: 0.9265465140342712.3f%, 0.8388053774833679.3f%\n",
      "0 tensor(0.3209, device='cuda:0')\n",
      "100 tensor(0.3118, device='cuda:0')\n",
      "200 tensor(0.3082, device='cuda:0')\n",
      "300 tensor(0.2043, device='cuda:0')\n",
      "Iteration: 19 | Loss: 0.24730846285820007 | Train,Test accuracy: 0.9278852343559265.3f%, 0.8326740264892578.3f%\n",
      "0 tensor(0.1485, device='cuda:0')\n",
      "100 tensor(0.2536, device='cuda:0')\n",
      "200 tensor(0.2979, device='cuda:0')\n",
      "300 tensor(0.2674, device='cuda:0')\n",
      "Iteration: 20 | Loss: 0.2336621731519699 | Train,Test accuracy: 0.9313498735427856.3f%, 0.8334652185440063.3f%\n",
      "0 tensor(0.2187, device='cuda:0')\n",
      "100 tensor(0.2038, device='cuda:0')\n",
      "200 tensor(0.3004, device='cuda:0')\n",
      "300 tensor(0.2653, device='cuda:0')\n",
      "Iteration: 21 | Loss: 0.22540408372879028 | Train,Test accuracy: 0.9368006587028503.3f%, 0.8375197649002075.3f%\n",
      "0 tensor(0.0963, device='cuda:0')\n",
      "100 tensor(0.2136, device='cuda:0')\n",
      "200 tensor(0.2668, device='cuda:0')\n",
      "300 tensor(0.2045, device='cuda:0')\n",
      "Iteration: 22 | Loss: 0.21807627379894257 | Train,Test accuracy: 0.9373601078987122.3f%, 0.8361352682113647.3f%\n",
      "0 tensor(0.1349, device='cuda:0')\n",
      "100 tensor(0.1413, device='cuda:0')\n",
      "200 tensor(0.3706, device='cuda:0')\n",
      "300 tensor(0.1542, device='cuda:0')\n",
      "Iteration: 23 | Loss: 0.2120073437690735 | Train,Test accuracy: 0.9367647171020508.3f%, 0.8339596390724182.3f%\n",
      "0 tensor(0.2190, device='cuda:0')\n",
      "100 tensor(0.1612, device='cuda:0')\n",
      "200 tensor(0.2071, device='cuda:0')\n",
      "300 tensor(0.2433, device='cuda:0')\n",
      "Iteration: 24 | Loss: 0.20447759330272675 | Train,Test accuracy: 0.9362532496452332.3f%, 0.8322784900665283.3f%\n",
      "0 tensor(0.2120, device='cuda:0')\n",
      "100 tensor(0.1199, device='cuda:0')\n",
      "200 tensor(0.3032, device='cuda:0')\n",
      "300 tensor(0.1925, device='cuda:0')\n",
      "Iteration: 25 | Loss: 0.19512759149074554 | Train,Test accuracy: 0.9432504773139954.3f%, 0.8298061490058899.3f%\n",
      "0 tensor(0.1453, device='cuda:0')\n",
      "100 tensor(0.2368, device='cuda:0')\n",
      "200 tensor(0.1840, device='cuda:0')\n",
      "300 tensor(0.2543, device='cuda:0')\n",
      "Iteration: 26 | Loss: 0.18784956634044647 | Train,Test accuracy: 0.9403333067893982.3f%, 0.8368275165557861.3f%\n",
      "0 tensor(0.1401, device='cuda:0')\n",
      "100 tensor(0.1803, device='cuda:0')\n",
      "200 tensor(0.1464, device='cuda:0')\n",
      "300 tensor(0.3592, device='cuda:0')\n",
      "Iteration: 27 | Loss: 0.18521173298358917 | Train,Test accuracy: 0.9479379653930664.3f%, 0.8359375.3f%\n",
      "0 tensor(0.2474, device='cuda:0')\n",
      "100 tensor(0.1147, device='cuda:0')\n",
      "200 tensor(0.2232, device='cuda:0')\n",
      "300 tensor(0.1563, device='cuda:0')\n",
      "Iteration: 28 | Loss: 0.18075130879878998 | Train,Test accuracy: 0.9491128325462341.3f%, 0.843156635761261.3f%\n",
      "0 tensor(0.0603, device='cuda:0')\n",
      "100 tensor(0.1322, device='cuda:0')\n",
      "200 tensor(0.2159, device='cuda:0')\n",
      "300 tensor(0.1899, device='cuda:0')\n",
      "Iteration: 29 | Loss: 0.17850017547607422 | Train,Test accuracy: 0.9449608325958252.3f%, 0.8256527185440063.3f%\n",
      "0 tensor(0.2628, device='cuda:0')\n",
      "100 tensor(0.1369, device='cuda:0')\n",
      "200 tensor(0.1425, device='cuda:0')\n",
      "300 tensor(0.1881, device='cuda:0')\n",
      "Iteration: 30 | Loss: 0.1730067878961563 | Train,Test accuracy: 0.9490728974342346.3f%, 0.8337618708610535.3f%\n",
      "0 tensor(0.1148, device='cuda:0')\n",
      "100 tensor(0.1365, device='cuda:0')\n",
      "200 tensor(0.1183, device='cuda:0')\n",
      "300 tensor(0.1482, device='cuda:0')\n",
      "Iteration: 31 | Loss: 0.16918030381202698 | Train,Test accuracy: 0.950343668460846.3f%, 0.8420688509941101.3f%\n",
      "0 tensor(0.0840, device='cuda:0')\n",
      "100 tensor(0.1712, device='cuda:0')\n",
      "200 tensor(0.1829, device='cuda:0')\n",
      "300 tensor(0.0985, device='cuda:0')\n",
      "Iteration: 32 | Loss: 0.17056846618652344 | Train,Test accuracy: 0.9547234773635864.3f%, 0.8404865264892578.3f%\n",
      "0 tensor(0.1253, device='cuda:0')\n",
      "100 tensor(0.1372, device='cuda:0')\n",
      "200 tensor(0.2859, device='cuda:0')\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "300 tensor(0.1795, device='cuda:0')\n",
      "Iteration: 33 | Loss: 0.15842460095882416 | Train,Test accuracy: 0.9508112072944641.3f%, 0.8390031456947327.3f%\n",
      "0 tensor(0.1140, device='cuda:0')\n",
      "100 tensor(0.2567, device='cuda:0')\n",
      "200 tensor(0.1303, device='cuda:0')\n",
      "300 tensor(0.1283, device='cuda:0')\n",
      "Iteration: 34 | Loss: 0.16433629393577576 | Train,Test accuracy: 0.95414799451828.3f%, 0.8363330960273743.3f%\n",
      "0 tensor(0.1333, device='cuda:0')\n",
      "100 tensor(0.1069, device='cuda:0')\n",
      "200 tensor(0.0813, device='cuda:0')\n",
      "300 tensor(0.1712, device='cuda:0')\n",
      "Iteration: 35 | Loss: 0.15894900262355804 | Train,Test accuracy: 0.9511988759040833.3f%, 0.8433544039726257.3f%\n",
      "0 tensor(0.1134, device='cuda:0')\n",
      "100 tensor(0.2731, device='cuda:0')\n",
      "200 tensor(0.1097, device='cuda:0')\n",
      "300 tensor(0.0937, device='cuda:0')\n",
      "Iteration: 36 | Loss: 0.15414714813232422 | Train,Test accuracy: 0.9555466771125793.3f%, 0.8448378443717957.3f%\n",
      "0 tensor(0.0802, device='cuda:0')\n",
      "100 tensor(0.1583, device='cuda:0')\n",
      "200 tensor(0.1862, device='cuda:0')\n",
      "300 tensor(0.1587, device='cuda:0')\n",
      "Iteration: 37 | Loss: 0.15752261877059937 | Train,Test accuracy: 0.954615592956543.3f%, 0.839992105960846.3f%\n",
      "0 tensor(0.1091, device='cuda:0')\n",
      "100 tensor(0.1635, device='cuda:0')\n",
      "200 tensor(0.1809, device='cuda:0')\n",
      "300 tensor(0.0908, device='cuda:0')\n",
      "Iteration: 38 | Loss: 0.14996300637722015 | Train,Test accuracy: 0.9549392461776733.3f%, 0.8402887582778931.3f%\n",
      "0 tensor(0.0843, device='cuda:0')\n",
      "100 tensor(0.1746, device='cuda:0')\n",
      "200 tensor(0.1800, device='cuda:0')\n",
      "300 tensor(0.2076, device='cuda:0')\n",
      "Iteration: 39 | Loss: 0.1504337340593338 | Train,Test accuracy: 0.955159068107605.3f%, 0.8313884735107422.3f%\n",
      "0 tensor(0.1384, device='cuda:0')\n",
      "100 tensor(0.1423, device='cuda:0')\n",
      "200 tensor(0.1510, device='cuda:0')\n",
      "300 tensor(0.1057, device='cuda:0')\n",
      "Iteration: 40 | Loss: 0.1493544727563858 | Train,Test accuracy: 0.9567894339561462.3f%, 0.8453322649002075.3f%\n",
      "0 tensor(0.1015, device='cuda:0')\n",
      "100 tensor(0.1976, device='cuda:0')\n",
      "200 tensor(0.1341, device='cuda:0')\n",
      "300 tensor(0.1321, device='cuda:0')\n",
      "Iteration: 41 | Loss: 0.14785027503967285 | Train,Test accuracy: 0.9542639255523682.3f%, 0.8403876423835754.3f%\n",
      "0 tensor(0.1180, device='cuda:0')\n",
      "100 tensor(0.2581, device='cuda:0')\n",
      "200 tensor(0.1699, device='cuda:0')\n",
      "300 tensor(0.1333, device='cuda:0')\n",
      "Iteration: 42 | Loss: 0.14280085265636444 | Train,Test accuracy: 0.9591512680053711.3f%, 0.839695394039154.3f%\n",
      "0 tensor(0.0976, device='cuda:0')\n",
      "100 tensor(0.1286, device='cuda:0')\n",
      "200 tensor(0.1341, device='cuda:0')\n",
      "300 tensor(0.1424, device='cuda:0')\n",
      "Iteration: 43 | Loss: 0.14628729224205017 | Train,Test accuracy: 0.9581202268600464.3f%, 0.8386076092720032.3f%\n",
      "0 tensor(0.1398, device='cuda:0')\n",
      "100 tensor(0.1248, device='cuda:0')\n",
      "200 tensor(0.2550, device='cuda:0')\n",
      "300 tensor(0.0611, device='cuda:0')\n",
      "Iteration: 44 | Loss: 0.14797867834568024 | Train,Test accuracy: 0.9593230485916138.3f%, 0.8398932218551636.3f%\n",
      "0 tensor(0.0734, device='cuda:0')\n",
      "100 tensor(0.2005, device='cuda:0')\n",
      "200 tensor(0.1450, device='cuda:0')\n",
      "300 tensor(0.1489, device='cuda:0')\n",
      "Iteration: 45 | Loss: 0.14521916210651398 | Train,Test accuracy: 0.9601821899414062.3f%, 0.8459256291389465.3f%\n",
      "0 tensor(0.0916, device='cuda:0')\n",
      "100 tensor(0.1847, device='cuda:0')\n",
      "200 tensor(0.0921, device='cuda:0')\n",
      "300 tensor(0.2311, device='cuda:0')\n",
      "Iteration: 46 | Loss: 0.13850785791873932 | Train,Test accuracy: 0.961273193359375.3f%, 0.8487935066223145.3f%\n",
      "0 tensor(0.1885, device='cuda:0')\n",
      "100 tensor(0.1699, device='cuda:0')\n",
      "200 tensor(0.1396, device='cuda:0')\n",
      "300 tensor(0.1199, device='cuda:0')\n",
      "Iteration: 47 | Loss: 0.13496792316436768 | Train,Test accuracy: 0.9592551589012146.3f%, 0.8352452516555786.3f%\n",
      "0 tensor(0.1271, device='cuda:0')\n",
      "100 tensor(0.1892, device='cuda:0')\n",
      "200 tensor(0.1725, device='cuda:0')\n",
      "300 tensor(0.1516, device='cuda:0')\n",
      "Iteration: 48 | Loss: 0.13948562741279602 | Train,Test accuracy: 0.9608255624771118.3f%, 0.8452333807945251.3f%\n",
      "0 tensor(0.1026, device='cuda:0')\n",
      "100 tensor(0.1319, device='cuda:0')\n",
      "200 tensor(0.1447, device='cuda:0')\n",
      "300 tensor(0.1716, device='cuda:0')\n",
      "Iteration: 49 | Loss: 0.13566020131111145 | Train,Test accuracy: 0.9583240151405334.3f%, 0.8373219966888428.3f%\n",
      "0 tensor(0.1781, device='cuda:0')\n",
      "100 tensor(0.1487, device='cuda:0')\n",
      "200 tensor(0.1533, device='cuda:0')\n",
      "300 tensor(0.1426, device='cuda:0')\n",
      "Iteration: 50 | Loss: 0.13493740558624268 | Train,Test accuracy: 0.960729718208313.3f%, 0.8436511158943176.3f%\n",
      "0 tensor(0.0674, device='cuda:0')\n",
      "100 tensor(0.0637, device='cuda:0')\n",
      "200 tensor(0.1180, device='cuda:0')\n",
      "300 tensor(0.1743, device='cuda:0')\n",
      "Iteration: 51 | Loss: 0.13366466760635376 | Train,Test accuracy: 0.956913411617279.3f%, 0.8395965099334717.3f%\n",
      "0 tensor(0.1439, device='cuda:0')\n",
      "100 tensor(0.1489, device='cuda:0')\n",
      "200 tensor(0.1636, device='cuda:0')\n",
      "300 tensor(0.1258, device='cuda:0')\n",
      "Iteration: 52 | Loss: 0.13486424088478088 | Train,Test accuracy: 0.9615689516067505.3f%, 0.8434533476829529.3f%\n",
      "0 tensor(0.0315, device='cuda:0')\n",
      "100 tensor(0.1054, device='cuda:0')\n",
      "200 tensor(0.2792, device='cuda:0')\n",
      "300 tensor(0.1276, device='cuda:0')\n",
      "Iteration: 53 | Loss: 0.1340857595205307 | Train,Test accuracy: 0.962971568107605.3f%, 0.8421677350997925.3f%\n",
      "0 tensor(0.2112, device='cuda:0')\n",
      "100 tensor(0.1144, device='cuda:0')\n",
      "200 tensor(0.1590, device='cuda:0')\n",
      "300 tensor(0.1514, device='cuda:0')\n",
      "Iteration: 54 | Loss: 0.1280236393213272 | Train,Test accuracy: 0.9600423574447632.3f%, 0.8325751423835754.3f%\n",
      "0 tensor(0.1051, device='cuda:0')\n",
      "100 tensor(0.0856, device='cuda:0')\n",
      "200 tensor(0.1430, device='cuda:0')\n",
      "300 tensor(0.1279, device='cuda:0')\n",
      "Iteration: 55 | Loss: 0.1276153177022934 | Train,Test accuracy: 0.963111400604248.3f%, 0.8494857549667358.3f%\n",
      "0 tensor(0.1048, device='cuda:0')\n",
      "100 tensor(0.1162, device='cuda:0')\n",
      "200 tensor(0.2077, device='cuda:0')\n",
      "300 tensor(0.1463, device='cuda:0')\n",
      "Iteration: 56 | Loss: 0.12795785069465637 | Train,Test accuracy: 0.96433025598526.3f%, 0.8510680198669434.3f%\n",
      "0 tensor(0.1052, device='cuda:0')\n",
      "100 tensor(0.0571, device='cuda:0')\n",
      "200 tensor(0.0854, device='cuda:0')\n",
      "300 tensor(0.2122, device='cuda:0')\n",
      "Iteration: 57 | Loss: 0.131869375705719 | Train,Test accuracy: 0.9652373790740967.3f%, 0.8432555198669434.3f%\n",
      "0 tensor(0.1310, device='cuda:0')\n",
      "100 tensor(0.1572, device='cuda:0')\n",
      "200 tensor(0.1030, device='cuda:0')\n",
      "300 tensor(0.1453, device='cuda:0')\n",
      "Iteration: 58 | Loss: 0.13127940893173218 | Train,Test accuracy: 0.9633951187133789.3f%, 0.8442444801330566.3f%\n",
      "0 tensor(0.1753, device='cuda:0')\n",
      "100 tensor(0.0768, device='cuda:0')\n",
      "200 tensor(0.1543, device='cuda:0')\n",
      "300 tensor(0.1352, device='cuda:0')\n",
      "Iteration: 59 | Loss: 0.125573992729187 | Train,Test accuracy: 0.9611852169036865.3f%, 0.8395965099334717.3f%\n",
      "0 tensor(0.0910, device='cuda:0')\n",
      "100 tensor(0.0570, device='cuda:0')\n",
      "200 tensor(0.1364, device='cuda:0')\n",
      "300 tensor(0.0908, device='cuda:0')\n",
      "Iteration: 60 | Loss: 0.12394355237483978 | Train,Test accuracy: 0.9620324373245239.3f%, 0.8409810066223145.3f%\n",
      "0 tensor(0.1499, device='cuda:0')\n",
      "100 tensor(0.1017, device='cuda:0')\n",
      "200 tensor(0.1064, device='cuda:0')\n",
      "300 tensor(0.0977, device='cuda:0')\n",
      "Iteration: 61 | Loss: 0.12623478472232819 | Train,Test accuracy: 0.963323175907135.3f%, 0.8404865264892578.3f%\n",
      "0 tensor(0.1000, device='cuda:0')\n",
      "100 tensor(0.1312, device='cuda:0')\n",
      "200 tensor(0.1037, device='cuda:0')\n",
      "300 tensor(0.1852, device='cuda:0')\n",
      "Iteration: 62 | Loss: 0.12977126240730286 | Train,Test accuracy: 0.9610613584518433.3f%, 0.844343364238739.3f%\n",
      "0 tensor(0.1719, device='cuda:0')\n",
      "100 tensor(0.0595, device='cuda:0')\n",
      "200 tensor(0.0802, device='cuda:0')\n",
      "300 tensor(0.0842, device='cuda:0')\n",
      "Iteration: 63 | Loss: 0.12350454926490784 | Train,Test accuracy: 0.9638386964797974.3f%, 0.8375197649002075.3f%\n",
      "0 tensor(0.0912, device='cuda:0')\n",
      "100 tensor(0.1068, device='cuda:0')\n",
      "200 tensor(0.1303, device='cuda:0')\n",
      "300 tensor(0.1279, device='cuda:0')\n",
      "Iteration: 64 | Loss: 0.12799285352230072 | Train,Test accuracy: 0.9656530022621155.3f%, 0.837717592716217.3f%\n",
      "0 tensor(0.0745, device='cuda:0')\n",
      "100 tensor(0.0991, device='cuda:0')\n",
      "200 tensor(0.1290, device='cuda:0')\n",
      "300 tensor(0.0595, device='cuda:0')\n",
      "Iteration: 65 | Loss: 0.12004116922616959 | Train,Test accuracy: 0.9623640775680542.3f%, 0.8356408476829529.3f%\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 tensor(0.0998, device='cuda:0')\n",
      "100 tensor(0.0931, device='cuda:0')\n",
      "200 tensor(0.2760, device='cuda:0')\n",
      "300 tensor(0.0701, device='cuda:0')\n",
      "Iteration: 66 | Loss: 0.12435042858123779 | Train,Test accuracy: 0.9659087657928467.3f%, 0.8404865264892578.3f%\n",
      "0 tensor(0.1630, device='cuda:0')\n",
      "100 tensor(0.1546, device='cuda:0')\n",
      "200 tensor(0.0669, device='cuda:0')\n",
      "300 tensor(0.1274, device='cuda:0')\n",
      "Iteration: 67 | Loss: 0.12174427509307861 | Train,Test accuracy: 0.9644980430603027.3f%, 0.8474090099334717.3f%\n",
      "0 tensor(0.0932, device='cuda:0')\n",
      "100 tensor(0.1055, device='cuda:0')\n",
      "200 tensor(0.1278, device='cuda:0')\n",
      "300 tensor(0.1592, device='cuda:0')\n",
      "Iteration: 68 | Loss: 0.12501846253871918 | Train,Test accuracy: 0.968957781791687.3f%, 0.8441455960273743.3f%\n",
      "0 tensor(0.0750, device='cuda:0')\n",
      "100 tensor(0.0660, device='cuda:0')\n",
      "200 tensor(0.1560, device='cuda:0')\n",
      "300 tensor(0.0459, device='cuda:0')\n",
      "Iteration: 69 | Loss: 0.12076500058174133 | Train,Test accuracy: 0.959574818611145.3f%, 0.8414754867553711.3f%\n",
      "0 tensor(0.0938, device='cuda:0')\n",
      "100 tensor(0.1361, device='cuda:0')\n",
      "200 tensor(0.0696, device='cuda:0')\n",
      "300 tensor(0.1095, device='cuda:0')\n",
      "Iteration: 70 | Loss: 0.12126409262418747 | Train,Test accuracy: 0.9667559266090393.3f%, 0.8502768874168396.3f%\n",
      "0 tensor(0.0284, device='cuda:0')\n",
      "100 tensor(0.1271, device='cuda:0')\n",
      "200 tensor(0.0985, device='cuda:0')\n",
      "300 tensor(0.1188, device='cuda:0')\n",
      "Iteration: 71 | Loss: 0.12273896485567093 | Train,Test accuracy: 0.965896725654602.3f%, 0.8418710231781006.3f%\n",
      "0 tensor(0.1117, device='cuda:0')\n",
      "100 tensor(0.1331, device='cuda:0')\n",
      "200 tensor(0.1044, device='cuda:0')\n",
      "300 tensor(0.1091, device='cuda:0')\n",
      "Iteration: 72 | Loss: 0.12064085155725479 | Train,Test accuracy: 0.9673313498497009.3f%, 0.8436511158943176.3f%\n",
      "0 tensor(0.0587, device='cuda:0')\n",
      "100 tensor(0.1334, device='cuda:0')\n",
      "200 tensor(0.1279, device='cuda:0')\n",
      "300 tensor(0.0683, device='cuda:0')\n",
      "Iteration: 73 | Loss: 0.12160734087228775 | Train,Test accuracy: 0.9663483500480652.3f%, 0.8500791192054749.3f%\n",
      "0 tensor(0.0329, device='cuda:0')\n",
      "100 tensor(0.1073, device='cuda:0')\n",
      "200 tensor(0.0660, device='cuda:0')\n",
      "300 tensor(0.1223, device='cuda:0')\n",
      "Iteration: 74 | Loss: 0.12149234861135483 | Train,Test accuracy: 0.9613970518112183.3f%, 0.8364319801330566.3f%\n",
      "0 tensor(0.1346, device='cuda:0')\n",
      "100 tensor(0.0390, device='cuda:0')\n",
      "200 tensor(0.1642, device='cuda:0')\n",
      "300 tensor(0.1285, device='cuda:0')\n",
      "Iteration: 75 | Loss: 0.11888726055622101 | Train,Test accuracy: 0.9660845994949341.3f%, 0.8499802350997925.3f%\n",
      "0 tensor(0.0637, device='cuda:0')\n",
      "100 tensor(0.1383, device='cuda:0')\n",
      "200 tensor(0.1878, device='cuda:0')\n",
      "300 tensor(0.1451, device='cuda:0')\n",
      "Iteration: 76 | Loss: 0.1194959208369255 | Train,Test accuracy: 0.9681185483932495.3f%, 0.8479034900665283.3f%\n",
      "0 tensor(0.1130, device='cuda:0')\n",
      "100 tensor(0.1313, device='cuda:0')\n",
      "200 tensor(0.1302, device='cuda:0')\n",
      "300 tensor(0.1021, device='cuda:0')\n",
      "Iteration: 77 | Loss: 0.11594841629266739 | Train,Test accuracy: 0.9666000604629517.3f%, 0.8486946225166321.3f%\n",
      "0 tensor(0.1287, device='cuda:0')\n",
      "100 tensor(0.0995, device='cuda:0')\n",
      "200 tensor(0.1180, device='cuda:0')\n",
      "300 tensor(0.1131, device='cuda:0')\n",
      "Iteration: 78 | Loss: 0.11528903990983963 | Train,Test accuracy: 0.9647858142852783.3f%, 0.842563271522522.3f%\n",
      "0 tensor(0.1174, device='cuda:0')\n",
      "100 tensor(0.1796, device='cuda:0')\n",
      "200 tensor(0.0989, device='cuda:0')\n",
      "300 tensor(0.1331, device='cuda:0')\n",
      "Iteration: 79 | Loss: 0.11717347800731659 | Train,Test accuracy: 0.963515043258667.3f%, 0.8407832384109497.3f%\n",
      "0 tensor(0.0692, device='cuda:0')\n",
      "100 tensor(0.1273, device='cuda:0')\n",
      "200 tensor(0.1594, device='cuda:0')\n",
      "300 tensor(0.1730, device='cuda:0')\n",
      "Iteration: 80 | Loss: 0.11308786273002625 | Train,Test accuracy: 0.9622882604598999.3f%, 0.8459256291389465.3f%\n",
      "0 tensor(0.1089, device='cuda:0')\n",
      "100 tensor(0.0541, device='cuda:0')\n",
      "200 tensor(0.0680, device='cuda:0')\n",
      "300 tensor(0.1096, device='cuda:0')\n",
      "Iteration: 81 | Loss: 0.12177310883998871 | Train,Test accuracy: 0.9660086631774902.3f%, 0.8459256291389465.3f%\n",
      "0 tensor(0.1013, device='cuda:0')\n",
      "100 tensor(0.0428, device='cuda:0')\n",
      "200 tensor(0.0655, device='cuda:0')\n",
      "300 tensor(0.0661, device='cuda:0')\n",
      "Iteration: 82 | Loss: 0.06634362041950226 | Train,Test accuracy: 0.9847306609153748.3f%, 0.8590783476829529.3f%\n",
      "0 tensor(0.0471, device='cuda:0')\n",
      "100 tensor(0.0583, device='cuda:0')\n",
      "200 tensor(0.0099, device='cuda:0')\n",
      "300 tensor(0.0662, device='cuda:0')\n",
      "Iteration: 83 | Loss: 0.04995349794626236 | Train,Test accuracy: 0.9861932396888733.3f%, 0.8577927350997925.3f%\n",
      "0 tensor(0.0443, device='cuda:0')\n",
      "100 tensor(0.0618, device='cuda:0')\n",
      "200 tensor(0.0507, device='cuda:0')\n",
      "300 tensor(0.1259, device='cuda:0')\n",
      "Iteration: 84 | Loss: 0.0475645437836647 | Train,Test accuracy: 0.9845308661460876.3f%, 0.8560126423835754.3f%\n",
      "0 tensor(0.0643, device='cuda:0')\n",
      "100 tensor(0.0601, device='cuda:0')\n",
      "200 tensor(0.0466, device='cuda:0')\n",
      "300 tensor(0.0522, device='cuda:0')\n",
      "Iteration: 85 | Loss: 0.05013248696923256 | Train,Test accuracy: 0.9838115572929382.3f%, 0.8518591523170471.3f%\n",
      "0 tensor(0.0087, device='cuda:0')\n",
      "100 tensor(0.0252, device='cuda:0')\n",
      "200 tensor(0.0455, device='cuda:0')\n",
      "300 tensor(0.1065, device='cuda:0')\n",
      "Iteration: 86 | Loss: 0.04987291246652603 | Train,Test accuracy: 0.9831921458244324.3f%, 0.8493868708610535.3f%\n",
      "0 tensor(0.0512, device='cuda:0')\n",
      "100 tensor(0.0394, device='cuda:0')\n",
      "200 tensor(0.0434, device='cuda:0')\n",
      "300 tensor(0.0211, device='cuda:0')\n",
      "Iteration: 87 | Loss: 0.0493948720395565 | Train,Test accuracy: 0.9828644394874573.3f%, 0.8592761158943176.3f%\n",
      "0 tensor(0.0936, device='cuda:0')\n",
      "100 tensor(0.0598, device='cuda:0')\n",
      "200 tensor(0.0348, device='cuda:0')\n",
      "300 tensor(0.0506, device='cuda:0')\n",
      "Iteration: 88 | Loss: 0.04955730587244034 | Train,Test accuracy: 0.9851222634315491.3f%, 0.8530458807945251.3f%\n",
      "0 tensor(0.0544, device='cuda:0')\n",
      "100 tensor(0.1065, device='cuda:0')\n",
      "200 tensor(0.1003, device='cuda:0')\n",
      "300 tensor(0.0154, device='cuda:0')\n",
      "Iteration: 89 | Loss: 0.05069981515407562 | Train,Test accuracy: 0.9843510389328003.3f%, 0.8487935066223145.3f%\n",
      "0 tensor(0.0436, device='cuda:0')\n",
      "100 tensor(0.0342, device='cuda:0')\n",
      "200 tensor(0.0798, device='cuda:0')\n",
      "300 tensor(0.0247, device='cuda:0')\n",
      "Iteration: 90 | Loss: 0.05343973636627197 | Train,Test accuracy: 0.9832001328468323.3f%, 0.8548259735107422.3f%\n",
      "0 tensor(0.0243, device='cuda:0')\n",
      "100 tensor(0.0750, device='cuda:0')\n",
      "200 tensor(0.0589, device='cuda:0')\n",
      "300 tensor(0.0299, device='cuda:0')\n",
      "Iteration: 91 | Loss: 0.05387293919920921 | Train,Test accuracy: 0.9854899644851685.3f%, 0.8538370132446289.3f%\n",
      "0 tensor(0.0337, device='cuda:0')\n",
      "100 tensor(0.0896, device='cuda:0')\n",
      "200 tensor(0.1057, device='cuda:0')\n",
      "300 tensor(0.0528, device='cuda:0')\n",
      "Iteration: 92 | Loss: 0.05136014148592949 | Train,Test accuracy: 0.9843230247497559.3f%, 0.8517602682113647.3f%\n",
      "0 tensor(0.0294, device='cuda:0')\n",
      "100 tensor(0.0519, device='cuda:0')\n",
      "200 tensor(0.0224, device='cuda:0')\n",
      "300 tensor(0.0588, device='cuda:0')\n",
      "Iteration: 93 | Loss: 0.049435898661613464 | Train,Test accuracy: 0.9852221608161926.3f%, 0.8592761158943176.3f%\n",
      "0 tensor(0.0480, device='cuda:0')\n",
      "100 tensor(0.0063, device='cuda:0')\n",
      "200 tensor(0.0634, device='cuda:0')\n",
      "300 tensor(0.0424, device='cuda:0')\n",
      "Iteration: 94 | Loss: 0.0542776994407177 | Train,Test accuracy: 0.9842031598091125.3f%, 0.8516613841056824.3f%\n",
      "0 tensor(0.0498, device='cuda:0')\n",
      "100 tensor(0.0079, device='cuda:0')\n",
      "200 tensor(0.0301, device='cuda:0')\n",
      "300 tensor(0.0750, device='cuda:0')\n",
      "Iteration: 95 | Loss: 0.04755368083715439 | Train,Test accuracy: 0.9853420257568359.3f%, 0.8544303774833679.3f%\n",
      "0 tensor(0.0916, device='cuda:0')\n",
      "100 tensor(0.0331, device='cuda:0')\n",
      "200 tensor(0.0596, device='cuda:0')\n",
      "300 tensor(0.0374, device='cuda:0')\n",
      "Iteration: 96 | Loss: 0.05156093090772629 | Train,Test accuracy: 0.9851022958755493.3f%, 0.8614517450332642.3f%\n",
      "0 tensor(0.0945, device='cuda:0')\n",
      "100 tensor(0.0620, device='cuda:0')\n",
      "200 tensor(0.0305, device='cuda:0')\n",
      "300 tensor(0.0461, device='cuda:0')\n",
      "Iteration: 97 | Loss: 0.048189856112003326 | Train,Test accuracy: 0.9838514924049377.3f%, 0.8585838675498962.3f%\n",
      "0 tensor(0.1031, device='cuda:0')\n",
      "100 tensor(0.0575, device='cuda:0')\n",
      "200 tensor(0.0387, device='cuda:0')\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "300 tensor(0.0312, device='cuda:0')\n",
      "Iteration: 98 | Loss: 0.05257264897227287 | Train,Test accuracy: 0.9845427870750427.3f%, 0.855617105960846.3f%\n",
      "0 tensor(0.0593, device='cuda:0')\n",
      "100 tensor(0.1132, device='cuda:0')\n",
      "200 tensor(0.0415, device='cuda:0')\n",
      "300 tensor(0.0172, device='cuda:0')\n",
      "Iteration: 99 | Loss: 0.05008157342672348 | Train,Test accuracy: 0.9840952754020691.3f%, 0.8534414768218994.3f%\n",
      "0 tensor(0.0330, device='cuda:0')\n",
      "100 tensor(0.0566, device='cuda:0')\n",
      "200 tensor(0.0697, device='cuda:0')\n",
      "300 tensor(0.0335, device='cuda:0')\n",
      "Iteration: 100 | Loss: 0.053936414420604706 | Train,Test accuracy: 0.9858136177062988.3f%, 0.8534414768218994.3f%\n",
      "0 tensor(0.0210, device='cuda:0')\n",
      "100 tensor(0.0586, device='cuda:0')\n",
      "200 tensor(0.0553, device='cuda:0')\n",
      "300 tensor(0.1396, device='cuda:0')\n",
      "Iteration: 101 | Loss: 0.04991893470287323 | Train,Test accuracy: 0.9864929914474487.3f%, 0.8519580960273743.3f%\n",
      "0 tensor(0.0243, device='cuda:0')\n",
      "100 tensor(0.0949, device='cuda:0')\n",
      "200 tensor(0.0131, device='cuda:0')\n",
      "300 tensor(0.0175, device='cuda:0')\n",
      "Iteration: 102 | Loss: 0.050475094467401505 | Train,Test accuracy: 0.983491837978363.3f%, 0.8534414768218994.3f%\n",
      "0 tensor(0.0264, device='cuda:0')\n",
      "100 tensor(0.0440, device='cuda:0')\n",
      "200 tensor(0.0566, device='cuda:0')\n",
      "300 tensor(0.0417, device='cuda:0')\n",
      "Iteration: 103 | Loss: 0.05536965653300285 | Train,Test accuracy: 0.9855618476867676.3f%, 0.8572982549667358.3f%\n",
      "0 tensor(0.0413, device='cuda:0')\n",
      "100 tensor(0.0707, device='cuda:0')\n",
      "200 tensor(0.0320, device='cuda:0')\n",
      "300 tensor(0.0649, device='cuda:0')\n",
      "Iteration: 104 | Loss: 0.05079928785562515 | Train,Test accuracy: 0.9820332527160645.3f%, 0.8404865264892578.3f%\n",
      "0 tensor(0.0175, device='cuda:0')\n",
      "100 tensor(0.0560, device='cuda:0')\n",
      "200 tensor(0.0676, device='cuda:0')\n",
      "300 tensor(0.0103, device='cuda:0')\n",
      "Iteration: 105 | Loss: 0.04996856674551964 | Train,Test accuracy: 0.9834238886833191.3f%, 0.8535403609275818.3f%\n",
      "0 tensor(0.0525, device='cuda:0')\n",
      "100 tensor(0.0491, device='cuda:0')\n",
      "200 tensor(0.0969, device='cuda:0')\n",
      "300 tensor(0.0221, device='cuda:0')\n",
      "Iteration: 106 | Loss: 0.05118275433778763 | Train,Test accuracy: 0.9840872883796692.3f%, 0.8544303774833679.3f%\n",
      "0 tensor(0.0100, device='cuda:0')\n",
      "100 tensor(0.0182, device='cuda:0')\n",
      "200 tensor(0.0426, device='cuda:0')\n",
      "300 tensor(0.0257, device='cuda:0')\n",
      "Iteration: 107 | Loss: 0.05185829848051071 | Train,Test accuracy: 0.9847825765609741.3f%, 0.8518591523170471.3f%\n",
      "0 tensor(0.0152, device='cuda:0')\n",
      "100 tensor(0.0493, device='cuda:0')\n",
      "200 tensor(0.0784, device='cuda:0')\n",
      "300 tensor(0.0285, device='cuda:0')\n",
      "Iteration: 108 | Loss: 0.05128544941544533 | Train,Test accuracy: 0.9861612319946289.3f%, 0.8544303774833679.3f%\n",
      "0 tensor(0.0933, device='cuda:0')\n",
      "100 tensor(0.0122, device='cuda:0')\n",
      "200 tensor(0.0430, device='cuda:0')\n",
      "300 tensor(0.0476, device='cuda:0')\n",
      "Iteration: 109 | Loss: 0.04926787689328194 | Train,Test accuracy: 0.9855338931083679.3f%, 0.8583860993385315.3f%\n",
      "0 tensor(0.0184, device='cuda:0')\n",
      "100 tensor(0.0346, device='cuda:0')\n",
      "200 tensor(0.0196, device='cuda:0')\n",
      "300 tensor(0.0849, device='cuda:0')\n",
      "Iteration: 110 | Loss: 0.04865703731775284 | Train,Test accuracy: 0.9849104881286621.3f%, 0.8522547483444214.3f%\n",
      "0 tensor(0.0124, device='cuda:0')\n",
      "100 tensor(0.0442, device='cuda:0')\n",
      "200 tensor(0.0582, device='cuda:0')\n",
      "300 tensor(0.0818, device='cuda:0')\n",
      "Iteration: 111 | Loss: 0.05177057161927223 | Train,Test accuracy: 0.985529899597168.3f%, 0.8588805198669434.3f%\n",
      "0 tensor(0.0372, device='cuda:0')\n",
      "100 tensor(0.0568, device='cuda:0')\n",
      "200 tensor(0.1279, device='cuda:0')\n",
      "300 tensor(0.0657, device='cuda:0')\n",
      "Iteration: 112 | Loss: 0.0507141649723053 | Train,Test accuracy: 0.9848745465278625.3f%, 0.8518591523170471.3f%\n",
      "0 tensor(0.0981, device='cuda:0')\n",
      "100 tensor(0.0615, device='cuda:0')\n",
      "200 tensor(0.0429, device='cuda:0')\n",
      "300 tensor(0.0381, device='cuda:0')\n",
      "Iteration: 113 | Loss: 0.05203668400645256 | Train,Test accuracy: 0.9844110012054443.3f%, 0.8564082384109497.3f%\n",
      "0 tensor(0.0272, device='cuda:0')\n",
      "100 tensor(0.0403, device='cuda:0')\n",
      "200 tensor(0.0677, device='cuda:0')\n",
      "300 tensor(0.0625, device='cuda:0')\n",
      "Iteration: 114 | Loss: 0.05236676335334778 | Train,Test accuracy: 0.9833999276161194.3f%, 0.8583860993385315.3f%\n",
      "0 tensor(0.0815, device='cuda:0')\n",
      "100 tensor(0.0390, device='cuda:0')\n",
      "200 tensor(0.0597, device='cuda:0')\n",
      "300 tensor(0.0394, device='cuda:0')\n",
      "Iteration: 115 | Loss: 0.049463387578725815 | Train,Test accuracy: 0.9855618476867676.3f%, 0.8528481125831604.3f%\n",
      "0 tensor(0.0538, device='cuda:0')\n",
      "100 tensor(0.1190, device='cuda:0')\n",
      "200 tensor(0.0218, device='cuda:0')\n",
      "300 tensor(0.0540, device='cuda:0')\n",
      "Iteration: 116 | Loss: 0.051679711788892746 | Train,Test accuracy: 0.9863170981407166.3f%, 0.8569027185440063.3f%\n",
      "0 tensor(0.0728, device='cuda:0')\n",
      "100 tensor(0.0701, device='cuda:0')\n",
      "200 tensor(0.0743, device='cuda:0')\n",
      "300 tensor(0.1501, device='cuda:0')\n",
      "Iteration: 117 | Loss: 0.048461250960826874 | Train,Test accuracy: 0.9823848605155945.3f%, 0.8432555198669434.3f%\n",
      "0 tensor(0.0676, device='cuda:0')\n",
      "100 tensor(0.0551, device='cuda:0')\n",
      "200 tensor(0.0554, device='cuda:0')\n",
      "300 tensor(0.1032, device='cuda:0')\n",
      "Iteration: 118 | Loss: 0.052138715982437134 | Train,Test accuracy: 0.9863530993461609.3f%, 0.8559137582778931.3f%\n",
      "0 tensor(0.0751, device='cuda:0')\n",
      "100 tensor(0.0146, device='cuda:0')\n",
      "200 tensor(0.0499, device='cuda:0')\n",
      "300 tensor(0.0281, device='cuda:0')\n",
      "Iteration: 119 | Loss: 0.05077066272497177 | Train,Test accuracy: 0.9843429923057556.3f%, 0.8545292615890503.3f%\n",
      "0 tensor(0.0331, device='cuda:0')\n",
      "100 tensor(0.0403, device='cuda:0')\n",
      "200 tensor(0.0366, device='cuda:0')\n",
      "300 tensor(0.0538, device='cuda:0')\n",
      "Iteration: 120 | Loss: 0.05211425572633743 | Train,Test accuracy: 0.9842430949211121.3f%, 0.8546281456947327.3f%\n",
      "0 tensor(0.0205, device='cuda:0')\n",
      "100 tensor(0.0451, device='cuda:0')\n",
      "200 tensor(0.0474, device='cuda:0')\n",
      "300 tensor(0.0754, device='cuda:0')\n",
      "Iteration: 121 | Loss: 0.05430443957448006 | Train,Test accuracy: 0.9857416749000549.3f%, 0.8544303774833679.3f%\n",
      "0 tensor(0.0788, device='cuda:0')\n",
      "100 tensor(0.0380, device='cuda:0')\n",
      "200 tensor(0.0676, device='cuda:0')\n",
      "300 tensor(0.0597, device='cuda:0')\n",
      "Iteration: 122 | Loss: 0.04867756739258766 | Train,Test accuracy: 0.9849104881286621.3f%, 0.8501780033111572.3f%\n",
      "0 tensor(0.0277, device='cuda:0')\n",
      "100 tensor(0.0219, device='cuda:0')\n",
      "200 tensor(0.0152, device='cuda:0')\n",
      "300 tensor(0.0737, device='cuda:0')\n",
      "Iteration: 123 | Loss: 0.048635389655828476 | Train,Test accuracy: 0.9842430949211121.3f%, 0.8595727682113647.3f%\n",
      "0 tensor(0.0355, device='cuda:0')\n",
      "100 tensor(0.0322, device='cuda:0')\n",
      "200 tensor(0.0566, device='cuda:0')\n",
      "300 tensor(0.1004, device='cuda:0')\n",
      "Iteration: 124 | Loss: 0.05513441562652588 | Train,Test accuracy: 0.985002338886261.3f%, 0.8541337251663208.3f%\n",
      "0 tensor(0.0293, device='cuda:0')\n",
      "100 tensor(0.0355, device='cuda:0')\n",
      "200 tensor(0.0426, device='cuda:0')\n",
      "300 tensor(0.0915, device='cuda:0')\n",
      "Iteration: 125 | Loss: 0.04964165389537811 | Train,Test accuracy: 0.9836236834526062.3f%, 0.8524525165557861.3f%\n",
      "0 tensor(0.0589, device='cuda:0')\n",
      "100 tensor(0.0217, device='cuda:0')\n",
      "200 tensor(0.0719, device='cuda:0')\n",
      "300 tensor(0.0567, device='cuda:0')\n",
      "Iteration: 126 | Loss: 0.05646113306283951 | Train,Test accuracy: 0.9863091707229614.3f%, 0.8608583807945251.3f%\n",
      "0 tensor(0.0226, device='cuda:0')\n",
      "100 tensor(0.1213, device='cuda:0')\n",
      "200 tensor(0.0221, device='cuda:0')\n",
      "300 tensor(0.0369, device='cuda:0')\n",
      "Iteration: 127 | Loss: 0.054350849241018295 | Train,Test accuracy: 0.9865808486938477.3f%, 0.8595727682113647.3f%\n",
      "0 tensor(0.0301, device='cuda:0')\n",
      "100 tensor(0.0284, device='cuda:0')\n",
      "200 tensor(0.0285, device='cuda:0')\n",
      "300 tensor(0.0623, device='cuda:0')\n",
      "Iteration: 128 | Loss: 0.048566535115242004 | Train,Test accuracy: 0.9838355183601379.3f%, 0.853342592716217.3f%\n",
      "0 tensor(0.0414, device='cuda:0')\n",
      "100 tensor(0.0570, device='cuda:0')\n",
      "200 tensor(0.0903, device='cuda:0')\n",
      "300 tensor(0.0489, device='cuda:0')\n",
      "Iteration: 129 | Loss: 0.04962329566478729 | Train,Test accuracy: 0.9849024415016174.3f%, 0.8510680198669434.3f%\n",
      "0 tensor(0.0867, device='cuda:0')\n",
      "100 tensor(0.0623, device='cuda:0')\n",
      "200 tensor(0.0230, device='cuda:0')\n",
      "300 tensor(0.0095, device='cuda:0')\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Iteration: 130 | Loss: 0.05286867544054985 | Train,Test accuracy: 0.9820332527160645.3f%, 0.8536392450332642.3f%\n",
      "0 tensor(0.0389, device='cuda:0')\n",
      "100 tensor(0.0463, device='cuda:0')\n",
      "200 tensor(0.0182, device='cuda:0')\n",
      "300 tensor(0.1154, device='cuda:0')\n",
      "Iteration: 131 | Loss: 0.05282042548060417 | Train,Test accuracy: 0.9833838939666748.3f%, 0.8594738841056824.3f%\n",
      "0 tensor(0.0428, device='cuda:0')\n",
      "100 tensor(0.0438, device='cuda:0')\n",
      "200 tensor(0.0188, device='cuda:0')\n",
      "300 tensor(0.0647, device='cuda:0')\n",
      "Iteration: 132 | Loss: 0.05032088980078697 | Train,Test accuracy: 0.9847426414489746.3f%, 0.8573971390724182.3f%\n",
      "0 tensor(0.0496, device='cuda:0')\n",
      "100 tensor(0.0118, device='cuda:0')\n",
      "200 tensor(0.0906, device='cuda:0')\n",
      "300 tensor(0.0878, device='cuda:0')\n",
      "Iteration: 133 | Loss: 0.05243371054530144 | Train,Test accuracy: 0.9821251034736633.3f%, 0.8558148741722107.3f%\n",
      "0 tensor(0.0720, device='cuda:0')\n",
      "100 tensor(0.0241, device='cuda:0')\n",
      "200 tensor(0.0378, device='cuda:0')\n",
      "300 tensor(0.0291, device='cuda:0')\n",
      "Iteration: 134 | Loss: 0.0519622303545475 | Train,Test accuracy: 0.9855178594589233.3f%, 0.8571004867553711.3f%\n",
      "0 tensor(0.0072, device='cuda:0')\n",
      "100 tensor(0.0391, device='cuda:0')\n",
      "200 tensor(0.0890, device='cuda:0')\n",
      "300 tensor(0.0197, device='cuda:0')\n",
      "Iteration: 135 | Loss: 0.048015519976615906 | Train,Test accuracy: 0.9833359718322754.3f%, 0.8574960231781006.3f%\n",
      "0 tensor(0.0783, device='cuda:0')\n",
      "100 tensor(0.0876, device='cuda:0')\n",
      "200 tensor(0.0785, device='cuda:0')\n",
      "300 tensor(0.0948, device='cuda:0')\n",
      "Iteration: 136 | Loss: 0.052523210644721985 | Train,Test accuracy: 0.9849424362182617.3f%, 0.859968364238739.3f%\n",
      "0 tensor(0.0546, device='cuda:0')\n",
      "100 tensor(0.0679, device='cuda:0')\n",
      "200 tensor(0.0527, device='cuda:0')\n",
      "300 tensor(0.0140, device='cuda:0')\n",
      "Iteration: 137 | Loss: 0.05159846693277359 | Train,Test accuracy: 0.9834319353103638.3f%, 0.857594907283783.3f%\n",
      "0 tensor(0.0355, device='cuda:0')\n",
      "100 tensor(0.0999, device='cuda:0')\n",
      "200 tensor(0.0607, device='cuda:0')\n",
      "300 tensor(0.0458, device='cuda:0')\n",
      "Iteration: 138 | Loss: 0.052241001278162 | Train,Test accuracy: 0.9870124459266663.3f%, 0.8567048907279968.3f%\n",
      "0 tensor(0.0602, device='cuda:0')\n",
      "100 tensor(0.0193, device='cuda:0')\n",
      "200 tensor(0.0787, device='cuda:0')\n",
      "300 tensor(0.0470, device='cuda:0')\n",
      "Iteration: 139 | Loss: 0.04921931028366089 | Train,Test accuracy: 0.984231173992157.3f%, 0.8525514006614685.3f%\n",
      "0 tensor(0.0505, device='cuda:0')\n",
      "100 tensor(0.0315, device='cuda:0')\n",
      "200 tensor(0.0530, device='cuda:0')\n",
      "300 tensor(0.0724, device='cuda:0')\n",
      "Iteration: 140 | Loss: 0.04865355044603348 | Train,Test accuracy: 0.9856697916984558.3f%, 0.8506724834442139.3f%\n",
      "0 tensor(0.0724, device='cuda:0')\n",
      "100 tensor(0.0392, device='cuda:0')\n",
      "200 tensor(0.0267, device='cuda:0')\n",
      "300 tensor(0.0156, device='cuda:0')\n",
      "Iteration: 141 | Loss: 0.05040649324655533 | Train,Test accuracy: 0.9828364849090576.3f%, 0.8566060066223145.3f%\n",
      "0 tensor(0.0913, device='cuda:0')\n",
      "100 tensor(0.0117, device='cuda:0')\n",
      "200 tensor(0.0065, device='cuda:0')\n",
      "300 tensor(0.0192, device='cuda:0')\n",
      "Iteration: 142 | Loss: 0.02931545116007328 | Train,Test accuracy: 0.9946730732917786.3f%, 0.8672863841056824.3f%\n",
      "0 tensor(0.0043, device='cuda:0')\n",
      "100 tensor(0.0204, device='cuda:0')\n",
      "200 tensor(0.0231, device='cuda:0')\n",
      "300 tensor(0.0776, device='cuda:0')\n",
      "Iteration: 143 | Loss: 0.018080227077007294 | Train,Test accuracy: 0.9958239793777466.3f%, 0.8678797483444214.3f%\n",
      "0 tensor(0.0238, device='cuda:0')\n",
      "100 tensor(0.0048, device='cuda:0')\n",
      "200 tensor(0.0159, device='cuda:0')\n",
      "300 tensor(0.0133, device='cuda:0')\n",
      "Iteration: 144 | Loss: 0.014279049821197987 | Train,Test accuracy: 0.9967591166496277.3f%, 0.868967592716217.3f%\n",
      "0 tensor(0.0059, device='cuda:0')\n",
      "100 tensor(0.0063, device='cuda:0')\n",
      "200 tensor(0.0045, device='cuda:0')\n",
      "300 tensor(0.0046, device='cuda:0')\n",
      "Iteration: 145 | Loss: 0.012358453124761581 | Train,Test accuracy: 0.9965433478355408.3f%, 0.8664952516555786.3f%\n",
      "0 tensor(0.0019, device='cuda:0')\n",
      "100 tensor(0.0041, device='cuda:0')\n",
      "200 tensor(0.0027, device='cuda:0')\n",
      "300 tensor(0.0340, device='cuda:0')\n",
      "Iteration: 146 | Loss: 0.011495385318994522 | Train,Test accuracy: 0.9975623488426208.3f%, 0.868967592716217.3f%\n",
      "0 tensor(0.0036, device='cuda:0')\n",
      "100 tensor(0.0071, device='cuda:0')\n",
      "200 tensor(0.0239, device='cuda:0')\n",
      "300 tensor(0.0079, device='cuda:0')\n",
      "Iteration: 147 | Loss: 0.009654407389461994 | Train,Test accuracy: 0.9972905516624451.3f%, 0.8684731125831604.3f%\n",
      "0 tensor(0.0231, device='cuda:0')\n",
      "100 tensor(0.0052, device='cuda:0')\n",
      "200 tensor(0.0034, device='cuda:0')\n",
      "300 tensor(0.0068, device='cuda:0')\n",
      "Iteration: 148 | Loss: 0.009506581351161003 | Train,Test accuracy: 0.9977222084999084.3f%, 0.8697587251663208.3f%\n",
      "0 tensor(0.0036, device='cuda:0')\n",
      "100 tensor(0.0037, device='cuda:0')\n",
      "200 tensor(0.0080, device='cuda:0')\n",
      "300 tensor(0.0085, device='cuda:0')\n",
      "Iteration: 149 | Loss: 0.008159025572240353 | Train,Test accuracy: 0.9975623488426208.3f%, 0.8674841523170471.3f%\n",
      "0 tensor(0.0592, device='cuda:0')\n",
      "100 tensor(0.0183, device='cuda:0')\n",
      "200 tensor(0.0020, device='cuda:0')\n",
      "300 tensor(0.0031, device='cuda:0')\n",
      "Iteration: 150 | Loss: 0.007647613529115915 | Train,Test accuracy: 0.9978820085525513.3f%, 0.866594135761261.3f%\n",
      "0 tensor(0.0024, device='cuda:0')\n",
      "100 tensor(0.0025, device='cuda:0')\n",
      "200 tensor(0.0018, device='cuda:0')\n",
      "300 tensor(0.0105, device='cuda:0')\n",
      "Iteration: 151 | Loss: 0.007896623574197292 | Train,Test accuracy: 0.9980098605155945.3f%, 0.8700553774833679.3f%\n",
      "0 tensor(0.0022, device='cuda:0')\n",
      "100 tensor(0.0066, device='cuda:0')\n",
      "200 tensor(0.0113, device='cuda:0')\n",
      "300 tensor(0.0026, device='cuda:0')\n",
      "Iteration: 152 | Loss: 0.007725658360868692 | Train,Test accuracy: 0.9977501034736633.3f%, 0.8690664768218994.3f%\n",
      "0 tensor(0.0011, device='cuda:0')\n",
      "100 tensor(0.0016, device='cuda:0')\n",
      "200 tensor(0.0035, device='cuda:0')\n",
      "300 tensor(0.0130, device='cuda:0')\n",
      "Iteration: 153 | Loss: 0.007649260573089123 | Train,Test accuracy: 0.9977900981903076.3f%, 0.8699564933776855.3f%\n",
      "0 tensor(0.0006, device='cuda:0')\n",
      "100 tensor(0.0011, device='cuda:0')\n",
      "200 tensor(0.0027, device='cuda:0')\n",
      "300 tensor(0.0093, device='cuda:0')\n",
      "Iteration: 154 | Loss: 0.007163956295698881 | Train,Test accuracy: 0.9979220032691956.3f%, 0.8701542615890503.3f%\n",
      "0 tensor(0.0194, device='cuda:0')\n",
      "100 tensor(0.0025, device='cuda:0')\n",
      "200 tensor(0.0328, device='cuda:0')\n",
      "300 tensor(0.0004, device='cuda:0')\n",
      "Iteration: 155 | Loss: 0.007855166681110859 | Train,Test accuracy: 0.9973825216293335.3f%, 0.8686708807945251.3f%\n",
      "0 tensor(0.0013, device='cuda:0')\n",
      "100 tensor(0.0035, device='cuda:0')\n",
      "200 tensor(0.0010, device='cuda:0')\n",
      "300 tensor(0.0035, device='cuda:0')\n",
      "Iteration: 156 | Loss: 0.007151004858314991 | Train,Test accuracy: 0.9977821111679077.3f%, 0.8691653609275818.3f%\n",
      "0 tensor(0.0004, device='cuda:0')\n",
      "100 tensor(0.0008, device='cuda:0')\n",
      "200 tensor(0.0062, device='cuda:0')\n",
      "300 tensor(0.0006, device='cuda:0')\n",
      "Iteration: 157 | Loss: 0.00816000159829855 | Train,Test accuracy: 0.9972506165504456.3f%, 0.8711432218551636.3f%\n",
      "0 tensor(0.0094, device='cuda:0')\n",
      "100 tensor(0.0028, device='cuda:0')\n",
      "200 tensor(0.0081, device='cuda:0')\n",
      "300 tensor(0.0342, device='cuda:0')\n",
      "Iteration: 158 | Loss: 0.007877795957028866 | Train,Test accuracy: 0.9978820085525513.3f%, 0.8701542615890503.3f%\n",
      "0 tensor(0.0017, device='cuda:0')\n",
      "100 tensor(0.0006, device='cuda:0')\n",
      "200 tensor(0.0047, device='cuda:0')\n",
      "300 tensor(0.0023, device='cuda:0')\n",
      "Iteration: 159 | Loss: 0.0069506107829511166 | Train,Test accuracy: 0.9977821111679077.3f%, 0.8701542615890503.3f%\n",
      "0 tensor(0.0303, device='cuda:0')\n",
      "100 tensor(0.0037, device='cuda:0')\n",
      "200 tensor(0.0022, device='cuda:0')\n",
      "300 tensor(0.0052, device='cuda:0')\n",
      "Iteration: 160 | Loss: 0.0072236028499901295 | Train,Test accuracy: 0.9983815550804138.3f%, 0.8667919039726257.3f%\n",
      "0 tensor(0.0128, device='cuda:0')\n",
      "100 tensor(0.0064, device='cuda:0')\n",
      "200 tensor(0.0076, device='cuda:0')\n",
      "300 tensor(0.0024, device='cuda:0')\n",
      "Iteration: 161 | Loss: 0.006903031375259161 | Train,Test accuracy: 0.9978820085525513.3f%, 0.8675830960273743.3f%\n",
      "0 tensor(0.0014, device='cuda:0')\n",
      "100 tensor(0.0027, device='cuda:0')\n",
      "200 tensor(0.0009, device='cuda:0')\n",
      "300 tensor(0.0024, device='cuda:0')\n",
      "Iteration: 162 | Loss: 0.007585871033370495 | Train,Test accuracy: 0.9979099631309509.3f%, 0.8682753443717957.3f%\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 tensor(0.0013, device='cuda:0')\n",
      "100 tensor(0.0147, device='cuda:0')\n",
      "200 tensor(0.0061, device='cuda:0')\n",
      "300 tensor(0.0017, device='cuda:0')\n",
      "Iteration: 163 | Loss: 0.007735142949968576 | Train,Test accuracy: 0.9977021813392639.3f%, 0.8688686490058899.3f%\n",
      "0 tensor(0.0028, device='cuda:0')\n",
      "100 tensor(0.0006, device='cuda:0')\n",
      "200 tensor(0.0034, device='cuda:0')\n",
      "300 tensor(0.0005, device='cuda:0')\n",
      "Iteration: 164 | Loss: 0.006307836156338453 | Train,Test accuracy: 0.9980019330978394.3f%, 0.8663963675498962.3f%\n",
      "0 tensor(0.0008, device='cuda:0')\n",
      "100 tensor(0.0129, device='cuda:0')\n",
      "200 tensor(0.0016, device='cuda:0')\n",
      "300 tensor(0.0040, device='cuda:0')\n",
      "Iteration: 165 | Loss: 0.007146948017179966 | Train,Test accuracy: 0.9984415173530579.3f%, 0.871835470199585.3f%\n",
      "0 tensor(0.0015, device='cuda:0')\n",
      "100 tensor(0.0184, device='cuda:0')\n",
      "200 tensor(0.0149, device='cuda:0')\n",
      "300 tensor(0.0014, device='cuda:0')\n",
      "Iteration: 166 | Loss: 0.006230125669389963 | Train,Test accuracy: 0.9982816576957703.3f%, 0.8660996556282043.3f%\n",
      "0 tensor(0.0095, device='cuda:0')\n",
      "100 tensor(0.0137, device='cuda:0')\n",
      "200 tensor(0.0007, device='cuda:0')\n",
      "300 tensor(0.0015, device='cuda:0')\n",
      "Iteration: 167 | Loss: 0.008125276304781437 | Train,Test accuracy: 0.9976702332496643.3f%, 0.8669897317886353.3f%\n",
      "0 tensor(0.0018, device='cuda:0')\n",
      "100 tensor(0.0349, device='cuda:0')\n",
      "200 tensor(0.0151, device='cuda:0')\n",
      "300 tensor(0.0331, device='cuda:0')\n",
      "Iteration: 168 | Loss: 0.007183344569057226 | Train,Test accuracy: 0.9986013174057007.3f%, 0.8661985993385315.3f%\n",
      "0 tensor(0.0082, device='cuda:0')\n",
      "100 tensor(0.0012, device='cuda:0')\n",
      "200 tensor(0.0111, device='cuda:0')\n",
      "300 tensor(0.0120, device='cuda:0')\n",
      "Iteration: 169 | Loss: 0.007305528968572617 | Train,Test accuracy: 0.9979619383811951.3f%, 0.8652096390724182.3f%\n",
      "0 tensor(0.0066, device='cuda:0')\n",
      "100 tensor(0.0066, device='cuda:0')\n",
      "200 tensor(0.0043, device='cuda:0')\n",
      "300 tensor(0.0008, device='cuda:0')\n",
      "Iteration: 170 | Loss: 0.006744915619492531 | Train,Test accuracy: 0.99830162525177.3f%, 0.8680775165557861.3f%\n",
      "0 tensor(0.0021, device='cuda:0')\n",
      "100 tensor(0.0098, device='cuda:0')\n",
      "200 tensor(0.0029, device='cuda:0')\n",
      "300 tensor(0.0035, device='cuda:0')\n",
      "Iteration: 171 | Loss: 0.006335947662591934 | Train,Test accuracy: 0.9982816576957703.3f%, 0.8676819801330566.3f%\n",
      "0 tensor(0.0059, device='cuda:0')\n",
      "100 tensor(0.0026, device='cuda:0')\n",
      "200 tensor(0.0318, device='cuda:0')\n",
      "300 tensor(0.0020, device='cuda:0')\n",
      "Iteration: 172 | Loss: 0.007136533036828041 | Train,Test accuracy: 0.9978300333023071.3f%, 0.8626384735107422.3f%\n",
      "0 tensor(0.0126, device='cuda:0')\n",
      "100 tensor(0.0036, device='cuda:0')\n",
      "200 tensor(0.0008, device='cuda:0')\n",
      "300 tensor(0.0015, device='cuda:0')\n",
      "Iteration: 173 | Loss: 0.0064928289502859116 | Train,Test accuracy: 0.9983416199684143.3f%, 0.8644185066223145.3f%\n",
      "0 tensor(0.0068, device='cuda:0')\n",
      "100 tensor(0.0031, device='cuda:0')\n",
      "200 tensor(0.0020, device='cuda:0')\n",
      "300 tensor(0.0008, device='cuda:0')\n",
      "Iteration: 174 | Loss: 0.0066260118037462234 | Train,Test accuracy: 0.9982216954231262.3f%, 0.8619462251663208.3f%\n",
      "0 tensor(0.0227, device='cuda:0')\n",
      "100 tensor(0.0013, device='cuda:0')\n",
      "200 tensor(0.0013, device='cuda:0')\n",
      "300 tensor(0.0013, device='cuda:0')\n",
      "Iteration: 175 | Loss: 0.006580490153282881 | Train,Test accuracy: 0.9983215928077698.3f%, 0.8651107549667358.3f%\n",
      "0 tensor(0.0012, device='cuda:0')\n",
      "100 tensor(0.0057, device='cuda:0')\n",
      "200 tensor(0.0186, device='cuda:0')\n",
      "300 tensor(0.0119, device='cuda:0')\n",
      "Iteration: 176 | Loss: 0.006124137435108423 | Train,Test accuracy: 0.9984415173530579.3f%, 0.8674841523170471.3f%\n",
      "0 tensor(0.0043, device='cuda:0')\n",
      "100 tensor(0.0080, device='cuda:0')\n",
      "200 tensor(0.0009, device='cuda:0')\n",
      "300 tensor(0.0014, device='cuda:0')\n",
      "Iteration: 177 | Loss: 0.00643379520624876 | Train,Test accuracy: 0.9981018304824829.3f%, 0.8627373576164246.3f%\n",
      "0 tensor(0.0107, device='cuda:0')\n",
      "100 tensor(0.0052, device='cuda:0')\n",
      "200 tensor(0.0020, device='cuda:0')\n",
      "300 tensor(0.0010, device='cuda:0')\n",
      "Iteration: 178 | Loss: 0.005717102903872728 | Train,Test accuracy: 0.9978620409965515.3f%, 0.8678797483444214.3f%\n",
      "0 tensor(0.0057, device='cuda:0')\n",
      "100 tensor(0.0008, device='cuda:0')\n",
      "200 tensor(0.0006, device='cuda:0')\n",
      "300 tensor(0.0012, device='cuda:0')\n",
      "Iteration: 179 | Loss: 0.006996474228799343 | Train,Test accuracy: 0.9986812472343445.3f%, 0.868967592716217.3f%\n",
      "0 tensor(0.0077, device='cuda:0')\n",
      "100 tensor(0.0009, device='cuda:0')\n",
      "200 tensor(0.0106, device='cuda:0')\n",
      "300 tensor(0.0007, device='cuda:0')\n",
      "Iteration: 180 | Loss: 0.006947373505681753 | Train,Test accuracy: 0.9982616901397705.3f%, 0.8706487417221069.3f%\n",
      "0 tensor(0.0012, device='cuda:0')\n",
      "100 tensor(0.0010, device='cuda:0')\n",
      "200 tensor(0.0033, device='cuda:0')\n",
      "300 tensor(0.0004, device='cuda:0')\n",
      "Iteration: 181 | Loss: 0.00633002957329154 | Train,Test accuracy: 0.9978620409965515.3f%, 0.8702531456947327.3f%\n",
      "0 tensor(0.0008, device='cuda:0')\n",
      "100 tensor(0.0024, device='cuda:0')\n",
      "200 tensor(0.0042, device='cuda:0')\n",
      "300 tensor(0.0164, device='cuda:0')\n",
      "Iteration: 182 | Loss: 0.0076082320883870125 | Train,Test accuracy: 0.9980098605155945.3f%, 0.8681764006614685.3f%\n",
      "0 tensor(0.0074, device='cuda:0')\n",
      "100 tensor(0.0037, device='cuda:0')\n",
      "200 tensor(0.0029, device='cuda:0')\n",
      "300 tensor(0.0062, device='cuda:0')\n",
      "Iteration: 183 | Loss: 0.006935884710401297 | Train,Test accuracy: 0.997762143611908.3f%, 0.8681764006614685.3f%\n",
      "0 tensor(0.0142, device='cuda:0')\n",
      "100 tensor(0.0154, device='cuda:0')\n",
      "200 tensor(0.0049, device='cuda:0')\n",
      "300 tensor(0.0015, device='cuda:0')\n",
      "Iteration: 184 | Loss: 0.006899609230458736 | Train,Test accuracy: 0.998241662979126.3f%, 0.8669897317886353.3f%\n",
      "0 tensor(0.0014, device='cuda:0')\n",
      "100 tensor(0.0246, device='cuda:0')\n",
      "200 tensor(0.0012, device='cuda:0')\n",
      "300 tensor(0.0008, device='cuda:0')\n",
      "Iteration: 185 | Loss: 0.006973450072109699 | Train,Test accuracy: 0.9983295798301697.3f%, 0.8678797483444214.3f%\n",
      "0 tensor(0.0011, device='cuda:0')\n",
      "100 tensor(0.0026, device='cuda:0')\n",
      "200 tensor(0.0038, device='cuda:0')\n",
      "300 tensor(0.0014, device='cuda:0')\n",
      "Iteration: 186 | Loss: 0.006328115239739418 | Train,Test accuracy: 0.9982017278671265.3f%, 0.8727254867553711.3f%\n",
      "0 tensor(0.0017, device='cuda:0')\n",
      "100 tensor(0.0044, device='cuda:0')\n",
      "200 tensor(0.0005, device='cuda:0')\n",
      "300 tensor(0.0183, device='cuda:0')\n",
      "Iteration: 187 | Loss: 0.006698484532535076 | Train,Test accuracy: 0.9978420734405518.3f%, 0.8656052350997925.3f%\n",
      "0 tensor(0.0019, device='cuda:0')\n",
      "100 tensor(0.0297, device='cuda:0')\n",
      "200 tensor(0.0272, device='cuda:0')\n",
      "300 tensor(0.0041, device='cuda:0')\n",
      "Iteration: 188 | Loss: 0.007148502394556999 | Train,Test accuracy: 0.9982017278671265.3f%, 0.8685719966888428.3f%\n",
      "0 tensor(0.0005, device='cuda:0')\n",
      "100 tensor(0.0015, device='cuda:0')\n",
      "200 tensor(0.0032, device='cuda:0')\n",
      "300 tensor(0.0058, device='cuda:0')\n",
      "Iteration: 189 | Loss: 0.006339447572827339 | Train,Test accuracy: 0.997822105884552.3f%, 0.8691653609275818.3f%\n",
      "0 tensor(0.0038, device='cuda:0')\n",
      "100 tensor(0.0056, device='cuda:0')\n",
      "200 tensor(0.0509, device='cuda:0')\n",
      "300 tensor(0.0021, device='cuda:0')\n",
      "Iteration: 190 | Loss: 0.006523753050714731 | Train,Test accuracy: 0.9981018304824829.3f%, 0.8675830960273743.3f%\n",
      "0 tensor(0.0141, device='cuda:0')\n",
      "100 tensor(0.0060, device='cuda:0')\n",
      "200 tensor(0.0013, device='cuda:0')\n",
      "300 tensor(0.0015, device='cuda:0')\n",
      "Iteration: 191 | Loss: 0.005712644662708044 | Train,Test accuracy: 0.9979898929595947.3f%, 0.8684731125831604.3f%\n",
      "0 tensor(0.0012, device='cuda:0')\n",
      "100 tensor(0.0201, device='cuda:0')\n",
      "200 tensor(0.0193, device='cuda:0')\n",
      "300 tensor(0.0035, device='cuda:0')\n",
      "Iteration: 192 | Loss: 0.00668451888486743 | Train,Test accuracy: 0.9975783228874207.3f%, 0.8667919039726257.3f%\n",
      "0 tensor(0.0020, device='cuda:0')\n",
      "100 tensor(0.0011, device='cuda:0')\n",
      "200 tensor(0.0006, device='cuda:0')\n",
      "300 tensor(0.0014, device='cuda:0')\n",
      "Iteration: 193 | Loss: 0.00719740055501461 | Train,Test accuracy: 0.9978620409965515.3f%, 0.8660996556282043.3f%\n",
      "0 tensor(0.0034, device='cuda:0')\n",
      "100 tensor(0.0052, device='cuda:0')\n",
      "200 tensor(0.0006, device='cuda:0')\n",
      "300 tensor(0.0007, device='cuda:0')\n",
      "Iteration: 194 | Loss: 0.005806194618344307 | Train,Test accuracy: 0.9982216954231262.3f%, 0.866594135761261.3f%\n",
      "0 tensor(0.0015, device='cuda:0')\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "100 tensor(0.0470, device='cuda:0')\n",
      "200 tensor(0.0010, device='cuda:0')\n",
      "300 tensor(0.0009, device='cuda:0')\n",
      "Iteration: 195 | Loss: 0.007358235772699118 | Train,Test accuracy: 0.997822105884552.3f%, 0.8658030033111572.3f%\n",
      "0 tensor(0.0029, device='cuda:0')\n",
      "100 tensor(0.0009, device='cuda:0')\n",
      "200 tensor(0.0453, device='cuda:0')\n",
      "300 tensor(0.0022, device='cuda:0')\n",
      "Iteration: 196 | Loss: 0.007463912013918161 | Train,Test accuracy: 0.9977821111679077.3f%, 0.8674841523170471.3f%\n",
      "0 tensor(0.0051, device='cuda:0')\n",
      "100 tensor(0.0099, device='cuda:0')\n",
      "200 tensor(0.0074, device='cuda:0')\n",
      "300 tensor(0.0059, device='cuda:0')\n",
      "Iteration: 197 | Loss: 0.007066397462040186 | Train,Test accuracy: 0.9978500604629517.3f%, 0.8672863841056824.3f%\n",
      "0 tensor(0.0079, device='cuda:0')\n",
      "100 tensor(0.0039, device='cuda:0')\n",
      "200 tensor(0.0027, device='cuda:0')\n",
      "300 tensor(0.0091, device='cuda:0')\n",
      "Iteration: 198 | Loss: 0.007193475030362606 | Train,Test accuracy: 0.9980019330978394.3f%, 0.8658030033111572.3f%\n",
      "0 tensor(0.0027, device='cuda:0')\n",
      "100 tensor(0.0172, device='cuda:0')\n",
      "200 tensor(0.0016, device='cuda:0')\n",
      "300 tensor(0.0101, device='cuda:0')\n",
      "Iteration: 199 | Loss: 0.0063530635088682175 | Train,Test accuracy: 0.9983615875244141.3f%, 0.8653085231781006.3f%\n",
      "0 tensor(0.0054, device='cuda:0')\n",
      "100 tensor(0.0196, device='cuda:0')\n",
      "200 tensor(0.0029, device='cuda:0')\n",
      "300 tensor(0.0009, device='cuda:0')\n",
      "Iteration: 200 | Loss: 0.006094716489315033 | Train,Test accuracy: 0.9980418682098389.3f%, 0.8632317781448364.3f%\n",
      "==> Finished Training ...\n"
     ]
    }
   ],
   "source": [
    "# net = DNNCifar(args=args).to(args.device)\n",
    "\n",
    "criterion = nn.CrossEntropyLoss()\n",
    "optimizer = optim.Adam(net.parameters(), lr=0.001, weight_decay=3e-4)\n",
    "\n",
    "# optimizer = optim.SGD(net.parameters(), lr=0.05, momentum=0.9, weight_decay=0.0001)\n",
    "\n",
    "train_accuracy_qXsquare = []\n",
    "train_loss_qXsquare = []\n",
    "test_accuracy_qXsquare  = []\n",
    "test_loss_qXsquare  = []\n",
    "\n",
    "\n",
    "for epoch in range(200):\n",
    "    \n",
    "    if epoch <= 80:\n",
    "        cur_lr = 0.001\n",
    "    elif epoch <= 140:\n",
    "        cur_lr = 0.0005\n",
    "    else:    \n",
    "        cur_lr = 0.0001\n",
    "#     else:\n",
    "#         cur_lr = 0.0004\n",
    "    \n",
    "    for g in optimizer.param_groups:\n",
    "        g['lr'] = cur_lr\n",
    "        \n",
    "    running_loss = 0.0\n",
    "    for i, data in enumerate(trainloader, 0):\n",
    "        # get the inputs\n",
    "        inputs, labels = data\n",
    "\n",
    "        if args.gpu:\n",
    "            inputs = inputs.cuda()\n",
    "            labels = labels.cuda()\n",
    "\n",
    "        # wrap them in Variable\n",
    "        inputs, labels = Variable(inputs), Variable(labels)\n",
    "\n",
    "        # zero the parameter gradients\n",
    "        optimizer.zero_grad()\n",
    "\n",
    "        # forward + backward + optimize\n",
    "        outputs = net(inputs)\n",
    "        loss = criterion(outputs, labels)\n",
    "        loss.backward()\n",
    "\n",
    "        if epoch > 16:\n",
    "            for group in optimizer.param_groups:\n",
    "                for p in group['params']:\n",
    "                    state = optimizer.state[p]\n",
    "                    if state['step'] >= 1024:\n",
    "                        state['step'] = 1000\n",
    "        optimizer.step()\n",
    "\n",
    "\n",
    "        # print statistics\n",
    "        if i % 100 == 0:\n",
    "            print(i,loss.data)\n",
    "        running_loss += loss.data\n",
    "\n",
    "    # Normalizing the loss by the total number of train batches\n",
    "    running_loss /= len(trainloader)\n",
    "\n",
    "    # Calculate training/test set accuracy of the existing model\n",
    "    test_loss, test_accuracy = validation(net, testloader, criterion)\n",
    "    train_loss, train_accuracy = validation(net, trainloader, criterion)\n",
    "\n",
    "    print(\"Iteration: {0} | Loss: {1} |\".format(epoch+1, running_loss),\n",
    "          \"Train,Test accuracy: {0}.3f%, {1}.3f%\".format(train_accuracy/len(trainloader), test_accuracy/len(testloader)) )\n",
    "    \n",
    "    train_accuracy_qXsquare.append(train_accuracy/len(trainloader))\n",
    "    train_loss_qXsquare.append(train_loss)\n",
    "    \n",
    "    test_accuracy_qXsquare.append(test_accuracy/len(testloader))\n",
    "    test_loss_qXsquare.append(test_loss)\n",
    "    \n",
    "    # Specify a path\n",
    "    PATH = \"./save_models/CIFAR10_VGG11_xsq_E200_iter\"+str(epoch)+\"_v1.pt\"\n",
    "    torch.save(net.state_dict(), PATH)\n",
    "\n",
    "    # save model\n",
    "#     if epoch % 50 == 0:\n",
    "#         print('==> Saving model ...')\n",
    "#         state = {\n",
    "#             'net': net.module if opt.is_gpu else net,\n",
    "#             'epoch': epoch,\n",
    "#         }\n",
    "#         if not os.path.isdir('checkpoint'):\n",
    "#             os.mkdir('checkpoint')\n",
    "#         torch.save(state, '../checkpoint/ckpt.t7')\n",
    "\n",
    "print('==> Finished Training ...')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pickle\n",
    "\n",
    "filehandler = open(\"./plot/CIFAR10_VGG11_BN_ReLU_train\",\"wb\")\n",
    "pickle.dump(train_accuracy_Relu,filehandler)\n",
    "filehandler = open(\"./plot/CIFAR10_VGG11_BN_ReLU_test\",\"wb\")\n",
    "pickle.dump(test_accuracy_Relu,filehandler)\n",
    "\n",
    "filehandler = open(\"./plot/CIFAR10_VGG11_BN_Xsq2_train\",\"wb\")\n",
    "pickle.dump(train_accuracy_qXsquare2,filehandler)\n",
    "filehandler = open(\"./plot/CIFAR10_VGG11_BN_Xsq2_test\",\"wb\")\n",
    "pickle.dump(test_accuracy_qXsquare2,filehandler)\n",
    "\n",
    "filehandler = open(\"./plot/CIFAR10_VGG11_BN_Xsq_train\",\"wb\")\n",
    "pickle.dump(train_accuracy_qXsquare,filehandler)\n",
    "filehandler = open(\"./plot/CIFAR10_VGG11_BN_Xsq_test\",\"wb\")\n",
    "pickle.dump(test_accuracy_qXsquare,filehandler)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "tensor(0.8493) tensor(0.8712)\n",
      "tensor(0.8461) tensor(0.8652)\n",
      "tensor(0.8437) tensor(0.8632)\n"
     ]
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAYUAAAEKCAYAAAD9xUlFAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4xLjMsIGh0dHA6Ly9tYXRwbG90bGliLm9yZy+AADFEAAAgAElEQVR4nOydeXxN1/r/3/ucnJzM8yCDWQhJJIIqig4uGq6qSzWtmorSakuraEvTUdOitD8t33vV1IG2lGqLtnq5VWoojUhEJGYSIvN0kpzh+f1xklMRIVFz9/v1Oq/svfbaaz17b9az9xo+jyIiqKioqKioAGhutAEqKioqKjcPqlNQUVFRUbGhOgUVFRUVFRuqU1BRUVFRsaE6BRUVFRUVG6pTUFFRUVGxcc2cgqIoixVFyVIUJem8NC9FUX5SFCWt8q9nZfrdiqIUKIqSUPl75VrZpaKioqJSO9fyS2Ep0OeCtGnAzyISAvxcuV/FVhGJqvy9fg3tUlFRUVGphWvmFETkFyD3guQHgGWV28uAAdeqfhUVFRWV+mN3nevzF5FMABHJVBTF77xjnRVF2QdkAJNFJPliBSiKMhYYC+Do6Ni+YcOGV2SIxWJBo7k5h1RuVttUu+rHzWoX3Ly2qXbVjyu169ChQ9ki4nvRgyJyzX5AEyDpvP38C47nVf51A1wqt2OAtLqU3759e7lSNm/efMXnXmtuVttUu+rHzWqXyM1rm2pX/bhSu4DfpZZ29Xq7vrOKogQAVP7NAhCRQhEprtxeD+gURfG5zrapqKio/O253k5hHTC8cns48A2AoigNFEVRKrfvqLQr5zrbpqKiovK355qNKSiKsgK4G/BRFOUUEAfEA18qivI4cAIYXJl9EDBeURQTYAAervzEUVFRUVG5jlwzpyAisbUcuu8ieecD869GvUajkVOnTlFWVnbJfO7u7qSkpFyNKq86N6ttt6JdDg4OBAcHo9PprrNVKiq3Jtd79tE159SpU7i6utKkSRMqe6QuSlFREa6urtfRsrpzs9p2q9klIuTk5HDq1CmaNm16AyxTUbn1uPnmWP1FysrK8Pb2vqRDUPl7oCgK3t7el/1qVFFR+ZPbzikAqkNQsaH+W1BRqR+3pVNQUVFRUbkyVKdwlcnJySEqKoqoqCgaNGhAUFCQbb+ioqJOZYwfP57U1NR6111UVIS3tzfFxcXV0vv168fXX38NwPr16+nYsSOhoaFERUURGxvLqVOnAGsf/OzZswkNDaVt27ZERkYyefJkzGYzAHFxcQQHB+Ph4VGt/M2bN9OuXTvs7OxYu3ZtrfZNnz7ddj/atGnDl19+edlrmj59OvPmzauWlp6eTlRU1GXzqaio1B/VKVxlvL29SUhIICEhgXHjxjFp0iTbvr29PWBtfC0WS61lLFiwgFatWtW7bldXV+69916++eYbW1peXh47d+4kJiaGffv2MXHiRD799FMOHjzIH3/8wZAhQzh+/DgAH374IZs3b2bnzp0kJiaya9cuvLy8KC8vByAmJoYdO3bUqLdJkyYsX76chx566LI2vvDCCyQkJPD1118zZswYm8NRUVG5OVCdwnUiPT2d8PBwxo0bR3R0NJmZmYwdO5YOHToQFhbG66//KQzbq1cvEhISMJlMeHh4MG3aNCIjI+ncuTNZWVmXrCc2NpaVK1fa9levXk3fvn1xcHAgPj6eGTNm2ByOoigMGDCArl27AjBz5kwWLlyIu7s7AHq9npdeegknJycAOnXqRIMGDWrU2bRpUyIiIuqlwRIaGopOp6OgoACAtLQ0evfuTfv27enevTuHDh2qc1kqKipXj9tuSur5TJw4kYSEhIseM5vNaLXaepcZFRV1xd0UBw4cYMmSJSxcuBCA+Ph4vLy8MJlM3HPPPQwaNIg2bdpUO6egoIAePXoQHx/Pc889x+LFi5k2bdrFigegb9++PPHEE+Tl5eHp6cnKlSt54YUXAEhOTmb69OkXPS8vLw+j0ciVCgzWl927dxMeHo6XlxcAY8eOZdGiRTRv3pxt27YxYcIEfvzxx+tii4qKyp+oXwrXkebNm9OxY0fb/ooVK4iOjiY6OpqUlBQOHDhQ4xxHR0fuv/9+ANq3b8+xY8cuWYder6dv3758/fXXnD17luTkZO67r8Z6QbKysoiKiiIkJIR58+Zx4QLy9evXExUVRePGjdm1a9cVXO3FmTVrFi1btqRLly68+uqrAOTn57Njxw7+9a9/ERUVxVNPPUVGRkatZdQ2o0idaaSi8te5rb8ULvVGfyMWYjk7O9u209LSeP/999m1axceHh4MHTr0ovPpq8YhALRaLSaT6bL1xMbGMnv2bAwGAwMHDsTOzvqYw8LC2Lt3L2FhYfj5+ZGQkEB8fDzFxcV4eXlhZ2fHiRMnaNSoETExMcTExNCnT586D5BfyLRp09i4cSN2dnb8/vvvgHVMYeLEiXz55ZcMGzaMtLQ0RAQfH59av+ouxNvbm7y8vGppubm5tG7d+orsVFFR+RP1S+EGUVhYiKurK25ubmRmZvLDDz/U6/xVq1YxY8aMix7r2bMnycnJLFy4kNjYP9VGpkyZwuuvv15tZlNpaalt+8UXX2T8+PG2fn4R+UsLv+Lj40lISLA5hPN56KGHiIiI4NNPP8XT05OAgADWrFkDWDXi9+3bV2u5Hh4eeHp68r///Q+wzvj68ccfbWMjKioqV47qFG4Q0dHRtGnThvDwcMaMGVPvBi09PR03N7eLHtNqtTz44IMUFhZWK7ddu3a89957PPLII7Rq1YquXbuSnp7Oww8/DMDTTz9N9+7d6dixI23btqVr16506tSJyMhIwOo0mjRpQmFhIcHBwbz55psA/PbbbwQHB7NmzRpGjx5N27Zt63QNr7zyCnPmzEFEWLlyJQsXLiQyMpKwsDC+++47W75XX32V4OBggoODadKkCQCffvopr7zyClFRUfTv358333zTdkxFReUvUFughVvhd7EgOwcOHKhTkInCwsI65bsR1MW2hx9+WLKzs6+DNX9ys96zy9lV138TV5ubNTCLyM1rm2pX/bgWQXZu6zGF25kVK1bcaBNUVFRuQ9TuIxUVFRUVG6pTUFFRUVGxoToFFRUVFRUbqlNQUVFRUbGhOgUVFRUVFRuqU7jKXA3pbIDFixdz5syZOudPT0+ncePGNeQqwsPD2bt3LwDLli0jIiKCsLAwIiMjGTt2rG2hmtFoZNq0abRo0YKoqCjatWtHfHy8rZzhw4fTtGnTGpLVX3zxBW3atEGj0VxyRfLQoUNt50dGRrJ58+bLXtPQoUNrSHFv2rSJAQMGVEsbPXr0JSW7VVRU6o7qFK4ydZHOrgv1dQotWrTAz8+P7du329KSk5MxGo1ER0fz3XffMX/+fH744QeSk5PZu3cvd9xxB+fOnQOsC9POnTtHcnIyCQkJ/PLLLzbJbIBRo0bx1Vdf1ag3IiKCtWvX0qVLl8vaOHfuXBISEpg9ezZPPvlkna9NRUXl+qGuU7iOLFu2jA8//JCKigq6dOnC/PnzsVgsjBw5koSEBESEsWPH4ubmRkJCAkOGDMHR0ZFdu3bVyaFUyWZXrWJesWKFTebirbfe4r333iMwMBCwrnoePXo0YNWBWrZsGceOHUOv1wPW2AxxcXG2snv06HHRL4ELVV3rQufOnTl9+rRtf/fu3UyePJni4mL8/PxYunQp/v7+9S5XRUXlr3PbO4W77777ounnS2f369ePyZMn2/KPGDGCESNGkJ2dzaBBg6qdt2XLliuyIykpiTVr1rB9+3bs7OwYO3YsK1eupHnz5mRnZ7N//37Aqhiq1WpZtGgR8+fPr9FdcymGDBlCx44dmTdvHlqtli+++IJvv/0WsMp2R0dHX/S8tLQ0mjRpUk2w71qyceNGWxdQeXk5zz77LOvWrcPHx4fPPvuMGTNm8O9///u62KKiolKd294p3Cxs2rSJ3bt306FDBwAMBgMNGzakd+/epKam8uyzzxITE0OvXr1qhNOsK0FBQbRs2ZItW7bg7u6Oq6sroaGhNfIlJCQwYsQICgsLmTVrFk2bNq12vMohZWdns3v3bgICAq7InguZNGkSkyZNIjs72ybHnZKSQnJyMj179gSszjo4OLjWMlTZbBWVa8tt7xRqe7OvTTr7/Pw+Pj5X/GVwISLCqFGjeOONN2ocS0xMZMOGDXzwwQesXr2aOXPmXHE9VV1I7u7u1RRS27Rpw969e+nWrRtRUVG2MQ+DwUBISAhHjx6lpKQEZ2dnRo8ezejRowkNDb3icJnDhg0jMTGRRo0asW7dOsA6pvDPf/6TuXPnMmLECHbu3ImI0LZtW7Zu3Vqnci8mm52Xl4ePj88V2amiolIddaD5OtGzZ0++/PJLsrOzAesspRMnTnDu3DlEhMGDB/Paa6/ZZgq5urpSVFRkO3/KlCm2rqBLMWjQIL799lu++uorhgwZYkt/8cUXee6556oFrzEYDLa6hg0bxjPPPGMbXDaZTBiNxiu+3uXLl5OQkGBzCFVotVqef/55SktL+fnnn2nTpg2nT5+2fTlUVFSQnJxca7mhoaEcP37cFq7z6NGjHDx4sM7KrCoqKpdGdQrXiYiICOLi4ujZsydt27alV69enD17lpMnT9K9e3eioqIYM2YMM2fOBGDkyJGMHj3aNpU1MTHxovGRL8Tb25v27dvTsGFDGjVqZEvv378/48ePp1evXoSFhdGlSxccHR1t3Tbx8fF4e3vTpk0b2rVrR48ePRg9erRtwHfw4MH06dOHAwcOEBwczNKlSwH46quvCA4OZvfu3fTu3Zu+ffte1kZFUZg+fTrvvvsuer2eVatW8dxzzxEZGUm7du3YuXOnLe/o0aNtstndunXDwcGB5cuX89hjjxEVFcWQIUP48MMPr3vAJBWV25ba5FP/6g9YDGQBSeeleQE/AWmVfz0r0xXgAyAdSASi61LH30U622KxSK9evW6QNX9ys94zVTq7/tystql21Y9rIZ19Lb8UlgJ9LkibBvwsIiHAz5X7APcDIZW/scCCa2jXLYeiKPWOzKaioqJyJVwzpyAivwC5FyQ/ACyr3F4GDDgvfXmlE9sBeCiKcnWmvKioqKio1JnrPabgLyKZAJV//SrTg4CT5+U7VZmmoqKi8pewWKrvFxXBeYv1L4uYLYip+iy8o0ehsPAKDDlxAi6QoqlBXh5kZMDp05CZefn8V5mbZUrqxSaZX/ROKIoyFmsXE/7+/jWmjLq7u1ebtVMbZrO5TvluBDerbbeqXWVlZVdtanF9KC4uviH11oUbYdupU44cOuSKr3sx2ekmck8InuVnKTgLGfke5Nl5Y+/myceBiVgKyjHmVaAtKaUTO9BbDBy1NCXM4yjl9s5sL4xG0Wk4VejFnnMtaWp/gla6dLAIbo5lWJwcSSlvwaGcQLKM3rjrS2jrnk6D8pN8U/APdBozEb7HyCxwp8TogAPltNUlYTDrSTSFY681gQLFZmeKLU7o6UJjXTpNHE5xxuzPvtLWADS3O0ZbXTKKVqFCo6eBcoYT5QEcqGhJqcUJndaEh5OBZm6ZSE4JmWXeNLdPQFwdybA0QG9vJkCXRRtTElkmHw4XBXKyvAGNOU5TjiIolLt6UOgbRH6xA0cKAsg1udPEKZMH7k6j/VjNVX+OilxDL6QoShPgOxEJr9xPBe4WkczK7qEtItJKUZT/q9xecWG+S5XfoUMH+f3336ulpaSk0Lp168vaVts6hZuBm9W2W9Wuuv6buNps2bKl1hX1N5rrYdvBAxbefyKZ/YngYCxks+FOLGhr5NNgJkiTiYcllwLcOYs/jhhwopQKRU+21FyD4koRdhjxUvLp5pnEEUtjjpYFoCiQU+6C2aIhjCQiXI4R7JxH9lkTvyg9OK404bFGv2DOziWhuAXNXLJwczGSVWZPckU4Tnro5H8cU0ExGE24O5lw9NWTmWMgp8iXI6VBOIiBIayk0MGTvZr2pJa3RismFEsFmUZfGjrnEu13GjdHExXZhZw5p3DQ3BKN1oTW7gyltACTEGg5jknsOUJzssUHB6WMpo4n8XLN4Wi+F/lGX3R2GvRmE/bmUjw0+TRxzCDAtYz0PC/u73qGjjN8r+g5KoqyR0Q6XOzY9f5SWAcMB+Ir/35zXvoERVFWAp2Agss5BBUVlZuTM2dg6jMGPvlKjz0h3OF8gCz7YCY338iQlglkOTelYUtHmrVzp8AvBI82gTg4B7N/cxpb/28mIU5OdBs+HF3r1uxMTyM1NZWyMiPOzuf45ZcSsrOzsLf/g6KifJydnWnZvj1hukNkZWWRmppKamoq6emH2Ws2cdqlAcOGDeNfEREUr32F/N924PjgQ/y8aRNp+/dzUHGl6MyfX5l2FXY4tmxP6plUysrKCHIP4ugfR7Fc0Ae1B6DMuu3i4oKhzGBb6Hm4woHWUf0o12j4/fffOWI6AoDGoqFRg0YcO3YMgEy9/jzRSU/KJJ+UUoFSq8Cll4MDSUlJeHh44OLmRtKJEySVACXWM6IiJwH9r/rzu2ZOQVGUFcDdgI+iKKeAOKzO4EtFUR4HTgCDK7OvB2KwTkktBUZeK7uuNTk5Odx3330AnDlzBq1Wi6+vL0Cdhe3Gjx/PjBkzaNWqVb3qLioqokmTJhw/fhwXFxdber9+/Rg1ahQDBw5k/fr1xMXFUVRUhIODA61bt2bWrFkEBwcjIsyZM4dFixZhb2+Poij84x//4J133kGr1RIXF8eXX35JcXEx+fn5tvI3b97Mc889x/79+1m1alUNaesqpk+fzpIlS/D19cVsNhMfH3/JdQ3Tp0/Hx8eHiRMn1us+qNxYnh5RxLc/2POC3Tyenx2A3zMPg6Ig0oiDB5uR9P33vPP99+yftx97e3siIyNxdHRkzZo1tjJa79gBWL/yLsTX1xcPDw88PDxITU1l9erVANjb2xMSEkJYWBgDBw6kYcOGrF+/njlz5vCu2YyjoyN33XUX77//PoGBgcycO5fU1FQCAwMZMmQImZmZbNiwgV9++YXBgwfj5ubG8ePHGTp0KGazmfDwcBRFsf2CgoIoKChg7dq1+Pr6Eh0djZubGytXruTHH3/E3t6esLAwnnzySYKDg+ncuTOBgYEsXrwYsK76379/P2lpaVgsFnx8fAgICCAwMNDWZuzdu5fXXnuNzMxMPl62jOLiYhITE4mKiuKOO+4gKSnp6j/A2uaq3gq/m32dQlxcnMyaNatGusViEbPZXOt5f8W2QYMGyaeffmrbz83NFR8fHzEYDJKQkCAhISFy8OBBmx1r1qyRX3/9VURE/t//+38SExMj+fn5IiJSVlYmb731lpSUlIiIyE8//SQnT54Ud3f3anUeOXJEEhMTJTY2VtasWVOrbS+//LLMnTtXRET2798vPj4+YrFY6pT/UqjrFOrPtbStseMZecT+S5Hdu0VEJD8/XyZPnizNmjUTrGOFEhERIU888YSMHDlSQkJCxNnZWeLi4uTzzz+XjRs3SlBQkISGhsonn3wiW7dulV27dsn+/ftt/xbPJz8/XwoLC8VkMl3Unvz8fNmwYYOcOnVKRETOnTsnBoOhXtd0sz7La7FO4WYZaL7tSU9PZ8CAAdx1113s3LmT7777ziZrYTAYGDJkCK+88goAvXr1YsGCBYSHh+Pj48O4cePYsGEDTk5OfPPNN/j5+dVaT2xsLEuWLOHRRx8FYPXq1fTt2xcHBwfi4+OrfYEoilLtrX7mzJns3LkTd3d3APR6PS+99JLteKdOnXB0dKxRZ5WgnkZT98ls4eHhiAh5eXkUFBQwatQocnJy8Pf3Z8mSJdVE8VJTU3nssceqiegNHz7ctq9y81CQZ+G4wZ9xHbVI+/ZsWL+e8ePHc/r0afr06cMLL7xATExMtdX2ABaLBY1GYxvrOHbsGFqttk5Ch1X/Xi91vE+fP5dMqTpZl+b2dgoTJ0It0cAczWbQ1hz0uixRUTBv3hWZc+DAAZYsWcLChQsBq7SEl5cXJpOJe+65h0GDBtWIT1BQUECPHj2Ij4/nueeeY/HixUybNu1ixQPQt29fnnjiCfLy8vD09GTlypW88MILgDXozvTp0y96Xl5eHkajkYYNG17RtdWX7du34+DggJeXF48++iijR4/m0Ucf5d///jcTJ05k1apVtrytWrXCobJ/NTw8nCVLljBy5C3bw3hbs3/DKaARIe20dOvWjW3bthESEsK2bdvo1KlTredd+EJhZ3d7N003M6r20XWkefPmdOzY0ba/YsUKoqOjiY6OJiUlhQMHDtQ4x9HRkfvvvx+A9u3b2wapakOv19O3b1++/vprzp49S3Jysm2M43yysrKIiooiJCSEefPm1QjjuX79eqKiomjcuPFVfSOfNWsWUVFRTJ06lS+++AKAnTt38vDDDwPWftaLKaY+/vjjLFmyBJPJxFdffVVNAVbl5mH/D1bBxa//WM7u3btZuHAhSUlJl3QIKjcXt7c7vsQbveEGTK88P4hNWloa77//Prt27cLDw4OhQ4dSVlZW45zzB6a1Wi0mk+my9cTGxjJ79mwMBgMDBw60vXWFhYWxd+9ewsLC8PPzIyEhgfj4eIqLi/Hy8sLOzo4TJ07QqFEjYmJiiImJoU+fPvWKLX0+06ZNY+PGjdjZ2VE1dfiFF164ooHjwYMHM3PmTLp27Urnzp3x8PCodxlFReDkVI8PxMJC6yqnykG/+nDsGOzZ40GPHnC5HhDzT/+lYm8SjuOGw2W6QgBKSiArC5o2ta5rOnwYWrSou21JSbBpkx9OTnDHHXU/70LmzQNXV3j88T/TEn+vwIM8Pt/9NQsXLuSJJ5648gpUbgjql8INorCwEFdXV9zc3MjMzKy3ttGqVauYMWPGRY/17NmT5ORkFi5cWO2NesqUKbz++uukpqba0kpLS23bL774IuPHj6egoACwTkK4mKOqK/Hx8SQkJHDhWpILufPOO/nyyy8B+PTTT+nevXuNPE5OTtx7771MmDDhirqOFi+yEOhdxp3Nszh+/IKDR45gXL2O717ZSe6xymWqe/eyusnzxId8TPHZEn79cB/fjfsOc4WZzRO/4c3or1nyfxVUKqHbyMiAe++1NtiTJ0fx2RtHOLDPyMSJ562Azc2FhQth40a2/GymVUwz3KeN4x8+e5k3JplPllkYG3OSuW+XcWhPERL7CKxdS0UFPPkk+PtDy5Zw4PujvPXECUJC4J0e6+GTT8jNEZ54AoYMgTWrLZQ/9Bjl/Qfzx24TJhN8scJCRAS89VYbunaFbdugtBTOngVSUqyeE6ioAMnIhM8+Y+4sEz/++Of1FRTAzm0mJk2CMWOENWtg6lR4+21IPO5GE20KnTp1YuzYsfV+Tio3AbWNQN8Kv1tp9lFaWppERkbajlksFhk6dKi0bt1a+vbtKw888IB88sknIiJy5513yh9//CFGo7HaTJ8VK1bI448/LiIib7/9trz77ru11v3kk09Kw4YNa8zuWbdunURHR0vLli2lS5cuEhsbK2lpaTab4uPjJSQkRCIiIqRz584yZcoU27166qmnJCgoSBRFkaCgIHnjjTdERGT79u0SFBQkTk5O4u3tLRERERe1qbbZRIcPH5a7775bIiIipGfPnnLy5MmL5t+6das0atSoxsytyz3L3bsPCIh0Zpu4kS9u9qUyMuaMrJubLoaZ74lJ5yCxfCYgoqNchrqtlY80T4kGk4CIXlsh1ndyER9Ntm0bRDzczTK8x1Fpqjshkc6HxN+tRJydLfJ2m+XSla3iRr742OUKiExsvVEkOFgSNZHyCq9KmCZZQKQZ6TKx8w5p7XDYVq4LhbZtX87Ks8o8eaCt9fjIHofFzb5U7uMncaVA3MkTEGnPbmlgny12VIivzprmTp54kmM97n9CnCiRrmyVHR73SAvffPH3F/HzE3F1rJBDhIjZ21fmP/CDuDoZZYzzZ7KOftb7YmeW558XcbQ3SoB9trRRkqUBGRJOYrX7ocUod2o+kqeeeuqSz6Q2brdZPteaazH76IY37H/ld7M7hSulLrY9/PDDkp2dfR2s+ZMbfc/efvttefXVV2ukX86ubb/sFwdKxTx4iKQOflke5RNbQ+pAqTR1yhQQmRp7XJ5p+19x1JZZnUj7cvlv9zgZycfyH8cJ8tVj38g/7dbL7B7rpGDW/8ke2klPfhQniqW/63+ll/NWuYtfJDGglwjI//41WVwdyiWYE/IgX4sWowwI3iUgotFYpIeyRd5XnpViv6YiFRUiubmS3uafssehi5hffFnS3drJ/zFGhrQ/JFqMAiIfMEEE5A1luq2cpPc3yStTDPKPFoflfv0m+b3rM2J0cpMN9JbhDTfJYy13yFyeFR+ypIFDrmS8vVTy2raVBNqKm94g97U6KZ7kSKTTIenivl9ApDlpAiLO+goJs0+VDto9AiLd2SKt7a3HPpnwm6Q+MUcG6L6VH+kpd7K90smNkY8++uiKnvHt1vhea1SnoDqFG8qNtKtfv34SGRkpOTk5NY5dzq7/bUqQEFJFcnNFLBaR1FQpX7dRNsZtl+eGnJK+fS3y3nt/5j91SuS996zZ5cgRkagokXXrrAfP/0r53/9EFi4Uy2efixiN1rI//VTEy0vk0Udl83//K+npIlkrNkl2pxjxcqsQOzuRGTNEzp4VkUmTrP8FX375zzINBpGsLOv2kSMiP/0kIiJHD5bJ5g8SRRITRVJSpDg9U5o3F3n66Vou+uBBkeefF8nOFikvF1m8WAr2H5eq94jNmzaJxMaKCY0IyNrQqQJW05fNOSemFV9Kv56lAiJbvzgteZ5N5Sv+JcYu3aUkt0y2bLFebuUDEHn/fTn23PtyV8QRgYbyyy+/XPKZ1Mbt1vhea1SnoDqFG8qtatd/f9gn9+q3XidrxPrWb7HU+A974IC1rbaRlyfy7LOVHqL+lJef1zDXk82bN1vtnDtXqlr4X36pbkpZmdVmERH59VeRwYMva+usWbMEuKjzrrNdNyG3m12Xcgq39+wjFRXAJBoaul9HdVed7qLJNTT5PDyueM0LQB0UUy6NTmddy1NJt27VD+v159nctav1dxmSk5MJCAjAy8vrLxqncqNQZx+p3NaIgFk0BGS82y8AACAASURBVPvWQ0Bf5YpJSkoiLCzsRpuh8hdQnYLKbY2xQgCFho0uL5fwd6asrIwff/yxRlwKs9nMpEmTWLt27WXLsFgsHDhwgPDw8Gtlpsp1QHUKKrc1FaVGABqG6G+wJVeP3377jeHDh2M0GuuUPzMzk/79+3Ps2DEqKiqYMWMGOTk5mM1m3njjDXr37k2DBg3o3bu3TRKlirfeeot58+YxfPhwMjOtavbffPMN3bt3Z+nSpbbFlElJSbzwwguUlpaqXwq3OrUNNtwKv5txoDk7O1siIyMlMjJS/P39JTAw0LZfXl5eZ9s+/vhjyczMrHO9aWlp0qhRoxrrEsLCwmTPnj0iIrJ06VIJDw+XNm3aSNu2bWXMmDE2RdSKigqZOnWqNG/eXCIjIyUqKkrefvttWznDhg0Tb2/vamstRERWrlwprVu3FkVR5I8//qjVvkcffVSaNGkikZGREh0dLTt27Ljk9Tz66KOXVFw9n0s9y5zTpbJhwwFJ/L/tdSrranHixAmZNGlSrcqdF1JeXi7Tpk2TEydOXDKf0WiUNm3aCCBff/21iIhkZmbKzz//LGfPGwTOz8+XDz74QAoLC2X8+PECyCuvvCJr1qwRQB544AHbdkREhIwaNUr69u0rer1eTp8+LTNmzJB+/fqJoihy//33i16vl969e8u4ceMEEFdXVwGke/fukpCQIB4eHmJnZyedOnWSY8eOXfF9u90GdK816uyjW8ApnE9t0tmXo7CwULp27XrJRvZidOjQwSaDLSKSlJQkLVu2FBGRb7/9Vjp06CCnT58WERGTyST/+c9/bAvXnn/+eRk1apSUlZXZbDh/TcCWLVvkv//9bw2nkJycLKmpqZe19/xG/vvvv5d27dpd8lqullPIPFwsGzYckLzf0+tU1oVs27ZNGjduLPPnz79kvj179khubq6IiCQkJEhAQIAAMnPmTDGbzbJ582Z588035YsvvrioXPjatWsFkD59+ojRaJQlS5bYpJ7PZ+HChQKIXq+X+++/XxYsWGCTo+7Xr5+IiJjNZunfv78A0rVrV9HpdLbG/5FHHhFAHBwcpGPHjtK4cWMxGo0iInLw4EHbwsSq/LGxsVJcXCyvvfaaAKLT6eTxxx+X0tJS+fjjj0Wj0YhWqxUvLy85fPjwFd3j87ndGt9rjeoUbnGnsHTpUunYsaNERkbK+PHjxWw2i9FolKFDh0p4eLiEhYXJ+++/L0uWLBFnZ2dp2bJlvb4w5syZIxMmTLDtv/zyyxIXFyci1lXStc0dLywsFB8fHykuLr5k+X/88UcNp1BFfZxCUVGRuLq6ioi1Mb3jjjskIiJCBg4caPtyqcq/ceNGGTRokK2c9evXy+DBg2vYXxvHDxTJxg1JYjGUXfLajh8/Lvfee68kJSVVu153d3ext7cXQF566SUxGAyybds221v6uXPnbA1tUFCQTJkyRRwdHSU4OFg6dOggdnZ20q5dO1vDDUiPHj1kyJAh8uSTT8q6devEYrHIsGHDbMcjIyMFED8/P3n22WfFzc1NunTpIpMmTRIXFxfp1q2bzJgxQxRFEb1eLz179pSHH35YdDqd5OfnS3x8vAAyYMAAmwOZPHmybfvOO++01TV79uxq96HqnNdff71autlsluTkZNtLQxWff/65BAQEyE+V6yn+Krdb43utUZ3ClTiFHj0u+jPeddef++e/zffoIbJkiXX73Lma59aD853C/v375YEHHrC9lY0ZM0Y+++wz2bFjh/Tp08d2Tl5e3hV/KZw6dUoCAgJsXRYtWrSQlJQUERFxc3OrtdHfs2ePdOjQ4bLlXy2n8Pnnn0uXLl1ERKR169aydat1DcGLL74o48c/LwUFf+Y3m83SsmVL2+rtwYMHy/r1623lWiwiBQW1O4W0fcWyacO+y17b3LlzBZDGjRtLamqqfPHFF+Li4iLBwcGSnp4uI0aMEEDc3NxsDeprr70mbdq0EZ1OJ5MnT5aQkBBb10xGRoasXbtWgoODJTAwUJYsWSLZ2dnywQcfSJMmTWyBZQB59913xdPTUx555BFp27ataDQaefXVV23l9e/fXxo3biwajUYGDRokR48elWPHjomiKOLr6ytnzpyRbdu22Rp5BwcHGThwoFgsFlm+fLl89tlncvToUZvdGzdulLZt24qzs7Pk5eVVuw9nzpyRNWvWXDL40YXUJ+/luN0a32uNuk7hFmbTpk3s3r2bDh2ssbINBgMNGzakd+/epKam8uyzzxITE0OvXr0oLi6+ojqCgoJo2bIlW7Zswd3dHVdXV0JDQ2vkS0hIYMSIERQWFjJr1ixbkJwqFi1axPz588nOzmb37t0EBARckT0XMmnSJF599VX8/Pz4z3/+Q052NmVlZdx1110APPzwcGJjHyPzvOjcGo2GRx55hMWLP2fQoEfZs2cPK1asAMBigSOHhZISJ5o1teDqXnPehNGkQatYaqYbjSiKYlOQ3bJlC76+vpw7d84WhKhTp06sWrWK4OBglixZwrBhw1iwYAF33nknW7duJS4uDicnJ3766Sd69OhBXFwcBw4coGPHjiiKgru7O8nJydjb2+Pg4ADA008/zdNPPw1ARUUFDz74IFOnTkVEGDx4MLNnzyYjI4P27dvz/PPPk5mZSUhICEajkeLiYjw9PW3X8MknnxAaGoq/vz++vr4EBAQwdepUAN59910UReGxxx6z5W/Xrh3Hjh3j3nvv5aWXXqJZs2Y11Gb9/f1rDadaG3UJhKNy63D7O4UtWy6aXKt09vn5fXxqPb++iAijRo3ijTfeqHEsMTGRDRs28MEHH7B69WrmzJlzxfXExsaycuVK3N3dqymktmnThr1799KtWzeioqJISEhg3LhxGAwGQkJCOHr0KCUlJTg7OzN69GhGjx5NaGioLRh5fRk2bBiJiYk0atSIdevWATB37lxbg1NeVE5B0h9QUUHh8Vx0fp6cO2c9t6REELEqciYmwr33jmLcuH+RlQX33vsQJpMWRRHSUowUGXTYYyY1TUewVyn+TZ2qSVVXWOyw0wqZmZns3LmTlJQU9u7dy4YNGygvL6d9+/asWbOGrVu3MmDAACZMmMCvv/6Kn58fAwYMQK//c9bSPffcwz333APAk08+yWuvvUb//v3p3LkzYA3gfscFWtRubm613iN7e3s+/PBDW2ClXr164eTkZHPCLi4uhISEAKDT6ao5BMAWXQ+szvPBBx/ko48+YvTo0TRv3rxGfYsWLSIvLw+dToe/v3+12B4qKlXc/k7hJqFnz54MGjSIZ599Fh8fH3JycigpKcHR0REHBwcGDx5M06ZNGTduHACurq7V5oxPmTKFbt268c9//vOS9QwaNIi4uDj0en21YDUvvvgizz33HN988w2BgYGA9Wulqq5hw4bxzDPP8NFHH6HX6zGZTNWnPBoMKFUOIiPDuhq2Ms6ACJhMcOQIODpCs2awfPnyWm08d9bC8ZP2eNq3wsHBia82pRAV2YXPP19Ox+i7sFgUTBUWqlS9nZyC8fdw5dNlb/Hhgi2cPWPBiVKKDC40ts/E2d1MZq4rp3LdKRMzwZbj2Dk7UGR0wIgXGo3Jds0AwcHBDB06FA8PD2bNmsXIkSPJzc3l7rvvpl27drRr1+4yTxMcHBx4++23L5vvcjRp0oSlS5eSm5uLk5PTXyprzJgx/Pbbb7VKqkdHR/+l8lX+HqhO4ToRERFBXFwcPXv2xGKxoNPpWLhwIVqtlscffxwRQVEU3nnnHQBGjhzJ6NGjcXR0ZNeuXSQmJjJ48ODL1uPt7U379u0pKCioFge3f//+ZGdn06tXL0QEd3d32rZtS8+ePQFr7IPp06fTpk0b3NzccHJyYvTo0fj7+0NODoOHDOHXffvIKSggqF07Xhv/NKNnvMgnn3/NCy9MIjf3HGPG9KZ16/YsWPA9ISEKlT0mFBRAWZnVeZw5A6dOabCnnDzxJO6tFbz5xniM5SUENmzJ8lde4gxQWmLt8mmuOYqTkseo/r1Y+HUxUY19yT4n2GOHo6YMn4gGFBcX08xTyDiUQWZeAPk0JLjgNFm4Y68xYtQb0Wq1bN26lYiICFxcXGz35eTJk3z++ecA9OjR42o86nrz0EMPXZVyoqKi2Lt371UpS+Xvi2Idc7g16dChg1wYwCUlJYXWNURmalJ0AyKv1ZULbRMR+vTpU+9APPVBKhXxq4XKLSmxtuJ5eeDkhJSWkkEgZ2iAPUZCAoo5eM4bjQaCAy14nkyk1KwnTWmJRqehUUMhO9NIfqm1C8bLC3JzBU+lgKau2aQYW2AwQOPACnwzEhEAJycSK0IxmjToFBNtXY+i2GkZ9/bbdL7rLgb1epCU09YumSaB5fgE6v+8X4cOUVJo4qRDCMVlVv2hpk2FlJRtPPTQQ2RkZNS47qSkJCIiImjatClHjhy5qve0Kgj9zcjNaptqV/24UrsURdkjIh0udkz9UrgFUBTl6jsEEVAURKAwx8jpLDsqKhRaBJZQoegpKNLSqOAw5diT49yKoBBnzqTlklnig7uzkYISew5keiCK0KqVgmPhOTCbcHZ3JqQglUPGVqQf1qLBjiD7LMpdfcnOUdBrjDSxHEETEEJzndXf+DSwB4MnSl4e+PnhUqAhLw/cve1QmoQQFRWFp6cnH3z4Ifb29jjnmKgwavBqcMEq5WbNcC4vp5WTjtxc69eJl5eC2Wy2fvFchPDwcKZOnXrVBtNVVG51VKfwd8FshpMnKRFHSsu0eJWeIterBWeKnCiv0GGvMaLVakg94YhUqp8YaYJB64KxRIPdOThX4YWLk4WQ1joyDpeSkedEQ6dcHBUnazxHFxdo0QLnrCxanU6jFAc8vbVos88i+Rk44oW7thRtQAC4uuIA2NrioCCr7KeXFy5mq7OoCleckJBQ7VKat7TDYrngqwbAzg7s7FAAb+/zL712pwDWrjMVFRUrqlP4u5CXh2Rnc4w2GHDiBF5IjgZnu3ICOY2nJQ+T2HOUxrgopdg56ThZ4o0WwdkZTp8G0FA1TBHQzBGP42dxzD4JSZV1NG5sjVLv74+TtzdOZrNVf1mnQcnLw7+xC3g2vHgkewcHaNgQsHYzGY21x7Cvr2T05ZyCiorKn6hO4XbGZMJyJovTJn8sBXZ46rwxGJ3w97NgKTfiWnAKT1Meio8PGN2wLyykVUMDnDwFJaB1MuLYuAEaDSQng05nxsNDC1i7tJya+IOng7Wfxs3NOvWoisq3dsD6FRAUVGezdToIDr46t0BEsFgsqlNQUakjqlO4BTEYrA2n3QVP7+hRqKiwdp2IQHl2KQUlHhjQAh7kKm7Y2UFQsAaNYg8p5VAKNGhgff02Gq1/z56Figp8fLXgbC27aVMwmcpQFOfqlbq71/5KfxNgNpsREdUpqKjUEdUp3EqIYCw3k5Jih4sLhIRUrg2wq8Ct5Aw5pY3QKBaKiqyd7Qou6BUjLSSdAtw4J34E+Fb1xSvWlr60FNvc0aqFWt7ekJlZrbH39oaioporg292qqSd/fz8brAlKiq3BjcknoKiKM8qipKkKEqyoigTK9NeVRTltKIoCZW/mBth218lJyeHqKgooqKiaNCgAUFBQbb9ioqKOpUxfvx4UlNTqyeazZCeztnkbCwWKCyEI+lm8vIg45w9R0v9KC/N4x/3edGwdDcRJBKtSSA8QmHotHHs3rOGpk1h7971dOzYkdDQUKI6dyZ2wgROnToFWLtaZs+eTeh999F2xAgiO3Zk8uTJtlXNcXFxBAcH15BG2Lx5M+3atcPOzu6ywVgWLFhAaGgooaGhdOzYsdoCu7/KXXfdVWNQumoBnvqloKJSN677l4KiKOHAGOAOoALYqCjK95WH54rI7Ott09XE29vb1jC9+uqruLi4MHny5Gp5qoSnNDWmz1hZsGCBdd59Wdmfo6qHDmEqKSeLZnjoSyk12ZNXYIcbhRjRYcCRZiEO3NuzJ5sO7OHRfv3AxYW8khJ27tvHqu++IzV1H88/P5Fvv/2WVq1aISJ88803HD9+nODgYD788EM2b97Mzp07cXd3p7y8nDlz5lBeXo6TkxMxMTE899xzNSJrNWnShOXLl192he/atWtZsmQJ27dvx8vLi99//50BAwZcVX2lC1GdgopK/bgRXwqtgR0iUioiJuB/wIM3wI7rSnp6OuHh4YwbN47o6GgyMzMZO3YsHTp0ICwsjNdff92Wt1evXiRs20ZRwkE8PDyYNmECEQ8MoMPj48jOzSGw4hgNzcfQaypo3KCc5i0U/PzAzw9iH3mEld9/bx2p9fBg9erV9O3bFwcHB+Lj45kxY4ZN8E1RFAYMGEDXyoDsM2fOZOHChbhXdhvp9Xpeeuklm/xCp06daNCgQY1ra9q0KREREbU6uSreeecdZs+ebQvq3qFDBx577DEWLFgAWOUn8vPzAdixY4dttfWOHTvo3Lkz7dq1o2vXrqSlpQFQWlrK4MGD6dy5Mw8//DBlZWU16qzqPlKdgopK3bgRYwpJwFuKongDBiAG+B3IASYoijKscv95Ecm78GRFUcYCY8H6H33LBYJ17u7uNs2gqVP17N9/8YZKxBFFMdXb+IgIC++8U7cg8OXl5eh0OoqKiiguLubAgQPMnz+fWbNmAfDyyy/j5eWFyWSib9++3H///YSGhiIW4fhxoaxZOAVFRXRpFcbgUfOZO+95tvx3Af8Y1BcHnRG7xqVUaB0AI56eRkpLoXv37owdO5YTJ07g6enJZ599xjPPPENRURH79+9n0qRJNeLwAuTl5VFRUYGHh8dFj4N10Lbq2MXyGI1GDAZDrecfOHCAli1bVjseFhbGqlWrKCoqQkQoKipCq9VSUlJiqy84OJgNGzag1Wr56aefmDZtGkuXLmXevHm4uLjw66+/kpSURI8ePSgpKalWfklJCQDJyckcPHiwTs/talFcXFzj3+fNws1qm2pX/bgWdl13pyAiKYqivAP8BBQD+wATsAB4A6vm+xvAHGDURc7/N/BvsMpcXLjEOyUlxSYRYW8PWu3F7TCbTWi19b98e3twda3bRHm9Xo9er8fV1RUXFxeaN29ebUn68uXL+fjjjzGZTGRkZHD86FE6urhgKodSccTJwYxe70hYj2HkmxV69uzAjh1bUVq0QHFwwLVqgPg8XF1d6devHz/99BP9+vXj4MGD/POf/8TOzg6NRoOzszOurq5kZWXRq1cvSkpKeOqppxg2bBiKotju3fr163nppZfIy8vjq6++4o477qCoqAjHymmnF5MI0el0ODo6XlI+xNXVFWfnP2cwOTg4YGdnh6urq63+qjxarRZXV1dyc3MZPnw4hw8frlbOzp07mTJlClqtlrvuuouwsDDb9VWRm5uLRqPhvvvuq9Mzu5rcrNIIcPPaptpVP66FXTdk9pGIfAx8DKAoykzglIicrTquKMp/gO/+aj3z5tV+rKjIcN21j85vDNPS0nj//ffZtWsXHh4eDB06lLK8PKSkBDNaXJ0tNA/RotPZk2dyxdcXHBy01u6QCwZ6LyQ2NpbZs2djMBgYOHCgLWZAWFgYe/fuJSwsDD8/PxISEoiPj6e4uBgvLy/s7Ow4ceIEjRo1IiYmhpiYGPr06VPnAfILmTZtGhs3bsTOzo7ff/+d1q1bs2fPHrp3727Ls3fvXluMCTs7OywW6wyn87uCXn75ZXr37s2TTz5Jeno6ffr0sR27nJa/0WgVw1NRUakbN2r2kV/l30bAQGCFoijnjzQ+yJ/rZG9LCgsLcXV1xc3NjczMTH744QfEYKBUcUFQcPHQoddbF/8qynlyEJWsWrWqVonknj17kpyczMKFC6vFVJgyZQqvv/56tZlNpVX61FjltcePH09BQQFgHRC/WD99XYmPjychIYEq0cIpU6YwZcoU8vKsvYJ79+7l22+/ZcyYMYB1wHrPnj0ArF692lZOQUEBQZWL35YuXWpL7969O5999hkA+/btIzk5uYYNqlNQUakfN2qdwurKMQUj8JSI5CmK8omiKFFYu4+OAU/cINuuC9HR0bRp04bw8HCaNWtG+/ZdyShyI9/eOp++6qNCo4Hw8JrSDunp6bUGcNFqtTz44IN8++23tkFksEbeeu+993jkkUcoLi7Gx8eHxo0b2wa5n376aQwGAx07dsTBwQEXFxe6detGZGQkYHUaa9eupbCwkODgYMaNG8f06dP57bffGDx4MHl5eWzcuJFXXnmFxMTEGnYNHDiQzMxM7rzzTkwmE1lZWezfvx/vSqGiV199lTFjxtCgQYNqwWqmTp3KqFGjePfdd21BbgAmTJjA8OHD6dy5Mx06dKBDhw6ICKdOncLNzQ03NzdMJpPqFFRU6oEqnX2jMZmQ48dJLGyC0awFBL3eQkTEpRuy2NhY5s+fb2tQrwdX854ZjUaGDx+OTqdj2bJlV82ukpISUlJSUBQFHx8fsrOzKS8vp0uXLlfD7Hpxs/ZDw81rm2pX/VCls28nzGbrKHhGBqV55RjR4kgpBpxwdjYBl3YKVXGKb1V0Op0tuM1fwWAwUFxcbHMKVV1fTk5OnDt3Djc3N+zrq6CnovI3pk5OQVEUTyAQ6xTSYyJy6+kd3CyIWCUkMjLA0xPy8ylwbAYGIcQpgxzPFuj1RkB/2aJuZyoqKjh27BjOzs4EBQVhNBoREVsDLyLk5eVx7NgxLBYLZWVlNGrUiIKCApydnWnVqhVGoxG9Xk9KSsoNvhoVlVuHWp2CoijuwFNALGAPnAMcAH9FUXYAH4nI5uti5W1E+fEz5GRDibYVjnnFuCkW8nHHxUXBvlVzAhQoKrp1u/Tqg4hQXl6OQ+XU2qqQpGVlZaSmpmI0GikvLycoKMgWFa1Vq1acPXuW06dPY7FYcHZ2Rq/Xk5OTg9FopKSkhMDAQDQaDXr939uxqqhcCZf6UlgFLAe6iUj++QcURWkPPKYoSrPK6aUqdUBMZtKzPTDggIMOCs0unBEFDJXK0peZXnmrUlpaSnFxMb6+vuTk5JCTk0PLli05e/Ysp06dIjAwkIqKCnJzcwkNDSUjIwOz2WwbE6ioqKC4uNg2tTYvLw+dTkdAQABeXl6UlJTg7OzMyZMnAWwrslVUVOpPrU5BRP5xiWN7gD3XxKLbmJIzRRjwoHGDcnyD9ZjNUFxsDYXs63ujrbt2nDx5kqKiIioqKsjKysJisWAwGCgsLASwxU7WarWkpaVhNBoJCgrCxcWF7OxssrKyEBGMRiMWi4Xy8nLc3Nzw8fGx1eHn50dZWRlFRUU2WQ4VFZX6U+eBZkVRfIFnAUdggYikXzOrblOyc0CDGa8Aa7+4VntzhiOo6qP/K41raWkp5eXluLi4UFRUhEaj4cyZMzZ9pIKCAoqLi/Hz80Ov19tWSh86dAidTldN6jo7O9u2XV5ebhsrOB9FUWjcuLGtC0pFReXKqM/itTnAL8BG4Nae+nINqSGdHRhIVGgoUa1COVuqx8upHK328o3W4sWLOXPmTJ3rTU9PtzWK5xMeHs7evXsBWLZsGREREYSFhREZGcnYsWMpKCjAYDBQXl7OtGnTaNGiBREREbRr1464uDhbOcOHD6dp06ZERUVhMpls6qMrV66kVatWaDQamwZLRUUFhw4d4vDhwzZZ7hYtWrBs2TIGDRrEoEGD6N+/P4cOHcLV1RV/f3/buoJmzZrRokULtFotWq0WR0dHm6gd/Km5dKFTqBLTUx2Cispf41IDzRuBt0SkSvDeHuuiMuHvPjXmElSTzn75ZVxKSpg8ciQZdo3IMDjiE1Q3Eb7FixcTHR19UVXSi9GiRQv8/PzYvn27bcFacnIyRqOR6OhovvvuO+bPn88PP/xAYGAgZrOZJUuWkJqaikajYdGiRRiNRvbt20dqaipFRUWsWLGC7Oxs9Ho9o0aNYsSIEUyaNImDBw9SVlaGTqdDr9czc+ZM3nzzTU6fPk1qaipmsxmLxYJOpyMnJwdHR0cWL17M0aNHSU5O5ty5c6xZs4bnn3+emJjqYTOqFFSrcHZ2xmAw4ObmRmFhoc0pqNNMVVSuDZfqPhoCzFAUZTwwo/IXh7X76MnrYNutT0UFiFDWNJTMND2bNy/jySc/pKKigi5dujB//nwsFgsjR44kISEBEWHs2LG4ubmRkJDAkCFDcHR0ZNeuXXVqBGNjY1m5cqXNKaxYscImc/HWW2/x3nvvERgYCFj77x966CEOHTpESUkJX375JSdPnqSgoACLxUJUVBQeHh4cO3YMsMpmHzx4ELPZTFlZGT4+PogIkZGRODs74+zsjJ+fH0ajkbKyMpo0aYKdnR3p6el4eXnx7rvv8ttvv+Ho6Iibmxtdu3YlMjKSVatWMWzYMHx8fGyy2StXrmTTpk0sWrSI//3vf8yaNQtFUXB2dmbmzJk2BzFw4EBycnKIjo6u8YWkoqJyZVxqoLkAmKwoSjPgLeA0VkmKgutl3NWgtsV+ZrOjTUG1Xz+oioNz990wYoT1l50NgwZVP69eKrVmM0bsOHrKnsOHk9i6dQ3bt2/Hzs6OsWPHsnLlSpo3b052djb79+8HID8/H61Wy6JFi5g/fz5RUVF1rm7IkCF07NiRefPmodVq+eKLL/j2228Bq2x1dHR0tfzZ2dnodDpKSkpo0KABOp2OrKws3N3dcXd3Jzw8nJKSEg4dOmSTtq7qz2/8/9k7z/Aqqq4N35OekAaBhBZKCL13UIoI0kGKoIKKgqKiglgQu8jLi4AFFStNQYEXpFtApYnSQWoogQChk0II6ck5z/djkhAgQBJIAnxzX9dcJ2dm79nPmXMya3ZZa5Uvf8VQTYkSJahVqxZ2uz1z7qBq1aqZ8wDly5cHyIyI2qBBA0JCQq75mTp27Ejz5s2pWLEio0aN4vvvv2fo0KH85z//oU2bNrzxxhvMmTOHqVOtRXAWFjeDaw0fBQHPYsYnehmoBMw1DONnTB8FW8FIvH1JTYMYoyRJBMKGZgAAIABJREFUyQYHD/7J1q2bMyOCJiYmEhgYSIcOHdi/fz/Dhg2jc+fOtG/fnri4uDy1V6ZMGapUqcLq1avx8fHBy8uLatWqXVFu+/btPP7440RFRfHaa69lGp4jR46QlpbG8uXL6dOnD5GRkWzatAknJyfi4uJITk7GbrcTEBBwzbH7rMl2vLy8SElJuaS8o6Mj1apVw9vb+7oB906fPs0rr7zC6dOnuXDhAoGBgbi4uLB27Vp+/fVXALp06XJrhCyxsLgDuNbw0WzgDaAIMFNSW6CDYRgDgN+Bgg9Qnweu9mR/tdDZWcsXL57LnsFlJKc5ImeDGjVg9WoxcOBARo8efUW5nTt38ttvv/HZZ58xf/58Pvroozy3mTGE5OPjc0mE1Bo1arBx40batGlDvXr12LZtG3369MFut1O7dm1OnjzJmTNnKF68OM899xzPP/881apVw2634+npSVxcHBcuXMAwjBzFW3rsscfYuXMn5cqVY8mSJTg6OmaG5QZzrmD79u10794dBweHS4Z/shqK5557jjfeeIPOnTszc+ZMPv/888xJZmtS2cLi5nOt1UduwOH0LXNtoqTvga75rOuOIM3ugKNhx9XVDGc9d+7czOWVUVFRhIeHExERgST69OnDqFGjMlcKeXl5XZJBbMSIEZlDQdfigQceYOnSpcyZM4fmzZuTnGxmiRs2bBjPP/88//zzD2lpaSQnJ2dmhvPx8aFXr158+OGH+Pr6YhjGJSuMvLy8SE5OJj4+PnNV0PWYMWMG27dvZ8mSJQC8+uqrvPDCC5k3/OXLlxMaGkrPnj1xcHCgaNGihIaGYrfbWbhwYeZ5MsJmS2LRokWAufIoa9js33777arZ3iwsLHLHtXoKQ4AJQArwTNYDkhLzU9SdQprdEQ8Hc5Stdu3avPvuu7Rr1y5zZc7XX3+No6MjgwYNylxfP27cOACeeOIJnnzyycyJ5p07d9KnT5/rtunn50fDhg05efIkbm5u7Nmzh8DAQGrVqkXfvn0ZMGAAhmFQrFixzOErMPMnv/nmm7Ro0QJvb288PDx48sknCQgIICUlhZEjR7J9+/bMsNn/+c9/ePzxx5k3bx7Dhw8nIiKCDh060KhRI3755ZcrdL344oucP3+eWrVqkZaWRlpaGrt27cp86h83bhwdO3akXLly1KhRI9OYvffee/Ts2ZOyZctSu3Ztjh07houLC6NGjeLhhx9m7ty53H333Zn5FiwsLG4QSbft1rBhQ11OSEjIFfuyIzY2Nkfl8ozNpn83p+jInrhcV71cm91uV/v27bMtGxkZeUX55ORkbd68WceOHdO+ffu0efNmbd68WTExMTpz5ow2b96sAwcOaPPmzbLZbNfVY7fbtW3bNu3cuVN2uz3Xn+dyzp8/rzZt2ujtt9/OVb3Y2Fht3rxZUVFRV+y/Fjn9TdxsVq1aVSjt5oRbVZulK3fkVRewRVe5r15ronkp8A2wXFLqZceCgMcxI6ZOy0+jdbuSmpRGGi64uSbf8LkMw2D58uVX7E9OTubw4cO4u7tTo0aNzDH2jInqokWLUrp06cwwEj4+PqSlpWUuPXVzc7tkUvha7VesWPGKCeO84u3tzcqVK3Ndz9PTk8DAQHyvk47UwsIi71xr+Ogp4CXgU8MworkYJbUCcAiYJGlxviu8TUmKN4eN3Nxv3mRoSkoKsbGx+Pn5YRhGpsdzYmIiCQkJmTmg4+PjMQwDd3d3HBwcKFu2bOY5nJyc8PX15dy5c5mhJXKCr69voY/bG4ZBQEBAoWqwsLjTuZafwmlgBDDCMIwKQCnMfAoHJCVcrd6tgG6B+DdJCWbKCTePm5cG++zZs5w+fZrU1FSKFi1KZGQkxYoV49y5c0RFRV1iFIoUKXLVXkBGndwYhdsVWU5tFha54rp3LMMwngdiJK2XtP1WNwhubm5ERUUV+s0gKcnAwI5LkZuX3C7jSf3EiRPs2bMHwzAoU6YMvr6+REdHZ4aXyDAKV8PHxwd/f/8rQkrcaUgiKioqM1+DhYXF9cnJHasksMUwjG3ANMw5hlv28ats2bIcP36ciIiIa5ZLSkrKn5uF3Q6JiZyNccGWJvaFOuc6T0JWbcnJydhsNtzc3Dh27BheXl6kpqbi6OiIr68vYWFhJCUlcebMGaKionB1dSUuLg5J13WCO3z4cJ513UpcS5ebm9slw2cWFhbX4Woz0Fk3wAA6AHOAg8B/gUo5qZufW3arj3JKvq0m+PxzCVTOIVwPui/O0ymGDx+uokWLKjAwUJgBCDVmzBgB+vPPP7Ot88cffyggIEBubm568MEHFR8ffyOfIlvutBUY+c2tqku6dbVZunJHfqw+ytGAd/pJTqdvaUBR4CfDMMbfbCN12xMaynHKEG4PpFmJQ3k6xcaNG3F0dOTuu+9m4sSJ+Pr68vbbb+Pi4kLz5s2zrdOuXTuOHTtGdHQ0c+bMsRLNWFhY5InrDh8ZhjEUGABEAlOAVyWlGobhAIRiTkZbZBAWxtoiHSEeWlY8nqdTHDt2jFatWjF7tpm24vz587z77rs0bdr0mjd7Z2dnnJ2d89SmhYWFBeQsyU5xoJekDpLmKd1nQZIdK9zFlYSFsdb/ATxdU6j7VrdcV09NTeXkyZOXBLIbOnQoJUuWpHv37jdTqYWFhcUV5GSi+VcgOuONYRheQA1JGyXtzTdltyN2O4SF8bdnHe5q7YJTu3tyfYpDhw5hs9kuMQq+vr4cPXrU6gVYWFjkOzkxCl8BWQPxx2ez7/83NhucOQPAuSQ3dieXom/L3J1iyZIlHDx4kKCgIIArQl5bmcYsLCwKgpwMHxnpE81A5rDRzVt8fyfwySdQqRJs2MBaWiIZtMyFUThx4gSPPPIII0aM4O+//wbM5DQWFhYWBU1OjEKYYRhDDcNwTt+GAWE30qhhGMMMw9htGMYewzBeTN9XzDCMPwzDCE1/LXojbRQoP/wASUkwaRITeZGA4mk0bZqzqpJ47rnnSExMxGaz8c0331C8eHG8vb3zV7OFhYVFNuTEKDwD3IWZjvM40BQYnNcGDcOohRlXqQlQF+hqGEZlYCSwQlJlYEX6+1uf/fthxw4A1qyysYp7Gfka5NTHa/369SxevJjRo0dTpUoV4uLiCAwMzEfBFhYWFlfnukZB0llJD0nylxQgqZ+kszfQZnVgg6QESWnAGqAncD/wfXqZ74EeN9BGwTFvnvnapQvv8w6lHM/w9HM5H12bMmUKnp6ePP/88/Tt2xcgMzuZhYWFRUGTEz8FN2AQUBMzSioAkgbmsc3dwBjDMPwwA+x1BrYAAZJOpZ/7lGEY/lfRM5j0nkpAQACr85gvMy4uLs91s9Jo+nTSatcmtElrVv9yD8OLT2fjxuBr1klNTeXnn3+mcePGzJ49m7Zt27Jly5bMSeYyZcrcFG03m5t1zW42lq7cc6tqs3TljnzRdTVX54wNmAeMxgyXnZGf+dPr1bvOOQcB24C/gK+BTzCD7mUtc+565yn0MBdnzkggjRunTX8lCqT57b++brXvvvtOgFxcXARow4YNmcc2bNig5cuX37i2fOBOc/XPb25VXdKtq83SlTsKK8xFsKS3gXiZ+Zm7ALVv0BBNldRAUitMH4hQ4IxhGKUA0l9vZIiqYNi40Xxt3pwd+81OVN33e1+32syZMwkMDKRChQo0adKEJk2aZB5r2rSptfzUwsKi0MiJUcjIuhaTPknsg5loJ89kDA0ZhlEO6AXMBpZg9kRIf731E/hs3AiOjtCwITt2gKcnVGxc/JpVjh8/zsqVKxk4cCAhISGsWbOm0HM/WFhYWGSQkxnRb9OXh76FeeP2BN6+wXbnp88ppALPSTpnGMYHwFzDMAYB4cD1s9QXNhs3Qp064OHBjh1Qty5cL7vlrFmzkMQjjzyCo6Mjjo6OBaPVwsLCIgdc0yikB72LlXQOc/w/6GY0KukK1y5JUUDbm3H+AsFuh02boF8/JHNV6iOPXL/arFmzaNasGcHB156MtrCwsCgMrvlcK9N7+fkC0nJ7sW8fxMZCs2YcOWL+WbfutauEhoayY8cOHnzwwQKRaGFhYZFbcjKn8IdhGK8YhhGY7nVczDCMOzuPY07ImGRu2jTDd+26RmH+/PkA9OrVKx+FWVhYWOSdnMwpZPgjPJdln7hJQ0m3LTt2QJEiUKUKf30LLi5Qq1b2RTdt2kRiYiLz5s2jadOmlnOahYXFLct1jYKkigUh5LYjNBSCg7HjwLx50LGjaSMuJykpic6dOxMVFQXAhAkTCliohYWFRc7JiUfzY9ntlzTj5su5fTi9L4atpR7Edz0cPw4ffJB9uZ9++omoqCiGDBlCaGgo/fv3L1ihFhYWFrkgJ8NHjbP87Ya5Qmgb8P/XKKSl8dnhbowNG0mlAeDqCldLivbVV18RHBzM559/jsP11qtaWFhYFDI5GT56Iet7wzB8gJn5puh2IDyccJUF4NAh6NkTvLwuLXLixAmmTp3KunXr+OijjyyDYGFhcVuQl2Q5CUDlmy3ktiI0lOOU5a5a53losA8dOlx6WBJt2rQhNDSU1q1bM3BgXmMHWlhYWBQsOZlTWIq52gjMJaw1gLn5KeqW5+BBTtCeRpWceeGFKw+HhIQQGhrKl19+ybPPPlvw+iwsLCzySE56Ch9m+TsNOCrpeD7puS3QgVCOM5D7K2WfSWfZsmUAdO3atSBlWVhYWNwwOTEK4cApSUkAhmG4G4ZRQdKRfFV2C3Nu72mScKdM2eyPL1u2jJo1a1oZ1Cws7gBee+01du3axT333FPYUgqEnMx+zgPsWd7b0vf9v+XEgXgAyqYbhQ0bNtCvXz9SU1OJj4/nr7/+omPHjoWo0MLiFmfVKhg5EtLS2LJlC6+99hqpqakYaWm5PlVERASHDh26ufq++go+/piff/6Z8ePHs2zZMk6fPn1z28gtR49CHq5PbsmJUXCSlJLxJv3v/78B/xMTOZ4+eFamjPn63XffMXv2bFatWsXKlStJSUmxjIKFxbVYtw7GjeP8yy/TpUsXxo8fz+Rvv6X2G29wul8/fvjhB86cOcPHH3/M2rVrWbp0Ke8PGUJK165gtzN37ly++eYb7HY7jRo14rfeveGll8Bu5/PPP+e+++5j5vTpTJw4kXHjxmUk7soWJSVx9OhROHcOhg+HlBR44w147TUit26lUqVKSGLhwoWX1Pv999/58MMPsz/ppEnw118373qtXQuVKsFTT928c16Nq2Xf0cUMaH8A3bO8vx9Ycb16BbEVWOa1hASpQQNp1ixp7FhNZpBAOnrUPFyrVi0BGjRokLp3764SJUooKSmpYLQVIJau3HGr6pLyX5vNZtPkyZM1bNgwff11ejbCJ56QmjeXJMXHx+tAkyaygR52d1eDBg30GEigb+vWVXBwsGJiYlSpUiUBqgk6C0pycND8adN0j5OTvi1XTqmpqdr59NNmBkTQ1nvu0ZegcyAbqBcuggpavXq1YqdMkerU0ZrZs/Xss88qISFBSklRTLFiGgnaPmiQ5O4u+6xZmefTkCFKTU1VYGCg7r333ks+Y4sWLeTq6qqUlBRJUnJyst584w0dHzzYrDtggP76PVFN6yUpJkZSaqq0dKn066/Sxx9LAwdKa9de/SIeOiRVqiT17y972bJKc3RUSvny0vnzmUXyI/NaToxCJWAD5txCOLAOMxvb/x+jsHevealcXCRPT71X9UcZhpSSIp07d06GYcjJyUleXl4yDENvvfVWnnXlWlsBYunKHbeqLin/tU2fPl2AHB0dNXfuXKWkpGhys2aaXbu2kpKS1Lx5cxUB7XFzk0AXatdWGmgtKGbCBCW+/bYkKTY2VvNnzFBsYKDivL1VDQQP6v2SbXShRHnZPv1cAqV06qSVlSpJoDRQ2iOP6OigQera5ZxACgpqohZOThLoaM2aAlS3bl3tHTVKAnUD1S9ZUrF79yqkcWNFg8507iw5O0sffKBHHnlEToah/fv26fDhw5Kk8OV7NOuZFdpT5j7ZKlTUdn9//ZxhTB5/XEpNVVvPDQKpY8fvtLVHj4vGBiQPD/O1Wzfpzz8vvYBbtkj160teXrK7uyvVMNQctGvTJkVFRWU+dBaKUcgsaCbX8cpp+YLYCswo/PWXealcXSVHRz35wDkFBJiHli1bJkBDhw4VICcnJx0/fjzPunKtrQCxdOWOW1WXlL/aEhISVKZMGTVu3FjxsamKXmI+Dd9///1asGCBUlOlN98crf/973+yJyRIw4crqVINNfQLUe2q4fqk8Y9q5rVLd9eJlYKDpfLlFU6gzi9epddfHyVX17jM+2rLhvFKeWyQEmNi1KBWLa1o00ap//yTqSU42Cz333qT9crQoYodO1YCHWvbVq8UKaIw0EHQzO++U7t27XT84EHZvLy0/+67lbhvnzlCMHq0pk6dqocMQ8dAdX189L9ZkSpqmAanvnuI/qnWWBtA0a6u2tCqlexpadq16+L9vwgzlQBK7NxdF37/0zx3XJzso0bJXqKE1KyZdO6cKToyMtNgJM6bpwfvuUc1QB9//LGSkpLUoHp1Dend+4a+xxvtKfwX8M3yvijwn+vVK4itwIzCggXmpVq6VFq7Vp06SRlNv/POO3JwcFBkZKSKFi2qhx9+OM+a8qStALF05Y5bVZeUv9o++OADQVm93OMv+bvGqDhndfB/W2S32yVJd98tvfqqWTYsTEpOlv7zH/NfzNc3WSDVqGHXqDLfSCVKKPq+vvLzTNTMmWadM2ekzz+Xhg8360yYICUmSnPnpmY8oF9CjdLn1MR5m7Rjh2SzSc8+K6X3UL5066/vn3jmYuFDh8yHv19/zdxlt0t//LFaoVOn6o863dS40WGBVDvogl5v8Za8PSvL3d1drVpN0FNPSYcPS6mpdvXqZZO7u1SixAa5G1H6jVbycLugkiV7KDg4WL/+GqmKFdepmPd3OnXkrHT6tDR5sjkEsWiRDo0dq2bNmsnBwUFTp041xaSl6YKvr0526iSp8IzCv9ns23a9egWxFZhR+OYb81IdOyZJql1b6t7dPNS2bVvVr19fkhQWFqbY2Ng8a8qTtgLkdtVls9kUHR1dMGKykOPrlZQkxcXlq5bLyc/vskrRLzOfkO9xWK1ibuaT/erV5g12yBDpp5+k6GipRAkpKMi8Rz/wgLR8+Wrt2SPZ/zfXPMG0afr3X+mzz0wDkhW73fw/dHOTfHzM4iVKSAcPSsePS506STEx0kcfmcdefSFRfftKP/4oJZy9oFVTD6l4cbvOnr3sA+zff8nbESOkGjViZLdLbdtKRYpI775rfmWzZ88WIGdnZ735ZqSaNZMuXEhU9+4PysMjQUOHSnPmpAmkRhVfEkyWm1tjPfXUs2rVyi5v7zSBTXXrSnNHbNZf3KWnevymVq2eEwTI19dX8+bNU5Mm0rp16YKmTpXWrJFUeEZhJ+Ca5b07sOd69QpiKzCjMGaMeakSEyVJxYqZP2ybzSZPT08NGTIkzzpuWFsBcrvqmvvBB6ru4qKQkJCCEZROjq9Xgwbp/4oFR359lydPnlQ59qixw0bteWeOFBenNWvM0ZB33rmy/OLFZs+heHHzmStTV7Vq5jVJS7tme+Hh5uUbMEBavvxiL2HtWrP6okXSqVOSo+NFowHS7NnS2bPm/3FcnPT++9Izz2TfxsyZUv360dq2zaw7ZszFY5GRkXJ1ddULL7yQuW/Tpk3q1auXPvtshdLSTMPUtas0YcJaubu7a9GiRUpNldavN9ew/PqrVLKkLpluMKcc4rR373mlpEjly0vz5pnnt9nMTcofo5AT57UfgBWGYUxPf/8E8H2uljjd7kREgKcnuLlx6hRER0NgoBn0Li4ujjp16hS2QotrEPzDD4SkpPBi//58snUrhmEUtqRL2bbNfE1ONkPu3sb8/PNqjvEgDwXPocaofgC0agVRUeCWTQCA7t3NTQLDgIMH0w/MmgVFi4Kj4zXbCwyErVuv3N+ihbnC1MfHPO/q1VCsGFSrBmvWQMuW4OQEX3xhlj93DqZMgUaNYPJkc/+ZM9C0qZl7vWzZHcyYcQ/OzjBo0MV2/Pz82LNnzyWJsxo3bpyZZRFMDUuXArRg6NAYXFzMFf3NmpnHO3WCY8fg778hIiKN1NTtnDhRCw+PIlSubF6CvXvB3d28Ts88Y36mr7665qXJMzmJkjreMIydQDvAAJYB5fNHzi1KZCQULw7A55+bX8gDD8CBAwcAqFKlSmGqs7gOnpGRALz477/MnjWLflfLaZFxZ8olhw4dYvXq1Tz00EMUyS7T0rWwZ/ELDQmB+vVz3X5BERISwpdffkmXLl3o1KlTtmXWLv6LDvjStvWlt5bsDEJWrrjsN+E6+Ppe/LtFi4t/t2lzZdlnn4VPPoEnnzTfd+kC58/DQw/B9Olgs8HXX8O990JAwKV1K1WqlGNNGQbhcpycwHSYdgIaXXHc3f3i38WLww8/mM+q+UFO4zmfxvRq7o2ZT2Fv/si5RYmIgBIluHABvvwSeveG4GDLKNwuFIuJYY+rK8OqV+fd994jLatX6N9/Q/v2prfo00+bj5E5wG6HIUPM6vPnz2fw4MHs378fe9abfHakpsKPP8LJk+b741nCiG3ffmnZfftgyRLWrl1LTEzMlecaOhQefBAwHal27doFmDfvw4cPX1XCrl2QkpL7UO4xMTHMnz+fMulemzab7YrPO/SeSvxGZ9r39sn1+QuTypXhuedgwADYtAkSE80b8X//ax5PTHSiZUsYN65wdRoGjBkD//57pXG6WVz1l2EYRhXDMN4xDGMvMAk4BhiS2kialD9yblHSewrTp5tPD6++au4+cOAAHh4elC5dunD1WVydpCT8kpLYWLIkj48Zw8GDB1m9erU5VjBjBpw9S+KJaJLdfMwxhkcfNccSrsPmzWb3/YEHYMCAVxk9ejQNGzbMvDFnJTU1lT/++MOck5syxRyPKF8exo83h4veesssmNUo7N0LLVqgHj14vHVrurRpQ9xff5m9mQxKloSyZQkLC6Nr1660b9+e7du3U7NmTb7/3hzhDQvLMiQD7N4NderAwIGNWLMGQkNDSUlJITIykoYNG/LLL3+S/qyTidLbbNq0GSNGnODIkTqkpqbSqlUrBjzwgDnWkmIGPajnnP5IW7v2da/hrcakSfDdd9C4MWzYYDoRlyplHvP0TOP336Fu3UKVCJiGwc8vHxu42mQDZs9gDVkc1YCwq5UvjK3AJprLlZMee0xdupjzXxl07txZ9erVy7OGm6KtALktde3dq8V0U2nfOE0aHqpTvfuaM4wZs3kJCbrnHrt69ZK0aZPk5CT17GnO5L3zjvTaa5LMFS2pqXZNmzZNZ8+e1ZtvSg4OUq1a0u7d0uk//pAPaPz48VfoeueddwRo4cKF0q+/Kumhh3QoMFD24sUzZwxTm7XQN5UnKCZGijsTp7auf+mfop1ld3TUeNCTlNd8eiom47P++af0xhtSXJweeughubu7q4qjoyY6OKhykSI6dOiQJNOBODg4vZmzZ/X28wcFkp9frLy90+Tg4K727durZ8+eAjR4cJwMw67AwLfVrl07rVixQuPHj9e9996rgwdjBdKLQw5oeJkycgVNy7iOP/6oZcuWqWrwBT3V5YS5NOhmf5eFyJ2mi7ysPgJ6Av/D7CFMxhw2Ony18oWxFZhRcHeX/aWX5e9vrnLIIDg4WH379s2zhqtxp/0A85tr6vr1Vw1hUqYNaMfvOvfws+ab335TQoJpB5ycTJ8hffyxBDpbubIEsjs76/f5CxVQLFl96myVI6h58+aqU0dq1UraXSJAv7VsKVWooD+8vHTfffddouvCuXPy8qwtmKz69e9SamqqOnXqpIEZy2F++UWKjNTk/54VmOv1l72+WiBVL3dBR5s2VRToqUfMz1CnTh+dPZuqn+//VvLw0MZ//lEp0PhhwxTt6yuB4n18lLxmjfbvD5ezs9nMqlWSWrdWJ8clglC99dY/6dekqwABGjNmvEqUkJycbAKbnJxeE7gJXlWtWgNlt9t15ow0tNv9igd94PS8TlDKvE59+6pKlSqqXHmafvwxn77LQuRO03Uto3DV4SNJCyU9CFQDVgPDgQDDML4yDKN9fvRabkkSEiAxkWPOQZw9a3YtAVJSUjh8+LA1n3AjJCSYY/g2W66rpqSkMHv2bLZlrNy5Cjp0iH1Uo3qlSCZ/msAaWnPX7OcJ8S4DHTvy779m4Mm0NFi4EHjxRdbVqkWJ0FB2OThw3Gbjud7vcSbahbM7YxlPB/zXn2DnTqhTM4xtEWdI8C3FsFJzKXYhmCKrV3P+/HkAHJKS8GzfHhfHzcCTBP7rROsaNfjtt9+4d9QoU2CXLiTe04n3vigBwHffJVJ/3bu0cl7PqdgiLK9enw3A6093YMiQcGqWdmV4j3C6Ln6KwxWaYgz7hLbGZLrM3YlvWhqnP/oIDz8/Yu67j8ceGEtqqtnM4J5fw5o1BNmO0q38Znrbf8fT4RyeRQYyY8YMnnnmGYoVe4iICKhWbQyGsZi0tA/w8IgFxtO79xgMw8DfHwaPHcOrVVvzdtpHdHD5k6kYpCxaxD8rV/JP1130q7H98q/B4nbiatYiuw0oBjwNrMxNvfzaCqSncOSIBPrp2T8F0saN5u69e/cK0IwZM/Ks4Ya1FTB51XXs2LHs66aHHFDNmtLmzZccstvtSkxM1MmTJ7M9Z2pqqlxcXPTqq69eU1fK0KHaSG0NGzpHkrS8yVsC6ZHy38hut+uLL0zHouLFbWrbNk0DBgyQI+VUqkiYalT5Re3aPqYSxcYLJC/nBD3kPFef8oJAal7tfvn7++vIkQsKDLRrfNFROgXa2KSJ9McfOta7t9Z4ds7spczgIY1wddX3338vSYrx9VWUg4Pee+hfgdTVY7w60F4XQB/WGCWQSpfeIWfnHUpIMD/Prk9XyMAmkF4n4juZAAAgAElEQVRxvFdvt10hkFyMZG2cslOStG36dv1CJw2/55f0uDsj5QDqBAoxDCUVLao00JN8K3eHCxnuN/rrr9Py8vpKFXHWrKBKmth/k1o2iteKdv81vc1sNnORfnokyBlTUwTSE7Xfk0DLnv9BsXhKX36Zw1/Gldxpv/38plBjH93MDbPXsQfYDcwG3IDvgMPA9vSt3vXOUyBGYcsWCfRarwNydjadTyVp8eLFArRhw4Y8a7hhbfnBoUNSfLz596+/SqGhmYfyqqt169YCtHXr1ksP9Owp+ftLpUpJjRtnjkPv27dPjRo1UpMmTVSlShWz7JEjl7i0jh07VoC6dOlybV09e0rVq198v2CBujn9oqI+Ns2a9Yvc3Ny0adNR1amzVJCq1q37qEOHrho6NC197F3y948QbNOrr36kzRvOys0pVk1Yr2mg6dOmSUoPW7Nli/b4+eku1mggU7SJRirrdED+/jadPi2d2rZNu3ad1datZmiHL5tO1evuH8nJya5mTU9qnaenPg0arGreq1SZ6nJ0NG/+FSqYN/uUFMnNzZ5pZF5uMlX9HkxTyWJJGvCYLTPg5vjxUlGfNHXoIJUvGatw0OS+ffXSSxu14AkznsRmBwc9S0t1abpTZ85cvDzH3n9faZd7UYFUtqzpbeXgIM0xDWxamlS1qlSzepqiqtSVb5FkPfZwinThQq5/IxncaTff/OaOMApAmfSbv3v6+7nA4+lG4YHcnKtAjMJvv0mgNg1i1KjRxd3jx48XoKioqDxruGFteWHpUum++y4NEDN2rPTSS6brpYeHNHKkaf1cXc0IjjnQderU1Zts3ry5ADVs2FCpWdstX1566CHpiy8kwzCj0Upavny5GjRooN69e8vDw0N2u10pTZsqNf3mbrfbVadOHQEKCgq6UtexY5mesId/2qLvh/+rrFEutm2xydNTmjQpRIC+/PJLTZ9uRrNMD84pyZRTtkSiQOredKUA9e17RD4+dm27Lz1cc8uWlzS9Y8cOOTJBBqZRcXY6p99/t2Ue//prs9rBg1LjcqcFUtXyiWZo5cRETZtqV6lSdhUrVloBAXsEF6Mrp6SYE9sfVpssd+I1/OFTqldP6tjx0o8fEmJ2vAICpOKe8zUPdHK1+flatbRLM2dq7aJFmeWjoqQObVMVEiIlh4UprHdvRe3aZfYO3nhD+vZbU/QPP5jXNjk5s+6cOeahRo2UMU1zQ9xpN9/85k4yCsfSh6KcgJ+B9resUZg5UzYMeXum6dlnL+7u06ePAgMD89x+rrSlpUn79t3YSePizP/+n34yn8ozIrnu2ye1bi317m3+04PUtKn5VAhmYJn0uDzZXbP4eGng4+YN8I9Flz0h2mxm0JpTpzRr1iwBmjJlinksMtI8//jx5vmz9EgyeOyxJYIOij5zRgmgNBw0fewpJSWZnYrevWcIPPVbxp3o9Gnp0UfN886aJUl6801ztc2KFUcvOXdsrHT2rF3u7r+oTRtzhdHkyeZN7fXXlRkP59CmSPXxWaYDc7dpx44dSkhIMr+Ko0fNdj788ArdQ4YMETRX06brdeKEue/rr6XRo6UTJy6OxJzYHa0ny/+u0LUXLWpYmBnjpn///vL27qmRI+1XLuT56SfVc9mj9u3S5OYmvfzyFRJ04oQZ9fm553ZlXp+ICGXqyfpdhjw+TuU4on9Wp1x5IskUW726VLfuFauK7HYzRASYnb7Lg9Hlljvt5pvfFFaYi5uKpBOGYXyImZshEfhd0u+GYfQDxhiG8Q6wAhgpKfny+oZhDAYGAwQEBJhrzvNAXFxcjuqWXb8eJ8oRG+eIh8d+Vq8+hST+/PNPGjZsmOf2c6otcPZsSv7+O84xMWycORObp2eezhnw++9UGzeOzdOmkTB+PISGQmgoVT76iBJbtzJ70p9Ev7eKFwH71q0cmTKFIICkJIZWrUrjsWOx2+0MHz6cXs2bY7i6kubjw5gx1VnxZwmcSOV/z/yGk0+JzDadY2K4e+hQTv/8MyVHjqRFQADTv/mGSpUqUXTrVuoC2x0ciNm82axw/DhI2Ox2HBwcmTGjG9CNNV+NogfwEz154vWSXFg9leLNfJk//1HuxpNFCxfx+qsHmBz+CQ0ST7C9QQP22+207taNQA8fYDPHj7/D6tVlLrkmJ0644+RUlVWrxjFx4kRq1KjB8uXl+eKLYJo1W4+3t+nkNmSRKyc4D9GwceN6AE4BjkuXYvPwMP0bsnD//fezfv16WrVawIEDSRw4AAsXVuPsWVdatNiBn9/FpFz9v3PmeNo+jq/ed8k5KlSoQGzsGD74wIHixT+kYcOGFw/6+RHQphi7dyeTlOSBg8M+Vq++MlXk0qUO2O3g5uZ2ye/0wIFLf2NO1Tz5rscXpCa3Y/Xq7D1u/Xv2JGDlSnavXIkuCz3RsiWMHu2Hi4udv/++vo/Htcjp/2VB8/9K19WsRX5tmKG3VwIlAGdgEfAIUAozjIYrZmyld653rgLpKbz+ulY7tDGfhP8wdx04cECAvvnmmzy3nyNtMTHmsMoDD5hPvhlPaV99JQ0dasYMXrs2Z49nDz5ojidkRNJKS1NsbKxig4MV3aS5ivvZdBd/y165imyOjtpTpIhSS5fWOUdHzQANGzZM48aNE6DYSpWkOnU09Ztv5ONzSh4O8/Wcwxf6kJcUlSWWvSS90b69hgwcaMY7Bs1ycFB8fLw0bpz5eJkx/GazSb16Kfb551WkSBFN/HBp5nD2n4+/IoF6O80TSK+7vK/3yo0wJ/5prLtBbsToNcZq0+uvm8NK3t5KrFhRq7t3F5BtlNSEBGnAgA0CBwGZyVOyJLbKM3a7Pdvf2PTp0p49168fGRmZuVT04MGD2ZZZuNC8PnmZ1srTE2bKVXoSN5E77Yk8vynQJan5SDtMf4cISanAAuAuSRl96GRgOtCkELRdSUQE4Z41AMiIefVX+mNey5Yt87ftjRvN++LTT8PDD5uujPPnm4FaJk82XatbtjSPX864cWjlSpYsWUJKQgJattyMvOXgABMnQqlSPPfoo7gfPMgXm9YzO/U+PuJljC+/4OkHH6RmfDy17HYW2Wz0c3Dgo5EjqVu3LgdWrsTr0CHYuZN9L73ChQvFqF7flwFLyvO08Ql777sP2WymF/jBg6hhQ0pWqJAREYwKdjsrV65ketGihP3yixmlDMDBge1Gfb7cXoP4+Hiit3sD0IaR2Dev4Qxu/Gp0A2B6kUbMdqiBYYiy7GSlgwPTeRovPqPjN99QtGhRGnZ4igmP7GbA9k8wjA74+FwZdsHdHcaMKYvppwnly5cHwNv7xr+67ILuXbgATzwBixZdv76fnx9Tp04lJCTkqrF1QkLM1xo1bkRpLnB2LqCGLAqTwjAK4UAzwzA8DPM/py2w1zCMUgDp+3pgrkwqfMLCCPeuBZgRGQHWrl1L8eLFqVatWu7P99ZbMHLkxfeRkWZIgEnZRA5Zt840BE3S7eObb5pxFRo0MONtRETA44/DjBkkHz7JmDEwbx7m3eeNNzj63Xfcf//9tKv7DzXOrzOjfAGUKQMREZRcvBgnIKVOHb6zb8GnVW2OV27DivXrKVu2LPtPn+bP4GAcgoJw9PPD1dWVykePAnA+IIAB8UWw210YWNWFXxYv5iU5UiXBg1P9+5txeapW5b99+/J2fDyMH8/WgE60cy/OigUL2L9uHS2efDIzDtHu3fC+/S3G7noQJycPDu3wxp8zbGcceyLDGUUHElNd8fa2ExVXhmSqUbGiwVR/H/Z4edF3ekcmlUgjOjqa559/HviQd0Z7cDQ8iCJFauHgkP1PPSOOj5eXV75GT9279+JDRU5v4gMHDqR69erZHjtxwgyz8dhj4OV1k0RaWEChLUkdBezDvPHPxBwyWgnsSt/3A+B5vfMUyPBR6dJ6qvIq+ftf3BUUFKRevXrlvlGbzVzj6O5+cdlnRlY3UPjDD0s220Vt7dtLdepcrD96tFl2586L+0JDdQZ/1Q2MzFxCmfDzCgl0qmxZ3QWqzVw9ZMwyh6MkKSJC8eketaN5U/c0Oy5wlYODTW++Ke3sPVwxeOuHT3/Q/PlH9PRgc7JzyQ/L9UTAAv3j0lD969TRGpqbTrl0UtJPP8nfP05tjU8lkN0wtL9bN9kjIyXD0DbqCaRuXb7Sjnr1FNW1q7Zs2SJJWrZsv8CMKnFX8y56PShI5V1OqLfvH2rn3VQ9GCTopJIlt+vRRy8ILsjf/6Q6d5Zq1qypIkWKSJLatPlWLi7PadeuSDk5Sa1b/ytwUvWsS1KzITw8XKdPn87993kdsv7GDhzI/JpveM2AZP58mjeXliy5cW23Epau3HFHrD66mVu+G4Xz5yVQh8qHMpej/vvvvwI0adKk69dPTpaWLbs4F7B798U7w+LF5r4335QcHTU1/SZt799fb7zyit5+40294PKVZrednHm6ffukZwed14kT5y5ppn/XdQJp6FAzZ+zkbosz2xnl6alTjo76y8NDYWFhmjt3rmw2m/o1bqz9tWqrkscJtWtnV4MGDeTsHKaePW0KLpsgkF592abHH5datJDSIqKVWqSIBjIlfbnlU3o/+B2BtGfmVikuTm+/LTVr9Kl6uvRTaR/zhrx7927Za9dRW/6Qn3eyYjbtN2OFZPFZaNr0R4E0ceJS1QaFUcF8f+9idfEeKwObKhYLliRt2RIpqCZn51S99JK0a9cujR07VpLUtWuyfHzS1L+/+fHr1esrQC1atLj+d5UPZP2NJSVd/OpvdIXOzeBOu8nlN3eaLssoZEOOLuamTRKoetnzSs+TrYEDB8rDw0Pnzp27dl3p4vrudAcnffml+d7FRRo4UDExMUq+916pTh2dj4lRzIgREug/JUtqeMuWKsUJDWh5IPN0gweb1StVClZSUpLmzp2rbt26ycFhg2CTPvroYzVsKL1S/n9SnTqqW7WqxtZrqlg81adEcwUFrZNhtNDBg4d0+vRpbdhgz5S3aNEilSu3TaVLR2no0DXKcDT29TXv4YmJ0r9PvaRDi9YKNgt2af+GHdq1JCzrsvV0p74e5pr4VlvUsKHUomyYQPr04zRFRkqXz/nWrXtWsFuA6tSpo/frzTU7RF//o68+nikHAnTXXXfJZrNp8+bNgnICM0tq1u9y3z7T9QGkdu2k+Ph41a5dWz169Lj+d5UPXP4byzAKtwJ32k0uv7nTdFlGIRtydDG//152kIe7TcOHSxEREXJzc9PTTz+dozZs//1Am2l4cYXNww9LZcqYDlslSqhZ48Y65+IiPfFEZp3EsWNV28FB/ctPF0i+HutlS18xVLWqdNdd0ZoyZYpCQ6X77tsgCBDY9JDLaM0tU0ZJcamSp6d+aPutYJJ+LPagQJo6JUXe3qYRqFrVdB+oXdv0T8uwbyNGSIaRrHvvbZ+ZSB3MNIAg3X13hCSpVKmvBLbM0aispKWladKkr1S+vJmAvXJlqVZNu5o2StWxY2ZaxAkTLpY/fNh0ku3YcZNKlSpl9iyiorX/ze8zHdCeeuopvfLKK3JyclKLFm0EiwWZaWov+S7PnDEv56ZNStdaSoMGDcrR93Wzufw31rv31VM+FjR32k0uv7nTdFlGIRtydDFff12Rjv4C6ZNPpAkTJgjQ7t27c9TGp/csMJey/m43h5IuXDDnA2bPlr1ePT3bt68mDxyoQwsX6vnnn1ffvn1Vt25dgYOquplOVz4+Z5WQkKAjR1IFUv/+2ySZPl9+flLv3iECaXqN/nrXMBST7oE9ouM6ebvu08e8KDCdlqKjzV5B7drmN1+mjOngnMG0aUp/Ao/Thg1Kb9+UPmuWNGmSOeQzd645TPXgg9L8+dl/9rVrzYCjGWFBMpg40RxF27DB9Lx9+WXTUBw7Zi7jvJz4+Hjt2rVLycnJ8vT0lJeXd6axygjPcLXv0m63C9CArKFtC5Bb9UYi3braLF25wzIKBW0UevbU1gq9BOZ8cL9+/VSxYsVr19m+XerVS0pK0oxmXwikZ9uEmJm5//xTkpSWkKyPP7Sle+ba9cUXXwhQ48b3CFarhsNI2UEvNlgjFxe77r67pWrU+K9AGj36Z0nmNMWZM6au7t2lDRs2yhEUWbGiVLy47JFRkt2uF7qFydPzUq9Ym80M7Bcbe6n0desu9g5SU00P1SefvPKaZbhPgNSnz/UvY3ZMmiQVLSp5e5vG5Wr88MMPArR3714FBQWlr933U2JiUuZnutZ3GRISovM3w/EgD9yqNxLp1tVm6codd4RH823Fvn2E+z8KR8zlhEePHs1cy35Vpk2DBQsgNpZHXeeytHg15u9qzWcDBvDjoRbE7YMqVVx46RUoFf4P57/rzAtxcbi7u1O//kg2b25Na23HGDSIyvVakPKCgaNjaUJC/IFoHnigMmCuVPX3h549zc1ub8RLJUrgd/gwmjOHSLuNEobB/uSKVK16aQ5cB4eLq1yzUrXqxb+dnMyE6EWLXlnOxweqVzevybRpub6qAHTuDBMmmFkwhw27erl69eoRGBiIj48PAQEBhIWF0bRpMG5uOUtwf7UlnRYWFtlTGH4KtwepqXDwYKaPQrlyEB4eTrmMxeZX49NPwW4nxacEiSeieajyNs5GOvJdtQ8Y8bYr8+fDvffa8PW9l3t+6E635GTsdjs1a9YkIqIZcA7/Hutg0iTKVzS/nurVOwL34uz8D1WqBGfbrIODA+937QpPPME8w6BixYq0arWR33+HnKZ8KFYMhg+/GLWhbFm4Wh765s3NXLa5zVOfQcWKphvGwoXQrNnVy9WsWZPw8HBKlSqFv78/tWrVYsOGDXlr1MLC4rpYRuFqHDgAqakcdQrC3R18fdM4ceLE1Y1CRqYWCc6d48/55/E+uJUSZVzw8oKnnoKoqDTeey+Z7du3ExOzijUffsj7D4wBNhIU1Ia///bhnnuSaDb4CXBzy3R2Mow2QEWCgo5e1QkLwG3aNJg2jfvvv5/PPvuMmjUbAVChQs4/9scfQ+vW1y9XsiRER5uJ6/NK6dLQo8elvZhrERAQwNmzZ/PeoIWFxXWxjMLVSH9cDjfKU64cnDp1ErvdfqVRkEzv3RIliHjsZWIr1gU/PyrOG88rfEiDOml8+y00bDgPm60C58//zu7dprN2/bvvpmLtFkBVli17h4gIGDy4FG5uboCZ2x1g5Uqzza5dPXIk3dXVlYEDB1K7thm47GaEbbicl16CIUOgfv2bf+6rkWEUxowZU3CNWlj8P8MyClfjzz+hQgXCozwzh46AS+cUkpLghRfg888hNZWms4dROnw9/X1/xi9kLWNdR1GkfHECAlaxdWtf4AR79uwhJCQEFxcXgoKCGDasLt26zSQ+vgiOjtCx48XTe3ubT+SnTxtUrWpn3LjHc/URnnoKPvrItFk3m2LF4IsvII9BW/OEv78/YC6OsLCwyB+siebssNnMnkLv3hz9Gbp1u2gUMnsKu3aZB44eheHDSRs4mMO1gwj2jWRVQnOi07zxT0wEu50RzZoRFBREYmIiu3fvJjY2lipVquDk5ISTkxNLljzPggVm5OjLJ3ZPnjSHVySHHA+zZODsbD7R3ykEBAQAZmhqCwuL/MEyCtmxbRvExJDU8j7OTOWSnkJgRlS8KVPgzBlYsYJNnp58+P6XwGe8+H4xnjv0Mny7CoAjx46xZcsWJkyYwMqVK9m9ezfx8fHUv2zcpVeva0vKx1httw01a9Zk2LBheFkR4Cws8g3LKGTHihUAHK/aFjCNwsaN4fj5+VEkY7nN+PHw8stQrhyP16jB3r3m+L1/gAPYK0JCAnTrxoHBg/H19aVHjx5UrlyZ06dPM2TIEPr165cjKf36wZw55qRudstD/z9Ro0YNJk6cWNgyLCzuaCyjkB0bNkC1ahyNLw6YE77z5l22HNXVNTMWss1mw8wRBCVKAG4VzTK//EL7pUuJiIjAycmJ4OBgdu7cid1up0YO4ye/9JK5fNPX92Z9OAsLC4urY000Z8fx41CxIukjRtn7KIwYAStXAvD2229jJpIzHcqoaBoF+48/gmHg5GTaXpvNxty5c4GcO1U1bgz//a81fGRhYVEwWEYhO06dglKlOHrUvBmXLXuZUYiLMzOcbNsGwCOPPELnzo8DYBiRmY4Bu5cupVq1apw4cQKAlJQUxowZg6OjI1Vy6lFmYWFhUYBYw0eXY7OZE8ilShEeDqVKQWLiec6fP3/RKHh6Qmws2GwcOHCA1NRU2rYN4tdf57J1q43q1R8GoNqyZdRu146i6ZMB7u7uLFy4kDp16mT6IlhYWFjcSlhG4XIiI03DUKoU4RvMoaOMJ/2yZcteLGcY4OTEhAkTWLBgAWfPnuWjj9rw3nvutGvXhpILFuBStizzGje+5PQ9evQoyE9jYWFhkSus4aPLOXnSfE0fPjK9mU8BULp0afPYggXokUchMZGRI0cyZ84cDMORBQsW0LhxY3x9faFnTxJr1SqkD2FhYWGRN6yewuWkGwB7ydIcO2ZGID117BhTgHLx8WaZf/7h0zkl2KKFODn3Q6rE6NHg49OUpUtnZ54qKCiIPn368NlnnxXCB7GwsLDIPZZRuJx0oxDhUobkZLOnkLhrF08Btrfegk6d4MgR1hh9+GXeXbz+ujmS1LQpuLmB3W5nypQplCxZktOnT1OqVKnC/TwWFhYWucAyCpeTbhTOYIZUKFkSwv825xQcR40CQEeOsC+tIv5lEkjflQUHRo0aRZkyZQCoVKlSgci2sLCwuBlYcwqXc/IkFCtGbJILYCaUSUqfaMbPD4C0Q4c4RiWqV3cGzNQLR4+arwD//vsvr732GgDBwdnnP7CwsLC4FbGMwuWcOgWlSxMba7719oa0M2fMN488AmvWEHfeIJ7i3H23P4cOgYuL6ZowZYpZzN/fn7CwMMDqKVhYWNxeWEbhctId17IaBSM62nyTnAzjx3MI80Zfv74XGfHxIN2bGTh+/DgjRowAwMfHp6CUW1hYWNwwllG4nMuMgpeXcIiJwQ5w+DDavZtFhumNHBxs9hIyyDAK7u7uBSrZwsLC4mZhGYWsSFcYhbS0aHxsNlLc3WHFCozwcBbJ7CkEBV1avYQZ/gi/9LmHFi1aFJRyCwsLi5uCtfooK1FR5mxx6dIcORAN+DJx4hiaAqk+PrgdOoTN0ZG9tmBKlkzF3d2caL7rLjMJfYZRADh//jwuWbsRFhYWFrcBhWIUDMMYDjwJCNgFPIEZe3oOUAzYBjwqKaVAhaUvR6VUKU6sugA4MG3aFGKBZl274vXss0xOTcX1jepUq3bx0i1ZAn/9lbk4CQDv/EiMbGFhYZHPFPjwkWEYZYChQCNJtQBH4CFgHPCJpMrAOWBQQWvj3DnztVgxIiOTgVguXLjAdMD22mvg4MAzL77IhQtNWLDgYixrPz/T89nCwsLidqew5hScAHfDMJwAD+AUcC/wU/rx74GCjxyXEcaiSBGio22AObHgBZRKzw8M4OhoZUGzsLC4MylwoyDpBPAhEI5pDM4DW4EYSWnpxY4DZQpaG3Fx5qunJ+fPg5NTAuXLl+c44PLGu2zYsIcKFTrTvftpDh0qcHUWFhYW+U6BzykYhlEUuB+oCMQA84BO2RTVVeoPBgYDBAQEsHr16jzpiIuLu6Juya1bqQZs2LWL8+fr4OycxP3duzP7j5W8PHksLUL3U6RITVatKso//2zk2LHEPLWdF223Apau3HGr6oJbV5ulK3fkiy5JBboBfYCpWd4/BnwFRAJO6fuaA8uvd66GDRsqr6xaterKnZMmSSCdOSM3tzCVLLlGkmSzSR9/LK1cebGo3Z7npvOm7RbA0pU7blVd0q2rzdKVO/KqC9iiq9xXC2NOIRxoZhiGh2EYBtAWCAFWAQ+klxkALC5wZVmGj1JS3PD2NiAhgZnjT/H228LF5XhmUStnsoWFxZ1IYcwpbMScUN6GuRzVAfgWeA14yTCMg4AfMLWgtREfD4ZBmrMzdrsnRYs6wtatnHz9M+LjDVq06M/dd5/j448LXJmFhYVFgVAofgqS3gXevWx3GNCkEORcJC4OihThxMkzQFmKF3eBqOOcJD3jGmtYtw5atSpMkRYWFhb5hxXmIivx8VCkCAcPngagZEl3iIriJKVx4GxmsWrVCkughYWFRf5iGYWspBuFQ4ciAChd2ivTKMAOihZNAqBq1ULUaGFhYZGPWEYhK3Fx4OnJ0aOmZ3PZst4QHc1JSmPnJNWrm24UllGwsLC4U7EC4mUlvadw7Nh5wDQKWn+WU5QCTtGzpyt2u+XNbGFhcedi9RSykm4UTp40l6b6ekPU8i2k4kLRoom88ooz69cXskYLCwuLfMQyCllJHz6KjDSDs3of3sHJ9MCpZcpYl8rCwuLOxxo+ykp6TyEmxg6A98pFpLik4cl31KhRyNosLCwsCgDLKGQl3U/hwgXTXdn7tWfx6dWI+a6u+PvXK2RxFhYWFvmPZRSyEh8Pnp7Ex5tDRV6VS5JYrhttXc1w2RYWFhZ3OtZAeQZ2OyQkYHd3p3qyG55cwDHiNIMGnaN48SSSk5MLW6GFhYVFvmMZhQwSE0EiwcGBaLxxc00B//9r795j5CrrMI5/n91ul+52Sy1tgXBpS10bSyKlNA2oYKKiLREqmggNCVVIQKIB4iVASAxE/wG8BWgkJVbQoBCjxCZWhTQVNdoi1Ja2gUILBWuXLV3tZac3WH7+cd6zDpudhV2Yc8bM80kmc+ad2Z1n33P2/OZc5j3TaW39Lfv23VJ2OjOzQrgo5NJV1yrAK0yibco4aGlh+fKL2bDhStrb28vNZ2ZWABeFXF4UDh1iIp1M7Awi4OWXj6e7++ySw5mZFcNFIZeupRA7drCADrpajrJ69XrOOgvuuadScjgzs2K4KOTSloJ6eqjQQee0Th544I8AzJ7tk7TMrDm4KOTSlkJ7by/76GDS5PGsXfsSAHPm+HiCmTUHF4FvktcAAAgISURBVIVc2lLo2ruX/XQwMHCQvr6JAMyYUWYwM7PieL9ILhWFSf39HKKTXbu20dIym66uN5k82bXTzJqDi0Iu7T4COKoOduzYzPTpCznpJBcEM2seXuPlKv87w+iNmMDhw32MH9/NzJnlRTIzK5qLQi4VhdcZR9DGccdBX1+Xi4KZNRUXhVx/P7S2cpgJAEybNpVKRS4KZtZUXBRy6VoK17ZPAWDu3NP5yU9g0aKSc5mZFcgHmnP9/cSkSTy8K6uTS5cuYtmykjOZmRXMWwq5SoWB1lbm0wHAkSOwbh0cO1ZyLjOzArko5CoVOHiQ76aisGLF05x3Hhw4UHIuM7MCuSjkKhX2dHZyfSoKF14oVq+GKVNKzmVmViAXheTY/v1s3b2b4xZ8DIBLL53P4sXQ4h4ysyZS+CpP0hxJG6tuByTdKOk2Sf+qar+oyFyvvfIKnQMDXHXO+QBs3Pgma9cWmcDMrHyFF4WI2BYR8yJiHnAOcAh4ND39g/y5iFhdaLBKhQ+2tdHyhz8DcNdd+7n99kITmJmVruydI58AdkTEyyXnoG1ggFaJg+oE4MiRdqZNKzmUmVnBFBHlvbm0EtgQEfdKug34InAAeAr4ekT8Z5ifuQa4Jj2cA2wb49tPBfaO8WfrrVGzOdfoNGouaNxszjU6Y801IyKG/dhbWlGQNB7YDZwZEb2STiT74wL4NnByRFxVx/d/KiIW1Ov3vxuNms25RqdRc0HjZnOu0alHrjJ3Hy0m20roBYiI3ogYiIg3gfuBhSVmMzNrSmUWhaXAL/IHkk6ueu5SYEvhiczMmlwpYx9J6gAuBK6tar5T0jyy3Uc7hzxXDyvq/PvfjUbN5lyj06i5oHGzOdfovOe5Sj3QbGZmjaXsU1LNzKyBuCiYmdmgpiwKkhZJ2iZpu6SbS8xxmqS1kp6VtFXSDam91CE/Uoadkjan938qtU2R9LikF9L9+0rI1TDDpEhaKWmPpC1VbcP2kTJ3p2XuGUnzC851l6Tn0ns/Kmlyap8p6XBVv91XcK6a803SLam/tkn6dL1yjZDtkapcOyVtTO1F9lmtdUT9lrOIaKob0ArsAM4AxgObgLklZTkZmJ+mu4DngbnAbcA3Su6nncDUIW13Ajen6ZuBOxpgXr4KzCijz4ALgPnAlrfrI+Ai4HeAgHOB9QXn+hQwLk3fUZVrZvXrSuivYedb+j/YBLQDs9L/bGuR2YY8/z3gWyX0Wa11RN2Ws2bcUlgIbI+IFyPiGPAwsKSMIBHRExEb0vRB4FnglDKyvENLgAfT9IPAZ0vMAiUPkxIRfwL+PaS5Vh8tAX4amXXA5CGnYdc1V0Q8FhFvpIfrgFPr8d6jzTWCJcDDEXE0Il4CtlPH7y6NlE2SgC9QdQp9UUZYR9RtOWvGonAK8M+qx7togBWxpJnA2cD61PTVtPm3sozdNGSnBj8m6WllQ4sAnBgRPZAtrMD0EnJVu5y3/qOW3WdQu48aabm7iuzTZG6WpH9IekLS+SXkGW6+NVJ/nQ/0RsQLVW2F99mQdUTdlrNmLAoapq3U83IlTQR+BdwYEQeAHwGzgXlAD9mma9E+EhHzyb55/hVJF5SQoSZlw6RcAvwyNTVCn42kIZY7SbcCbwAPpaYe4PSIOBv4GvBzSZMKjFRrvjVEfyVv+aItJfTZMOuImi8dpm1U/daMRWEXcFrV41PJxmAqhaQ2spn9UET8GhpjyI+I2J3u95ANbb4Q6M03RdP9nqJzVWnUYVJq9VHpy52kZcBngCsi7YBOu2f60vTTZPvuP1BUphHmW+n9BSBpHPA54JG8reg+G24dQR2Xs2YsCn8HuiXNSp82LwdWlREk7av8MfBsRHy/qr3UIT8kdUrqyqfJDlJuIeunZelly4DfFJlriEYdJqVWH60Crkxnh5wL7M83/4sgaRFwE3BJRByqap8mqTVNnwF0Ay8WmKvWfFsFXC6pXdKslOvJonJV+STwXETsyhuK7LNa6wjquZwVcQS90W5kR+ifJ6vwt5aY46Nkm3bPABvT7SLgZ8Dm1L6KbMTYInOdQXbmxyZga95HwAnAGuCFdD+lpH7rAPqA46vaCu8zsqLUA7xO9gnt6lp9RLZZvzwtc5uBBQXn2k62rzlfzu5Lr/18msebgA3AxQXnqjnfgFtTf20DFhc9L1P7A8CXh7y2yD6rtY6o23LmYS7MzGxQM+4+MjOzGlwUzMxskIuCmZkNclEwM7NBLgpmZjbIRcFsBJIG9NZRWd+zUXXTaJu+7Kw1lFIux2n2f+RwRMwrO4RZUbylYDYGaXz9OyQ9mW7vT+0zJK1JA7ytkXR6aj9R2XUMNqXbh9OvapV0fxor/zFJE0r7o8xwUTB7OxOG7D66rOq5AxGxELgX+GFqu5ds6OIPkQ06d3dqvxt4IiLOIhu3f2tq7waWR8SZwD6yb8ualcbfaDYbgaT+iJg4TPtO4OMR8WIasOzViDhB0l6yoRpeT+09ETFV0mvAqRFxtOp3zAQej4ju9PgmoC0ivlP/v8xseN5SMBu7qDFd6zXDOVo1PYCP81nJXBTMxu6yqvu/pem/ko28C3AF8Jc0vQa4DkBSa8HXLDB7x/ypxGxkE5Qu2J78PiLy01LbJa0n+3C1NLVdD6yU9E3gNeBLqf0GYIWkq8m2CK4jG5XTrKH4mILZGKRjCgsiYm/ZWczeS959ZGZmg7ylYGZmg7ylYGZmg1wUzMxskIuCmZkNclEwM7NBLgpmZjbovwwyzOXFf6DRAAAAAElFTkSuQmCC\n",
      "text/plain": [
       "<Figure size 432x288 with 1 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "import pickle\n",
    "import matplotlib.pyplot as plt\n",
    "import matplotlib\n",
    "\n",
    "# train_accuracy_Relu = pickle.load(open('./plot/CIFAR10_CNN_ReLU_v2_train','rb'))\n",
    "# test_accuracy_Relu = pickle.load(open('./plot/CIFAR10_CNN_ReLU_v2_test','rb'))\n",
    "\n",
    "# train_accuracy_qXsquare2 = pickle.load(open('./plot/CIFAR10_NiN_Poly_v1_train','rb'))\n",
    "# test_accuracy_qXsquare2 = pickle.load(open('./plot/CIFAR10_NiN_Poly_v1_test','rb'))\n",
    "\n",
    "# train_accuracy_qXsquare = pickle.load(open('./plot/CIFAR10_CNN_Xsq_train','rb'))\n",
    "# test_accuracy_qXsquare = pickle.load(open('./plot/CIFAR10_CNN_Xsq_test','rb'))\n",
    "\n",
    "\n",
    "stt_pos = 0\n",
    "end_pos = 200\n",
    "\n",
    "print(test_accuracy_Relu[49], test_accuracy_Relu[end_pos-1])\n",
    "print(test_accuracy_qXsquare2[49], test_accuracy_qXsquare2[end_pos-1])\n",
    "print(test_accuracy_qXsquare[49],  test_accuracy_qXsquare[end_pos-1])\n",
    "\n",
    "plt.plot(np.array(train_accuracy_Relu[stt_pos:end_pos])*100,'k')\n",
    "plt.plot(np.array(test_accuracy_Relu[stt_pos:end_pos])*100,'k',linestyle='-.')\n",
    "\n",
    "plt.plot(np.array(train_accuracy_qXsquare2[stt_pos:end_pos])*100,'r')\n",
    "plt.plot(np.array(test_accuracy_qXsquare2[stt_pos:end_pos])*100,'r',linestyle='-.')\n",
    "\n",
    "plt.plot(np.array(train_accuracy_qXsquare[stt_pos:end_pos])*100,'b')\n",
    "plt.plot(np.array(test_accuracy_qXsquare[stt_pos:end_pos])*100,'b',linestyle='-.')\n",
    "\n",
    "\n",
    "# plt.plot(acc_Brea,'b')\n",
    "# plt.plot(acc_FedAvg_,'b',linestyle='-.')\n",
    "plt.grid(True)\n",
    "plt.xlabel('Epoch')\n",
    "plt.ylabel('Accuracy(%)')\n",
    "\n",
    "plt.legend(['Train, VGG11-ReLU','Test,  VGG11-ReLU','Train, VGG11-Poly','Test,  VGG11-Poly' ,'Train, VGG11-Quad','Test,  VGG11-Quad' ])\n",
    "plt.ylim([75,105])\n",
    "plt.savefig('./plot/accuracy_CIFAR10_VGG11_BN_E'+str(end_pos)+'.png',dpi=300)\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 2. Without Batch Normalization"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "qVGG_xsquare2_woBN(\n",
       "  (features): Sequential(\n",
       "    (0): QuantConv2d(\n",
       "      3, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (1): QuantXsquare2(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare2)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (2): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (3): QuantConv2d(\n",
       "      64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (4): QuantXsquare2(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare2)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (5): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (6): QuantConv2d(\n",
       "      128, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (7): QuantXsquare2(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare2)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (8): QuantConv2d(\n",
       "      256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (9): QuantXsquare2(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare2)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (10): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (11): QuantConv2d(\n",
       "      256, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (12): QuantXsquare2(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare2)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (13): QuantConv2d(\n",
       "      512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (14): QuantXsquare2(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare2)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (15): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (16): QuantConv2d(\n",
       "      512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (17): QuantXsquare2(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare2)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (18): QuantConv2d(\n",
       "      512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)\n",
       "      (weight_reg): WeightReg()\n",
       "      (weight_quant): WeightQuantProxy(\n",
       "        (tensor_quant): RescalingIntQuant(\n",
       "          (int_quant): IntQuant(\n",
       "            (float_to_int_impl): RestrictValue(\n",
       "              (forward_impl): RecursiveScriptModule(\n",
       "                original_name=Sequential\n",
       "                (0): RoundSte()\n",
       "                (1): Identity()\n",
       "              )\n",
       "            )\n",
       "            (tensor_clamp_impl): TensorClampSte()\n",
       "          )\n",
       "          (scaling_impl): ParameterStatsScaling(\n",
       "            (parameter_list_stats): ParameterListStats(\n",
       "              (first_tracked_param): _ViewParameterWrapper()\n",
       "              (stats): Stats(\n",
       "                (stats_impl): AbsMax()\n",
       "              )\n",
       "            )\n",
       "            (stats_scaling_impl): StatsScaling(\n",
       "              (affine_rescaling): Identity()\n",
       "              (restrict_scaling): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "              (restrict_scaling_preprocess): LogTwo()\n",
       "            )\n",
       "          )\n",
       "          (int_scaling_impl): IntScaling(\n",
       "            (forward_impl): SignedFpIntScale()\n",
       "          )\n",
       "          (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "        )\n",
       "      )\n",
       "      (bias_quant): BiasQuantProxy()\n",
       "    )\n",
       "    (19): QuantXsquare2(\n",
       "      (act_quant_proxy): ActivationQuantProxy(\n",
       "        (fused_activation_quant_proxy): FusedActivationQuantProxy(\n",
       "          (activation_impl): RecursiveScriptModule(original_name=act_xsquare2)\n",
       "          (tensor_quant): RescalingIntQuant(\n",
       "            (int_quant): IntQuant(\n",
       "              (float_to_int_impl): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): RoundSte()\n",
       "                  (1): Identity()\n",
       "                )\n",
       "              )\n",
       "              (tensor_clamp_impl): TensorClamp()\n",
       "            )\n",
       "            (scaling_impl): StandaloneScaling(\n",
       "              (restrict_value): RestrictValue(\n",
       "                (forward_impl): RecursiveScriptModule(\n",
       "                  original_name=Sequential\n",
       "                  (0): PowerOfTwo()\n",
       "                  (1): ClampMin()\n",
       "                )\n",
       "              )\n",
       "            )\n",
       "            (int_scaling_impl): IntScaling(\n",
       "              (forward_impl): UnsignedFpIntScale()\n",
       "            )\n",
       "            (msb_clamp_bit_width_impl): BitWidthConst()\n",
       "          )\n",
       "        )\n",
       "      )\n",
       "    )\n",
       "    (20): AvgPool2d(kernel_size=2, stride=2, padding=0)\n",
       "    (21): AvgPool2d(kernel_size=1, stride=1, padding=0)\n",
       "  )\n",
       "  (classifier): Linear(in_features=512, out_features=10, bias=True)\n",
       ")"
      ]
     },
     "execution_count": 23,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from torch.nn import Module\n",
    "import torch.nn.functional as F\n",
    "import brevitas.nn as qnn\n",
    "from brevitas.core.quant import QuantType\n",
    "\n",
    "bit_width_sel = 8\n",
    "\n",
    "class qVGG_xsquare2_woBN(nn.Module):\n",
    "    def __init__(self, vgg_name):\n",
    "        super(qVGG_xsquare2_woBN, self).__init__()\n",
    "        self.features = self._make_layers(cfg[vgg_name])\n",
    "        self.classifier = nn.Linear(512, 10)\n",
    "\n",
    "    def forward(self, x):\n",
    "        out = self.features(x)\n",
    "        out = out.view(out.size(0), -1)\n",
    "        out = self.classifier(out)\n",
    "        return out\n",
    "\n",
    "    def _make_layers(self, cfg):\n",
    "        layers = []\n",
    "        in_channels = 3\n",
    "        for x in cfg:\n",
    "            if x == 'M':\n",
    "                #layers += [nn.MaxPool2d(kernel_size=2, stride=2)]\n",
    "                layers += [nn.AvgPool2d(kernel_size=2, stride=2)]\n",
    "            else:\n",
    "                layers += [qnn.QuantConv2d(in_channels, out_channels=x, kernel_size=3, padding=1, weight_quant_type=QuantType.INT, \n",
    "                                     weight_bit_width=bit_width_sel),\n",
    "#                            nn.BatchNorm2d(x),\n",
    "                           qnn.QuantXsquare2(quant_type=QuantType.INT, bit_width=8, max_val=6)]\n",
    "                in_channels = x\n",
    "        layers += [nn.AvgPool2d(kernel_size=1, stride=1)]\n",
    "        return nn.Sequential(*layers)\n",
    "    \n",
    "    \n",
    "                    \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "Learning rate= 0.1\n",
      "\n",
      "0 tensor(2.3044, device='cuda:0')\n",
      "100 tensor(2.3018, device='cuda:0')\n",
      "200 tensor(2.3001, device='cuda:0')\n",
      "300 tensor(2.3004, device='cuda:0')\n",
      "Iteration: 1 | Loss: 2.30263614654541 | Train,Test accuracy: 0.08763586729764938.3f%, 0.09009098261594772.3f%\n",
      "0 tensor(2.3036, device='cuda:0')\n",
      "100 tensor(2.3013, device='cuda:0')\n",
      "200 tensor(2.3013, device='cuda:0')\n",
      "300 tensor(2.3026, device='cuda:0')\n",
      "Iteration: 2 | Loss: 2.302642345428467 | Train,Test accuracy: 0.08751998841762543.3f%, 0.09009098261594772.3f%\n",
      "0 tensor(2.3027, device='cuda:0')\n",
      "100 tensor(2.3035, device='cuda:0')\n",
      "200 tensor(2.3063, device='cuda:0')\n",
      "300 tensor(2.3026, device='cuda:0')\n",
      "Iteration: 3 | Loss: 2.3026182651519775 | Train,Test accuracy: 0.08734414726495743.3f%, 0.09009098261594772.3f%\n",
      "0 tensor(2.3024, device='cuda:0')\n",
      "100 tensor(2.3025, device='cuda:0')\n",
      "200 tensor(2.3034, device='cuda:0')\n",
      "300 tensor(2.3017, device='cuda:0')\n",
      "Iteration: 4 | Loss: 2.302621603012085 | Train,Test accuracy: 0.08758791536092758.3f%, 0.09009098261594772.3f%\n",
      "0 tensor(2.3008, device='cuda:0')\n",
      "100 tensor(2.3007, device='cuda:0')\n",
      "200 tensor(2.3030, device='cuda:0')\n",
      "300 tensor(2.3017, device='cuda:0')\n",
      "Iteration: 5 | Loss: 2.302657127380371 | Train,Test accuracy: 0.08815137296915054.3f%, 0.09009098261594772.3f%\n",
      "0 tensor(2.3001, device='cuda:0')\n",
      "100 tensor(2.3035, device='cuda:0')\n",
      "200 tensor(2.3022, device='cuda:0')\n",
      "300 tensor(2.3025, device='cuda:0')\n",
      "Iteration: 6 | Loss: 2.302640199661255 | Train,Test accuracy: 0.08793958276510239.3f%, 0.09009098261594772.3f%\n",
      "0 tensor(2.3041, device='cuda:0')\n",
      "100 tensor(2.3057, device='cuda:0')\n",
      "200 tensor(2.3028, device='cuda:0')\n",
      "300 tensor(2.3024, device='cuda:0')\n",
      "Iteration: 7 | Loss: 2.3026580810546875 | Train,Test accuracy: 0.08761189132928848.3f%, 0.09009098261594772.3f%\n",
      "0 tensor(2.3022, device='cuda:0')\n",
      "100 tensor(2.3015, device='cuda:0')\n",
      "200 tensor(2.3038, device='cuda:0')\n",
      "300 tensor(2.3027, device='cuda:0')\n",
      "Iteration: 8 | Loss: 2.3026483058929443 | Train,Test accuracy: 0.08780370652675629.3f%, 0.09009098261594772.3f%\n",
      "0 tensor(2.3050, device='cuda:0')\n",
      "100 tensor(2.3025, device='cuda:0')\n",
      "200 tensor(2.2994, device='cuda:0')\n",
      "300 tensor(2.3006, device='cuda:0')\n",
      "Iteration: 9 | Loss: 2.302640199661255 | Train,Test accuracy: 0.08801150321960449.3f%, 0.09009098261594772.3f%\n",
      "0 tensor(2.3038, device='cuda:0')\n",
      "100 tensor(2.3020, device='cuda:0')\n",
      "200 tensor(2.2991, device='cuda:0')\n",
      "300 tensor(2.3030, device='cuda:0')\n",
      "Iteration: 10 | Loss: 2.302628755569458 | Train,Test accuracy: 0.08771979063749313.3f%, 0.09009098261594772.3f%\n",
      "0 tensor(2.3037, device='cuda:0')\n",
      "100 tensor(2.3009, device='cuda:0')\n",
      "200 tensor(2.3058, device='cuda:0')\n",
      "300 tensor(2.3035, device='cuda:0')\n",
      "Iteration: 11 | Loss: 2.302602529525757 | Train,Test accuracy: 0.08798753470182419.3f%, 0.09009098261594772.3f%\n"
     ]
    },
    {
     "ename": "IndexError",
     "evalue": "index 10 is out of bounds for axis 0 with size 10",
     "output_type": "error",
     "traceback": [
      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[1;31mIndexError\u001b[0m                                Traceback (most recent call last)",
      "\u001b[1;32m<ipython-input-27-9a3c1db1a2ea>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m\u001b[0m\n\u001b[0;32m     86\u001b[0m               \"Train,Test accuracy: {0}.3f%, {1}.3f%\".format(train_accuracy/len(trainloader), test_accuracy/len(testloader)) )\n\u001b[0;32m     87\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m---> 88\u001b[1;33m         \u001b[0mtrain_accuracy_qXsquare2_woBN\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mlr_idx\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mepoch\u001b[0m\u001b[1;33m]\u001b[0m \u001b[1;33m=\u001b[0m \u001b[1;33m(\u001b[0m\u001b[0mtrain_accuracy\u001b[0m\u001b[1;33m/\u001b[0m\u001b[0mlen\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mtrainloader\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m     89\u001b[0m         \u001b[0mtrain_loss_qXsquare2_woBN\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mlr_idx\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m[\u001b[0m\u001b[0mepoch\u001b[0m\u001b[1;33m]\u001b[0m \u001b[1;33m=\u001b[0m \u001b[1;33m(\u001b[0m\u001b[0mtrain_loss\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     90\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;31mIndexError\u001b[0m: index 10 is out of bounds for axis 0 with size 10"
     ]
    }
   ],
   "source": [
    "# net = DNNCifar(args=args).to(args.device)\n",
    "\n",
    "lr_array = [0.1, 0.01, 0.001, 0.0001]\n",
    "Max_iter = 10\n",
    "\n",
    "train_accuracy_qXsquare2_woBN = np.zeros((len(lr_array), Max_iter))\n",
    "train_loss_qXsquare2_woBN     = np.zeros((len(lr_array), Max_iter))\n",
    "test_accuracy_qXsquare2_woBN  = np.zeros((len(lr_array), Max_iter))\n",
    "test_loss_qXsquare2_woBN      = np.zeros((len(lr_array), Max_iter))\n",
    "\n",
    "\n",
    "for lr_idx in range(len(lr_array)):\n",
    "    \n",
    "    cur_lr = lr_array[lr_idx]\n",
    "    \n",
    "    print()\n",
    "    print('Learning rate=', cur_lr)\n",
    "    print()\n",
    "    \n",
    "    criterion = nn.CrossEntropyLoss()\n",
    "    optimizer = optim.Adam(net.parameters(), lr=cur_lr, weight_decay=3e-4)\n",
    "\n",
    "    # optimizer = optim.SGD(net.parameters(), lr=0.05, momentum=0.9, weight_decay=0.0001)\n",
    "    \n",
    "    \n",
    "\n",
    "    net = qVGG_xsquare2_woBN('VGG11')\n",
    "    net.cuda()\n",
    "\n",
    "    for epoch in range(200):\n",
    "\n",
    "#         if epoch <= 80:\n",
    "#             cur_lr = 0.001\n",
    "#         elif epoch <= 140:\n",
    "#             cur_lr = 0.0005\n",
    "#         else:    \n",
    "#             cur_lr = 0.0001\n",
    "    #     else:\n",
    "    #         cur_lr = 0.0004\n",
    "\n",
    "#         for g in optimizer.param_groups:\n",
    "#             g['lr'] = cur_lr\n",
    "\n",
    "        running_loss = 0.0\n",
    "        for i, data in enumerate(trainloader, 0):\n",
    "            # get the inputs\n",
    "            inputs, labels = data\n",
    "\n",
    "            if args.gpu:\n",
    "                inputs = inputs.cuda()\n",
    "                labels = labels.cuda()\n",
    "\n",
    "            # wrap them in Variable\n",
    "            inputs, labels = Variable(inputs), Variable(labels)\n",
    "\n",
    "            # zero the parameter gradients\n",
    "            optimizer.zero_grad()\n",
    "\n",
    "            # forward + backward + optimize\n",
    "            outputs = net(inputs)\n",
    "            loss = criterion(outputs, labels)\n",
    "            loss.backward()\n",
    "\n",
    "            if epoch > 16:\n",
    "                for group in optimizer.param_groups:\n",
    "                    for p in group['params']:\n",
    "                        state = optimizer.state[p]\n",
    "                        if state['step'] >= 1024:\n",
    "                            state['step'] = 1000\n",
    "            optimizer.step()\n",
    "\n",
    "\n",
    "            # print statistics\n",
    "            if i % 100 == 0:\n",
    "                print(i,loss.data)\n",
    "            running_loss += loss.data\n",
    "\n",
    "        # Normalizing the loss by the total number of train batches\n",
    "        running_loss /= len(trainloader)\n",
    "\n",
    "        # Calculate training/test set accuracy of the existing model\n",
    "        test_loss, test_accuracy = validation(net, testloader, criterion)\n",
    "        train_loss, train_accuracy = validation(net, trainloader, criterion)\n",
    "\n",
    "        print(\"Iteration: {0} | Loss: {1} |\".format(epoch+1, running_loss),\n",
    "              \"Train,Test accuracy: {0}.3f%, {1}.3f%\".format(train_accuracy/len(trainloader), test_accuracy/len(testloader)) )\n",
    "\n",
    "        train_accuracy_qXsquare2_woBN[lr_idx][epoch] = (train_accuracy/len(trainloader))\n",
    "        train_loss_qXsquare2_woBN[lr_idx][epoch] = (train_loss)\n",
    "\n",
    "        test_accuracy_qXsquare2_woBN[lr_idx][epoch] = (test_accuracy/len(testloader))\n",
    "        test_loss_qXsquare2_woBN[lr_idx][epoch] = (test_loss)\n",
    "\n",
    "        # Specify a path\n",
    "#         PATH = \"./save_models/CIFAR10_VGG11_woBN_xsq2_E200_iter\"+str(epoch)+\"_v1.pt\"\n",
    "#         torch.save(net.state_dict(), PATH)\n",
    "\n",
    "    # save model\n",
    "#     if epoch % 50 == 0:\n",
    "#         print('==> Saving model ...')\n",
    "#         state = {\n",
    "#             'net': net.module if opt.is_gpu else net,\n",
    "#             'epoch': epoch,\n",
    "#         }\n",
    "#         if not os.path.isdir('checkpoint'):\n",
    "#             os.mkdir('checkpoint')\n",
    "#         torch.save(state, '../checkpoint/ckpt.t7')\n",
    "\n",
    "print('==> Finished Training ...')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.6"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
