{
  "cells": [
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "J5BFismMgGPM"
      },
      "source": [
        "# Preamble"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "!apt update && apt install -y --no-install-recommends libopencv-dev libturbojpeg-dev\n",
        "# !pip install cupy-cuda11x\n",
        "!pip install mosaicml ffcv numba opencv-python"
      ],
      "metadata": {
        "id": "9fkslf722SZt",
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "outputId": "647f385d-380a-49ff-aaa4-fd9e4a3c86c3"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "\u001b[33m\r0% [Working]\u001b[0m\r            \rGet:1 https://cloud.r-project.org/bin/linux/ubuntu focal-cran40/ InRelease [3,622 B]\n",
            "Hit:2 https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2004/x86_64  InRelease\n",
            "Get:3 http://security.ubuntu.com/ubuntu focal-security InRelease [114 kB]\n",
            "Hit:4 http://ppa.launchpad.net/c2d4u.team/c2d4u4.0+/ubuntu focal InRelease\n",
            "Hit:5 http://archive.ubuntu.com/ubuntu focal InRelease\n",
            "Get:6 http://archive.ubuntu.com/ubuntu focal-updates InRelease [114 kB]\n",
            "Hit:7 http://ppa.launchpad.net/cran/libgit2/ubuntu focal InRelease\n",
            "Get:8 http://security.ubuntu.com/ubuntu focal-security/universe amd64 Packages [1,051 kB]\n",
            "Get:9 http://ppa.launchpad.net/deadsnakes/ppa/ubuntu focal InRelease [18.1 kB]\n",
            "Get:10 http://archive.ubuntu.com/ubuntu focal-backports InRelease [108 kB]\n",
            "Hit:11 http://ppa.launchpad.net/graphics-drivers/ppa/ubuntu focal InRelease\n",
            "Get:12 http://archive.ubuntu.com/ubuntu focal-updates/main amd64 Packages [3,202 kB]\n",
            "Hit:13 http://ppa.launchpad.net/ubuntugis/ppa/ubuntu focal InRelease\n",
            "Get:14 http://ppa.launchpad.net/deadsnakes/ppa/ubuntu focal/main amd64 Packages [29.5 kB]\n",
            "Get:15 http://archive.ubuntu.com/ubuntu focal-updates/universe amd64 Packages [1,345 kB]\n",
            "Get:16 http://archive.ubuntu.com/ubuntu focal-backports/main amd64 Packages [55.2 kB]\n",
            "Get:17 http://archive.ubuntu.com/ubuntu focal-backports/universe amd64 Packages [28.6 kB]\n",
            "Get:18 http://security.ubuntu.com/ubuntu focal-security/restricted amd64 Packages [2,270 kB]\n",
            "Get:19 http://security.ubuntu.com/ubuntu focal-security/main amd64 Packages [2,726 kB]\n",
            "Fetched 11.1 MB in 17s (656 kB/s)\n",
            "Reading package lists... Done\n",
            "Building dependency tree       \n",
            "Reading state information... Done\n",
            "39 packages can be upgraded. Run 'apt list --upgradable' to see them.\n",
            "Reading package lists... Done\n",
            "Building dependency tree       \n",
            "Reading state information... Done\n",
            "Note, selecting 'libturbojpeg0-dev' instead of 'libturbojpeg-dev'\n",
            "libopencv-dev is already the newest version (4.2.0+dfsg-5+focal2).\n",
            "The following NEW packages will be installed:\n",
            "  libturbojpeg0-dev\n",
            "0 upgraded, 1 newly installed, 0 to remove and 39 not upgraded.\n",
            "Need to get 179 kB of archives.\n",
            "After this operation, 997 kB of additional disk space will be used.\n",
            "Get:1 http://archive.ubuntu.com/ubuntu focal-updates/universe amd64 libturbojpeg0-dev amd64 2.0.3-0ubuntu1.20.04.3 [179 kB]\n",
            "Fetched 179 kB in 1s (135 kB/s)\n",
            "Selecting previously unselected package libturbojpeg0-dev:amd64.\n",
            "(Reading database ... 122532 files and directories currently installed.)\n",
            "Preparing to unpack .../libturbojpeg0-dev_2.0.3-0ubuntu1.20.04.3_amd64.deb ...\n",
            "Unpacking libturbojpeg0-dev:amd64 (2.0.3-0ubuntu1.20.04.3) ...\n",
            "Setting up libturbojpeg0-dev:amd64 (2.0.3-0ubuntu1.20.04.3) ...\n",
            "Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n",
            "Collecting mosaicml\n",
            "  Downloading mosaicml-0.14.1-py3-none-any.whl (565 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m565.9/565.9 kB\u001b[0m \u001b[31m9.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
            "\u001b[?25hCollecting ffcv\n",
            "  Downloading ffcv-1.0.2.tar.gz (2.6 MB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m2.6/2.6 MB\u001b[0m \u001b[31m52.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
            "\u001b[?25h  Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
            "Requirement already satisfied: numba in /usr/local/lib/python3.10/dist-packages (0.56.4)\n",
            "Requirement already satisfied: opencv-python in /usr/local/lib/python3.10/dist-packages (4.7.0.72)\n",
            "Requirement already satisfied: pyyaml<7,>=6.0 in /usr/local/lib/python3.10/dist-packages (from mosaicml) (6.0)\n",
            "Requirement already satisfied: tqdm<5,>=4.62.3 in /usr/local/lib/python3.10/dist-packages (from mosaicml) (4.65.0)\n",
            "Collecting torchmetrics<0.11.4,>=0.10.0 (from mosaicml)\n",
            "  Downloading torchmetrics-0.11.3-py3-none-any.whl (518 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m518.6/518.6 kB\u001b[0m \u001b[31m37.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
            "\u001b[?25hCollecting torch-optimizer<0.4,>=0.3.0 (from mosaicml)\n",
            "  Downloading torch_optimizer-0.3.0-py3-none-any.whl (61 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m61.9/61.9 kB\u001b[0m \u001b[31m7.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
            "\u001b[?25hRequirement already satisfied: torchvision<0.16,>=0.11.0 in /usr/local/lib/python3.10/dist-packages (from mosaicml) (0.15.2+cu118)\n",
            "Requirement already satisfied: torch<2.1,>=1.10.0 in /usr/local/lib/python3.10/dist-packages (from mosaicml) (2.0.1+cu118)\n",
            "Requirement already satisfied: requests<3,>=2.26.0 in /usr/local/lib/python3.10/dist-packages (from mosaicml) (2.27.1)\n",
            "Requirement already satisfied: numpy<1.25.0,>=1.21.5 in /usr/local/lib/python3.10/dist-packages (from mosaicml) (1.22.4)\n",
            "Requirement already satisfied: psutil<6,>=5.8.0 in /usr/local/lib/python3.10/dist-packages (from mosaicml) (5.9.5)\n",
            "Collecting coolname<3,>=1.1.0 (from mosaicml)\n",
            "  Downloading coolname-2.2.0-py2.py3-none-any.whl (37 kB)\n",
            "Collecting tabulate==0.9.0 (from mosaicml)\n",
            "  Downloading tabulate-0.9.0-py3-none-any.whl (35 kB)\n",
            "Requirement already satisfied: py-cpuinfo<10,>=8.0.0 in /usr/local/lib/python3.10/dist-packages (from mosaicml) (9.0.0)\n",
            "Collecting packaging<23,>=21.3.0 (from mosaicml)\n",
            "  Downloading packaging-22.0-py3-none-any.whl (42 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m42.6/42.6 kB\u001b[0m \u001b[31m5.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
            "\u001b[?25hCollecting importlib-metadata<7,>=5.0.0 (from mosaicml)\n",
            "  Downloading importlib_metadata-6.6.0-py3-none-any.whl (22 kB)\n",
            "Collecting terminaltables (from ffcv)\n",
            "  Downloading terminaltables-3.1.10-py2.py3-none-any.whl (15 kB)\n",
            "Collecting pytorch_pfn_extras (from ffcv)\n",
            "  Downloading pytorch-pfn-extras-0.6.7.tar.gz (163 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m163.8/163.8 kB\u001b[0m \u001b[31m20.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
            "\u001b[?25h  Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n",
            "  Getting requirements to build wheel ... \u001b[?25l\u001b[?25hdone\n",
            "  Preparing metadata (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n",
            "Collecting fastargs (from ffcv)\n",
            "  Downloading fastargs-1.2.0.tar.gz (12 kB)\n",
            "  Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
            "Collecting assertpy (from ffcv)\n",
            "  Downloading assertpy-1.1.tar.gz (25 kB)\n",
            "  Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
            "Requirement already satisfied: llvmlite<0.40,>=0.39.0dev0 in /usr/local/lib/python3.10/dist-packages (from numba) (0.39.1)\n",
            "Requirement already satisfied: setuptools in /usr/local/lib/python3.10/dist-packages (from numba) (67.7.2)\n",
            "Requirement already satisfied: zipp>=0.5 in /usr/local/lib/python3.10/dist-packages (from importlib-metadata<7,>=5.0.0->mosaicml) (3.15.0)\n",
            "Requirement already satisfied: urllib3<1.27,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests<3,>=2.26.0->mosaicml) (1.26.15)\n",
            "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests<3,>=2.26.0->mosaicml) (2022.12.7)\n",
            "Requirement already satisfied: charset-normalizer~=2.0.0 in /usr/local/lib/python3.10/dist-packages (from requests<3,>=2.26.0->mosaicml) (2.0.12)\n",
            "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests<3,>=2.26.0->mosaicml) (3.4)\n",
            "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from torch<2.1,>=1.10.0->mosaicml) (3.12.0)\n",
            "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.10/dist-packages (from torch<2.1,>=1.10.0->mosaicml) (4.5.0)\n",
            "Requirement already satisfied: sympy in /usr/local/lib/python3.10/dist-packages (from torch<2.1,>=1.10.0->mosaicml) (1.11.1)\n",
            "Requirement already satisfied: networkx in /usr/local/lib/python3.10/dist-packages (from torch<2.1,>=1.10.0->mosaicml) (3.1)\n",
            "Requirement already satisfied: jinja2 in /usr/local/lib/python3.10/dist-packages (from torch<2.1,>=1.10.0->mosaicml) (3.1.2)\n",
            "Requirement already satisfied: triton==2.0.0 in /usr/local/lib/python3.10/dist-packages (from torch<2.1,>=1.10.0->mosaicml) (2.0.0)\n",
            "Requirement already satisfied: cmake in /usr/local/lib/python3.10/dist-packages (from triton==2.0.0->torch<2.1,>=1.10.0->mosaicml) (3.25.2)\n",
            "Requirement already satisfied: lit in /usr/local/lib/python3.10/dist-packages (from triton==2.0.0->torch<2.1,>=1.10.0->mosaicml) (16.0.5)\n",
            "Collecting pytorch-ranger>=0.1.1 (from torch-optimizer<0.4,>=0.3.0->mosaicml)\n",
            "  Downloading pytorch_ranger-0.1.1-py3-none-any.whl (14 kB)\n",
            "Requirement already satisfied: pillow!=8.3.*,>=5.3.0 in /usr/local/lib/python3.10/dist-packages (from torchvision<0.16,>=0.11.0->mosaicml) (8.4.0)\n",
            "Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.10/dist-packages (from jinja2->torch<2.1,>=1.10.0->mosaicml) (2.1.2)\n",
            "Requirement already satisfied: mpmath>=0.19 in /usr/local/lib/python3.10/dist-packages (from sympy->torch<2.1,>=1.10.0->mosaicml) (1.3.0)\n",
            "Building wheels for collected packages: ffcv, assertpy, fastargs, pytorch_pfn_extras\n",
            "  Building wheel for ffcv (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
            "  Created wheel for ffcv: filename=ffcv-1.0.2-cp310-cp310-linux_x86_64.whl size=249762 sha256=bfac92843a3f38b74dca007a3c0817a748a29c90142853eadedeb5ddfe20743c\n",
            "  Stored in directory: /root/.cache/pip/wheels/2c/bb/f2/0077860cc45e301b01d29fde8b307adc22e8df497f0649cbb5\n",
            "  Building wheel for assertpy (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
            "  Created wheel for assertpy: filename=assertpy-1.1-py3-none-any.whl size=42897 sha256=5d6623db902e43f5ba5affd1e59ad895cdce5229a0543ed7ffd23d77a00d196c\n",
            "  Stored in directory: /root/.cache/pip/wheels/af/56/e7/175b60f695bb1520ccdcc66a6d0dbdbf124f6e14cad04703c9\n",
            "  Building wheel for fastargs (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
            "  Created wheel for fastargs: filename=fastargs-1.2.0-py3-none-any.whl size=10920 sha256=cc7ce865294c184cebeab71b8037c155139b707fbf71a7bc44bb2bdba158bfdb\n",
            "  Stored in directory: /root/.cache/pip/wheels/f1/3d/33/d0d781228841ce1f794e71d29715f2a91beb8e49159620992b\n",
            "  Building wheel for pytorch_pfn_extras (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n",
            "  Created wheel for pytorch_pfn_extras: filename=pytorch_pfn_extras-0.6.7-py3-none-any.whl size=191237 sha256=c8899ed9f7d7b09ba36f3cc69b687a493f100371fe156cbf3cb9ca6529a20589\n",
            "  Stored in directory: /root/.cache/pip/wheels/3c/da/ab/4c121b54bf37ab1f5bc4e43d500c5788bf787e5508dba74ba4\n",
            "Successfully built ffcv assertpy fastargs pytorch_pfn_extras\n",
            "Installing collected packages: fastargs, coolname, assertpy, terminaltables, tabulate, packaging, importlib-metadata, pytorch-ranger, torchmetrics, torch-optimizer, pytorch_pfn_extras, mosaicml, ffcv\n",
            "  Attempting uninstall: tabulate\n",
            "    Found existing installation: tabulate 0.8.10\n",
            "    Uninstalling tabulate-0.8.10:\n",
            "      Successfully uninstalled tabulate-0.8.10\n",
            "  Attempting uninstall: packaging\n",
            "    Found existing installation: packaging 23.1\n",
            "    Uninstalling packaging-23.1:\n",
            "      Successfully uninstalled packaging-23.1\n",
            "Successfully installed assertpy-1.1 coolname-2.2.0 fastargs-1.2.0 ffcv-1.0.2 importlib-metadata-6.6.0 mosaicml-0.14.1 packaging-22.0 pytorch-ranger-0.1.1 pytorch_pfn_extras-0.6.7 tabulate-0.9.0 terminaltables-3.1.10 torch-optimizer-0.3.0 torchmetrics-0.11.3\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "sUXLtA27scwa"
      },
      "outputs": [],
      "source": [
        "from __future__ import print_function\n",
        "import torch\n",
        "import torch.nn as nn\n",
        "import torch.nn.functional as F\n",
        "import torch.optim as optim\n",
        "from torchvision import datasets, transforms, models\n",
        "from torch.optim.lr_scheduler import StepLR\n",
        "from tqdm import tqdm\n",
        "from torch.utils.data import DataLoader, Dataset, Subset\n",
        "import random\n",
        "import matplotlib.pyplot as plt\n",
        "import numpy as np\n",
        "import math\n",
        "from collections import OrderedDict\n",
        "import tensorflow as tf\n",
        "from PIL import Image\n",
        "import os\n",
        "import itertools\n",
        "from typing import List\n",
        "from torch.cuda.amp import GradScaler, autocast"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "from ffcv.fields import IntField, RGBImageField\n",
        "from ffcv.fields.decoders import IntDecoder, SimpleRGBImageDecoder\n",
        "from ffcv.loader import Loader, OrderOption\n",
        "from ffcv.pipeline.operation import Operation\n",
        "from ffcv.transforms import RandomHorizontalFlip, Cutout, \\\n",
        "    RandomTranslate, Convert, ToDevice, ToTensor, ToTorchImage\n",
        "from ffcv.transforms.common import Squeeze\n",
        "from ffcv.writer import DatasetWriter\n",
        "import gc"
      ],
      "metadata": {
        "id": "n3nxy5RcGbRQ"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "from ffcv.transforms import ToTensor, ToDevice, Squeeze, NormalizeImage, \\\n",
        "    RandomHorizontalFlip, ToTorchImage\n",
        "from ffcv.fields.rgb_image import CenterCropRGBImageDecoder, \\\n",
        "    RandomResizedCropRGBImageDecoder\n",
        "from ffcv.fields.basics import IntDecoder\n",
        "from pathlib import Path"
      ],
      "metadata": {
        "id": "oD903y2lprnk"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "hlHrV6qggaS_"
      },
      "outputs": [],
      "source": [
        "def to_chunks(it, size):\n",
        "  size = int(math.ceil(size))\n",
        "  it = iter(it)\n",
        "  return iter(lambda: tuple(itertools.islice(it, size)), ())"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "device = torch.device(\"cuda\")\n",
        "torch.manual_seed(318946379189643)"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "qp6Pb0oFYMKA",
        "outputId": "1bbc4689-de57-4049-97ba-84882dc69102"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "execute_result",
          "data": {
            "text/plain": [
              "<torch._C.Generator at 0x7fef6c116470>"
            ]
          },
          "metadata": {},
          "execution_count": 6
        }
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "5gQ2Kn887PlA"
      },
      "source": [
        "# Plotting"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "def plot_error_bars(xs, yss, linestyle, color, label):\n",
        "  means = np.array([np.mean(ys) for ys in yss])\n",
        "  high = np.array([np.quantile(ys, 0.9) for ys in yss])\n",
        "  low = np.array([np.quantile(ys, 0.1) for ys in yss])\n",
        "  # errs_train = [100 - np.mean(x['train']) for x in samples2acc.values()]\n",
        "  plt.errorbar(xs, means, [np.maximum(means - low, 0), np.maximum(high - means, 0)], linestyle=linestyle, color=color, capsize=5, label=label)"
      ],
      "metadata": {
        "id": "1alfTeKbqlJD"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "def plot_ratio(stats, *, ylim, root, emp_by_pred, n_points, line_name, dim_f):\n",
        "  plt.title(f\"Ratio of empirical to predicted error difference\")\n",
        "  # plt.title(f\"Ratio of empirical to predicted error to predicted error for {n_classes} classes\")\n",
        "  plt.xscale('log')\n",
        "  plt.xlabel('n_samples')\n",
        "  plt.ylim([0, ylim])\n",
        "  plt.ylabel('Ratio')\n",
        "  ax = plt.gca()\n",
        "  for key, samples2acc in stats.items():\n",
        "    samples = list(samples2acc.keys())\n",
        "    err_dif = [np.array(x['train']) - np.array(x['test']) for x in samples2acc.values()]\n",
        "    # err_dif = [test_accs[dim] - np.array(v['test']) for k, v in samples2acc.items()]\n",
        "    dim = dim_f(key)\n",
        "    def predicted_error(x):\n",
        "      if root:\n",
        "        return 100 * math.sqrt(n_points * dim / x)\n",
        "      else:\n",
        "        return 100 * n_points * dim / x\n",
        "    predicted = np.array([predicted_error(x) for x in samples]).reshape(-1, 1)\n",
        "    color = next(ax._get_lines.prop_cycler)['color']\n",
        "    arr = [x / y if emp_by_pred else y / x for x, y in zip(err_dif, predicted)]\n",
        "    plot_error_bars(samples, arr, linestyle=\"-\", color=color, label=f'{line_name}={key}')\n",
        "  plt.legend()\n",
        "  plt.show()"
      ],
      "metadata": {
        "id": "gej3RbUeWziZ"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "gN7JYgVggb3i"
      },
      "source": [
        "# Datasets"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "9qi58TQOL_OB"
      },
      "outputs": [],
      "source": [
        "def get_labels(dataset):\n",
        "  return torch.tensor(dataset.targets).tolist()\n",
        "  # return [label for (_, label) in dataset]"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "cifar10_datasets = {\n",
        "    'train': datasets.CIFAR10('/tmp', train=True, download=True),\n",
        "    'test': datasets.CIFAR10('/tmp', train=False, download=True)\n",
        "}\n",
        "\n",
        "for (name, ds) in cifar10_datasets.items():\n",
        "    writer = DatasetWriter(f'/tmp/cifar_{name}.beton', {\n",
        "        'image': RGBImageField(),\n",
        "        'label': IntField()\n",
        "    })\n",
        "    writer.from_indexed_dataset(ds)"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "EqI4yLSoGwkg",
        "outputId": "34345e37-5e0e-4cf8-8164-e1b5931bbf6a"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /tmp/cifar-10-python.tar.gz\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "100%|██████████| 170498071/170498071 [00:10<00:00, 15858674.79it/s]\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Extracting /tmp/cifar-10-python.tar.gz to /tmp\n",
            "Files already downloaded and verified\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "100%|██████████| 50000/50000 [00:03<00:00, 15806.89it/s]\n",
            "100%|██████████| 10000/10000 [00:01<00:00, 8908.22it/s]\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "def generate_until(gen_f, pred):\n",
        "  while True:\n",
        "    res = gen_f()\n",
        "    if pred(res):\n",
        "      return res"
      ],
      "metadata": {
        "id": "6DvFCXExHqxV"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "def gen_order(*, labels, label_map, n_samples, n_negatives):\n",
        "    n_points = len(labels)\n",
        "    order = []\n",
        "    for _ in range(n_samples):\n",
        "      a = random.randrange(n_points)\n",
        "      label = labels[a]\n",
        "      order.append(a)\n",
        "      order.append(generate_until(\n",
        "          lambda: random.choice(label_map[label]),\n",
        "          lambda p: p != a\n",
        "          )\n",
        "      )\n",
        "      for _ in range(n_negatives):\n",
        "        order.append(generate_until(\n",
        "            lambda: random.randrange(n_points),\n",
        "            lambda n: labels[n] != label\n",
        "            )\n",
        "        )\n",
        "    return order\n",
        "\n",
        "\n",
        "def contrastive_dataloader(dataset_path, labels, *, n_samples, n_negatives, batch_size):\n",
        "    label_map = {}\n",
        "    for i, label in enumerate(labels):\n",
        "      label_map.setdefault(label, []).append(i)\n",
        "      # assert init_dataset[i][1] == label, (init_dataset[i][1], label)\n",
        "\n",
        "    order = gen_order(labels=labels, label_map=label_map, n_samples=n_samples, n_negatives=n_negatives)\n",
        "\n",
        "    CIFAR_MEAN = [125.307, 122.961, 113.8575]\n",
        "    CIFAR_STD = [51.5865, 50.847, 51.255]\n",
        "    loaders = {}\n",
        "\n",
        "    label_pipeline: List[Operation] = [IntDecoder(), ToTensor(), ToDevice(torch.device('cuda:0')), Squeeze()]\n",
        "    image_pipeline: List[Operation] = [SimpleRGBImageDecoder()]\n",
        "\n",
        "    # if name == 'train':\n",
        "    #     image_pipeline.extend([\n",
        "    #         RandomHorizontalFlip(),\n",
        "    #         RandomTranslate(padding=2, fill=tuple(map(int, CIFAR_MEAN))),\n",
        "    #         Cutout(4, tuple(map(int, CIFAR_MEAN))),\n",
        "    #     ])\n",
        "\n",
        "    image_pipeline.extend([\n",
        "        ToTensor(),\n",
        "        ToDevice(torch.device('cuda:0'), non_blocking=True),\n",
        "        ToTorchImage(),\n",
        "        Convert(torch.float16),\n",
        "        transforms.Normalize(CIFAR_MEAN, CIFAR_STD),\n",
        "    ])\n",
        "\n",
        "    ordering = OrderOption.SEQUENTIAL\n",
        "    batch_size = batch_size - batch_size % (n_negatives + 2)\n",
        "\n",
        "    return Loader(dataset_path,\n",
        "                  batch_size=batch_size,\n",
        "                  num_workers=2,\n",
        "                  order=OrderOption.SEQUENTIAL,\n",
        "                  indices=order,\n",
        "                  os_cache=True,\n",
        "                  drop_last=False,\n",
        "                  pipelines={'image': image_pipeline, 'label': label_pipeline})"
      ],
      "metadata": {
        "id": "fu2_iqN3IuH9"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "def get_outputs(model, batch):\n",
        "  return model(batch[0].to(device))"
      ],
      "metadata": {
        "id": "LgMLX2CZQ4oR"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "logsoftmax = nn.LogSoftmax(1)"
      ],
      "metadata": {
        "id": "DUyOPuVD9Ro2"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "def contrastive_loss_acc(outputs, n_negatives):\n",
        "  assert outputs.shape[0] % (n_negatives + 2) == 0\n",
        "  # print(outputs.shape[0] / (n_negatives + 2))\n",
        "  tuples_sep = outputs.reshape([outputs.shape[0] // (n_negatives + 2), n_negatives + 2] + list(outputs.shape[1:]))\n",
        "  anchor = tuples_sep[:, :1]\n",
        "  candidates = tuples_sep[:, 1:]\n",
        "  inner_products = (anchor * candidates).sum(dim=-1)\n",
        "  # print(anchor.shape, candidates.shape, inner_products.shape)\n",
        "  softmax = logsoftmax(inner_products)\n",
        "  loss = torch.mean(-softmax[:, 0])\n",
        "  acc = torch.mean((softmax.argmax(dim=1) == 0).float())\n",
        "  return loss, acc"
      ],
      "metadata": {
        "id": "u1Xkje5l6fgr"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "markdown",
      "source": [
        "# Train/Test"
      ],
      "metadata": {
        "id": "bU5Wl-fZK9wF"
      }
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "-rWuAR-zxMDy"
      },
      "outputs": [],
      "source": [
        "def train(model, train_loader, scaler, optimizer, epoch, n_vals, loss_acc_f):\n",
        "  model.train()\n",
        "  n_batches = len(train_loader)\n",
        "  # progress_bar = tqdm(train_loader, position=0, leave=True, miniters=10)\n",
        "  losses = []\n",
        "  # for batch in progress_bar:\n",
        "\n",
        "  for batch in train_loader:\n",
        "    optimizer.zero_grad()\n",
        "    with autocast():\n",
        "      outputs = get_outputs(model, batch)\n",
        "    n_vals -= outputs.shape[0]\n",
        "    if n_vals < 0:\n",
        "      outputs = outputs[:n_vals]\n",
        "    loss, _ = loss_acc_f(outputs)\n",
        "    losses.append(loss.detach().item())\n",
        "    scaler.scale(loss).backward()\n",
        "    scaler.step(optimizer)\n",
        "    scaler.update()\n",
        "    if n_vals < 0:\n",
        "      break\n",
        "    # progress_bar.set_description(f'Train Epoch: {epoch} [{len(losses)}/{n_batches} ({100. * len(losses) / n_batches:.0f}%)]\\tLoss: {np.mean(losses):.6f}', refresh=False)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "ZXEy_RxcxRxe"
      },
      "outputs": [],
      "source": [
        "def test(model, test_loader, msg, n_vals, loss_acc_f):\n",
        "  model.eval()\n",
        "  test_loss = []\n",
        "  correct = []\n",
        "  with torch.no_grad():\n",
        "    for batch in test_loader:\n",
        "      with autocast():\n",
        "        outputs = get_outputs(model, batch)\n",
        "      n_vals -= outputs.shape[0]\n",
        "      if n_vals < 0:\n",
        "        outputs = outputs[:n_vals]\n",
        "      loss, acc = loss_acc_f(outputs)\n",
        "      test_loss.append(loss.detach().item())\n",
        "      correct.append(acc.detach().item())\n",
        "      if n_vals < 0:\n",
        "        break\n",
        "\n",
        "  print(f'{msg} Average loss: {np.mean(test_loss):.4f}, Accuracy: {100. * np.mean(correct):.2f}%)')\n",
        "  return 100 * np.mean(correct)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "8lBmUSdcdsK-"
      },
      "outputs": [],
      "source": [
        "def class_label_list_to_sets(assignment, n_classes):\n",
        "  res = [[] for _ in range(n_classes)]\n",
        "  for i, c in enumerate(assignment):\n",
        "    res[c].append(i)\n",
        "  return res"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "jDA-mxSiZsqq"
      },
      "outputs": [],
      "source": [
        "def subsample(dataset, indices, max_class):\n",
        "  sample_indices = list(itertools.chain(*indices[:max_class]))\n",
        "  labels = []\n",
        "  for c, lst in enumerate(indices[:max_class]):\n",
        "    labels += [c] * len(lst)\n",
        "  return Subset(dataset, sample_indices), labels"
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "# Sampling from different classes"
      ],
      "metadata": {
        "id": "zn1Gb_r_hFFO"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "def get_embedding_dataloader(dataset_path, batch_size, mean, std):\n",
        "    loaders = {}\n",
        "\n",
        "    label_pipeline: List[Operation] = [IntDecoder(), ToTensor(), ToDevice(torch.device('cuda:0')), Squeeze()]\n",
        "    image_pipeline: List[Operation] = [SimpleRGBImageDecoder()]\n",
        "\n",
        "    image_pipeline.extend([\n",
        "        ToTensor(),\n",
        "        ToDevice(torch.device('cuda:0'), non_blocking=True),\n",
        "        ToTorchImage(),\n",
        "        Convert(torch.float16),\n",
        "        transforms.Normalize(mean, std),\n",
        "    ])\n",
        "\n",
        "    ordering = OrderOption.SEQUENTIAL\n",
        "\n",
        "    return Loader(dataset_path,\n",
        "                  batch_size=batch_size,\n",
        "                  num_workers=2,\n",
        "                  order=OrderOption.SEQUENTIAL,\n",
        "                  drop_last=False,\n",
        "                  pipelines={'image': image_pipeline, 'label': label_pipeline})\n",
        "\n",
        "def getembeddings(dataset_path, mean, std):\n",
        "  model = models.resnet18(weights=models.ResNet18_Weights.IMAGENET1K_V1).to(device)\n",
        "  model.fc = nn.Identity()\n",
        "  model.eval()\n",
        "  res = []\n",
        "  train_loader = get_embedding_dataloader(dataset_path, batch_size=1000)\n",
        "  with torch.no_grad():\n",
        "    for batch in train_loader:\n",
        "        with autocast():\n",
        "          res.append(get_outputs(model, batch).detach().cpu())\n",
        "  return torch.cat(res).float()"
      ],
      "metadata": {
        "id": "x7TZ87SlhGV1"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "def gen_order_with_ground_truth(embeddings, *, n_samples, n_negatives):\n",
        "    order = []\n",
        "    n_points = embeddings.shape[0]\n",
        "    for _ in range(n_samples):\n",
        "      cur = random.sample(range(n_points), k=n_negatives + 2)\n",
        "      a, *candidates = cur\n",
        "      a_emb = embeddings[a]\n",
        "      similarities = a_emb @ embeddings[candidates].T\n",
        "      best = torch.argmax(similarities)\n",
        "      candidates[0], candidates[best] = candidates[best], candidates[0]\n",
        "      order += [a] + candidates\n",
        "    return order\n",
        "\n",
        "\n",
        "def contrastive_dataloader_with_ground_truth(dataset_path, embeddings, *, n_samples, n_negatives, batch_size):\n",
        "    label_map = {}\n",
        "    n_points = embeddings.shape[0]\n",
        "\n",
        "    order = gen_order_with_ground_truth(embeddings, n_samples=n_samples, n_negatives=n_negatives)\n",
        "\n",
        "    CIFAR_MEAN = [125.307, 122.961, 113.8575]\n",
        "    CIFAR_STD = [51.5865, 50.847, 51.255]\n",
        "    loaders = {}\n",
        "\n",
        "    label_pipeline: List[Operation] = [IntDecoder(), ToTensor(), ToDevice(torch.device('cuda:0')), Squeeze()]\n",
        "    image_pipeline: List[Operation] = [SimpleRGBImageDecoder()]\n",
        "\n",
        "    image_pipeline.extend([\n",
        "        ToTensor(),\n",
        "        ToDevice(torch.device('cuda:0'), non_blocking=True),\n",
        "        ToTorchImage(),\n",
        "        Convert(torch.float16),\n",
        "        transforms.Normalize(CIFAR_MEAN, CIFAR_STD),\n",
        "    ])\n",
        "\n",
        "    ordering = OrderOption.SEQUENTIAL\n",
        "    batch_size = batch_size - batch_size % (n_negatives + 2)\n",
        "\n",
        "    return Loader(dataset_path,\n",
        "                  batch_size=batch_size,\n",
        "                  num_workers=2,\n",
        "                  order=OrderOption.SEQUENTIAL,\n",
        "                  indices=order,\n",
        "                  drop_last=False,\n",
        "                  pipelines={'image': image_pipeline, 'label': label_pipeline})"
      ],
      "metadata": {
        "id": "3arjK9br1gOz"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "markdown",
      "source": [
        "# Code"
      ],
      "metadata": {
        "id": "13us12ZrZXvk"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "code = \\\n",
        "\"\"\"\n",
        "from __future__ import print_function\n",
        "import torch\n",
        "import torch.nn as nn\n",
        "import torch.nn.functional as F\n",
        "import torch.optim as optim\n",
        "from torchvision import datasets, transforms, models\n",
        "from torch.optim.lr_scheduler import StepLR\n",
        "from tqdm import tqdm\n",
        "from torch.utils.data import DataLoader, Dataset, Subset\n",
        "import random\n",
        "import matplotlib.pyplot as plt\n",
        "import numpy as np\n",
        "import math\n",
        "from collections import OrderedDict\n",
        "import tensorflow as tf\n",
        "from PIL import Image\n",
        "import os\n",
        "import itertools\n",
        "from typing import List\n",
        "from torch.cuda.amp import GradScaler, autocast\n",
        "\n",
        "from ffcv.fields import IntField, RGBImageField\n",
        "from ffcv.fields.decoders import IntDecoder, SimpleRGBImageDecoder\n",
        "from ffcv.loader import Loader, OrderOption\n",
        "from ffcv.pipeline.operation import Operation\n",
        "from ffcv.transforms import RandomHorizontalFlip, Cutout, \\\n",
        "    RandomTranslate, Convert, ToDevice, ToTensor, ToTorchImage\n",
        "from ffcv.transforms.common import Squeeze\n",
        "from ffcv.writer import DatasetWriter\n",
        "import gc\n",
        "import sys\n",
        "\n",
        "n_runs, n_points, n_negatives, dim, n_samples = [int(x) for x in sys.argv[1:]]\n",
        "print(f\"Runs: {n_runs} Points: {n_points} Negatives: {n_negatives} Dim: {dim} Samples: {n_samples}\")\n",
        "\n",
        "device = torch.device(\"cuda\")\n",
        "torch.manual_seed(318946379189643)\n",
        "\n",
        "\n",
        "\n",
        "def get_labels(dataset):\n",
        "  return torch.tensor(dataset.targets).tolist()\n",
        "  # return [label for (_, label) in dataset]\n",
        "\n",
        "\n",
        "def generate_until(gen_f, pred):\n",
        "  while True:\n",
        "    res = gen_f()\n",
        "    if pred(res):\n",
        "      return res\n",
        "\n",
        "\n",
        "def gen_order(*, labels, allowed_indices, n_samples, n_negatives):\n",
        "    n_points = len(labels)\n",
        "    order = []\n",
        "    for _ in range(n_samples):\n",
        "      a = random.choice(allowed_indices)\n",
        "      label = labels[a]\n",
        "      order.append(a)\n",
        "      order.append(generate_until(\n",
        "          lambda: random.choice(allowed_indices),\n",
        "          lambda p: p != a and labels[p] == labels[a]\n",
        "          )\n",
        "      )\n",
        "      for _ in range(n_negatives):\n",
        "        order.append(generate_until(\n",
        "            lambda: random.choice(allowed_indices),\n",
        "            lambda n: labels[n] != label\n",
        "            )\n",
        "        )\n",
        "    return order\n",
        "\n",
        "\n",
        "def contrastive_dataloader(dataset_path, labels, *, allowed_indices, n_samples, n_negatives, batch_size):\n",
        "    order = gen_order(labels=labels, allowed_indices=allowed_indices, n_samples=n_samples, n_negatives=n_negatives)\n",
        "\n",
        "    CIFAR_MEAN = [125.307, 122.961, 113.8575]\n",
        "    CIFAR_STD = [51.5865, 50.847, 51.255]\n",
        "    loaders = {}\n",
        "\n",
        "    label_pipeline: List[Operation] = [IntDecoder(), ToTensor(), ToDevice(torch.device('cuda:0')), Squeeze()]\n",
        "    image_pipeline: List[Operation] = [SimpleRGBImageDecoder()]\n",
        "\n",
        "    # if name == 'train':\n",
        "    #     image_pipeline.extend([\n",
        "    #         RandomHorizontalFlip(),\n",
        "    #         RandomTranslate(padding=2, fill=tuple(map(int, CIFAR_MEAN))),\n",
        "    #         Cutout(4, tuple(map(int, CIFAR_MEAN))),\n",
        "    #     ])\n",
        "\n",
        "    image_pipeline.extend([\n",
        "        ToTensor(),\n",
        "        ToDevice(torch.device('cuda:0'), non_blocking=True),\n",
        "        ToTorchImage(),\n",
        "        Convert(torch.float16),\n",
        "        transforms.Normalize(CIFAR_MEAN, CIFAR_STD),\n",
        "    ])\n",
        "\n",
        "    ordering = OrderOption.SEQUENTIAL\n",
        "    batch_size = batch_size - batch_size % (n_negatives + 2)\n",
        "\n",
        "    return Loader(dataset_path,\n",
        "                  batch_size=batch_size,\n",
        "                  num_workers=2,\n",
        "                  order=OrderOption.SEQUENTIAL,\n",
        "                  indices=order,\n",
        "                  os_cache=True,\n",
        "                  drop_last=False,\n",
        "                  pipelines={'image': image_pipeline, 'label': label_pipeline})\n",
        "\n",
        "def get_outputs(model, batch):\n",
        "  return model(batch[0].to(device))\n",
        "\n",
        "\n",
        "logsoftmax = nn.LogSoftmax(1)\n",
        "\n",
        "\n",
        "\n",
        "def contrastive_loss_acc(outputs, n_negatives):\n",
        "  assert outputs.shape[0] % (n_negatives + 2) == 0\n",
        "  # print(outputs.shape[0] / (n_negatives + 2))\n",
        "  tuples_sep = outputs.reshape([outputs.shape[0] // (n_negatives + 2), n_negatives + 2] + list(outputs.shape[1:]))\n",
        "  anchor = tuples_sep[:, :1]\n",
        "  candidates = tuples_sep[:, 1:]\n",
        "  inner_products = (anchor * candidates).sum(dim=-1)\n",
        "  # print(anchor.shape, candidates.shape, inner_products.shape)\n",
        "  softmax = logsoftmax(inner_products)\n",
        "  loss = torch.mean(-softmax[:, 0])\n",
        "  acc = torch.mean((softmax.argmax(dim=1) == 0).float())\n",
        "  return loss, acc\n",
        "\n",
        "\n",
        "def train(model, train_loader, scaler, optimizer, epoch, n_vals, loss_acc_f):\n",
        "  model.train()\n",
        "  n_batches = len(train_loader)\n",
        "  # progress_bar = tqdm(train_loader, position=0, leave=True, miniters=10)\n",
        "  losses = []\n",
        "  # for batch in progress_bar:\n",
        "\n",
        "  for i, batch in enumerate(train_loader):\n",
        "    optimizer.zero_grad()\n",
        "    with autocast():\n",
        "      outputs = get_outputs(model, batch)\n",
        "    n_vals -= outputs.shape[0]\n",
        "    if n_vals < 0:\n",
        "      outputs = outputs[:n_vals]\n",
        "    loss, _ = loss_acc_f(outputs)\n",
        "    losses.append(loss.detach().item())\n",
        "    scaler.scale(loss).backward()\n",
        "    scaler.step(optimizer)\n",
        "    scaler.update()\n",
        "    if n_vals < 0:\n",
        "      break\n",
        "    # progress_bar.set_description(f'Train Epoch: {epoch} [{len(losses)}/{n_batches} ({100. * len(losses) / n_batches:.0f}%)]\\tLoss: {np.mean(losses):.6f}', refresh=False)\n",
        "\n",
        "\n",
        "def test(model, test_loader, msg, n_vals, loss_acc_f):\n",
        "  model.eval()\n",
        "  test_loss = []\n",
        "  correct = []\n",
        "  with torch.no_grad():\n",
        "    for batch in test_loader:\n",
        "      with autocast():\n",
        "        outputs = get_outputs(model, batch)\n",
        "      n_vals -= outputs.shape[0]\n",
        "      if n_vals < 0:\n",
        "        outputs = outputs[:n_vals]\n",
        "      loss, acc = loss_acc_f(outputs)\n",
        "      test_loss.append(loss.detach().item())\n",
        "      correct.append(acc.detach().item())\n",
        "      if n_vals < 0:\n",
        "        break\n",
        "\n",
        "  print(f'{msg} Average loss: {np.mean(test_loss):.4f}, Accuracy: {100. * np.mean(correct):.2f}%)')\n",
        "  return 100 * np.mean(correct)\n",
        "\n",
        "\n",
        "cifar10_train_dataset = datasets.CIFAR10('/tmp', train=True, download=True)\n",
        "cifar10_test_dataset = datasets.CIFAR10('/tmp', train=False)\n",
        "cifar10_train_labels = get_labels(cifar10_train_dataset)\n",
        "cifar10_test_labels = get_labels(cifar10_test_dataset)\n",
        "\n",
        "\n",
        "def every_class_twice(allowed_indices):\n",
        "  cnts = [0] * 10\n",
        "  for x in allowed_indices:\n",
        "    cnts[cifar10_train_labels[x]] += 1\n",
        "  return all(xnt > 1 for cnt in cnts)\n",
        "\n",
        "n_vals = n_samples * (2 + n_negatives)\n",
        "epochs = 100\n",
        "for run in range(n_runs):\n",
        "  init_n_points = len(cifar10_train_labels)\n",
        "  allowed_indices = random.sample(range(init_n_points), k=n_points)\n",
        "# train_loader = train_loaders[n_negatives][run]\n",
        "# test_loader = test_loaders[n_negatives][run]\n",
        "  train_loader = contrastive_dataloader(\"/tmp/cifar_train.beton\", cifar10_train_labels, allowed_indices=allowed_indices, n_samples=n_vals, n_negatives=n_negatives, batch_size=500)\n",
        "  test_loader = contrastive_dataloader(\"/tmp/cifar_train.beton\", cifar10_train_labels, allowed_indices=allowed_indices, n_samples=10000, n_negatives=n_negatives, batch_size=500)\n",
        "  # test_loader = contrastive_dataloader(\"/tmp/cifar_test.beton\", cifar10_test_labels, allowed_indices=allowed_indices, n_samples=10000, n_negatives=n_negatives, batch_size=5000)\n",
        "  model = models.resnet18()\n",
        "  model.fc = nn.Linear(512, dim, bias=False)\n",
        "  model = model.to(device)\n",
        "  optimizer = optim.Adadelta(model.parameters(), lr=0.1)\n",
        "  scheduler = StepLR(optimizer, step_size=0.1, gamma=0.7)\n",
        "\n",
        "  scaler = GradScaler()\n",
        "  for epoch in range(1, epochs + 1):\n",
        "      train(model, train_loader, scaler, optimizer, epoch, n_vals, lambda o: contrastive_loss_acc(o, n_negatives))\n",
        "      scheduler.step()\n",
        "  train_acc = test(model, train_loader, \"Train\", n_vals, lambda o: contrastive_loss_acc(o, n_negatives))\n",
        "  last_test = test(model, test_loader, \"Test\", n_vals, lambda o: contrastive_loss_acc(o, n_negatives))\n",
        "  print(f\"{n_points} {n_negatives} {dim} {n_samples} Train: {train_acc} Test: {last_test}\")\n",
        "  with open(\"res.txt\", \"a\") as fout:\n",
        "    print(f\"{n_points} {n_negatives} {dim} {n_samples} Train: {train_acc} Test: {last_test}\", file=fout)\n",
        "  gc.collect()\n",
        "  print(\"-----------------------------------------------\")\n",
        "\"\"\""
      ],
      "metadata": {
        "id": "3W6LPeswZYs-"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "with open(\"runner.py\", 'w') as fout:\n",
        "  print(code, file=fout)"
      ],
      "metadata": {
        "id": "XvPdRtMSrNmm"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "eJBodVNCVqRj"
      },
      "source": [
        "# CIFAR 10"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "outputId": "6682cca9-5c84-48b6-c656-7d74a2239561",
        "id": "VbJff_U1VqRk"
      },
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Files already downloaded and verified\n"
          ]
        }
      ],
      "source": [
        "cifar10_train_dataset = datasets.CIFAR10('/tmp', train=True, download=True)\n",
        "cifar10_test_dataset = datasets.CIFAR10('/tmp', train=False)\n",
        "cifar10_train_labels = get_labels(cifar10_train_dataset)\n",
        "cifar10_test_labels = get_labels(cifar10_test_dataset)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "CbQIS9acVqRk"
      },
      "outputs": [],
      "source": [
        "cifar10_train_indices = class_label_list_to_sets(cifar10_train_labels, 10)\n",
        "cifar10_test_indices = class_label_list_to_sets(cifar10_test_labels, 10)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 588
        },
        "outputId": "97b4af8a-a408-4fdd-b147-06d05e450ba6",
        "id": "B0-nR0nWVqRk"
      },
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.3648, Accuracy: 77.00%)\n",
            "128 10000 Train: 99.99999413724805 Test: 77.00222730636597\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.6491, Accuracy: 75.25%)\n",
            "128 10000 Train: 99.99999413724805 Test: 75.25295615196228\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.5592, Accuracy: 75.68%)\n",
            "128 10000 Train: 99.99999413724805 Test: 75.68169917379107\n"
          ]
        },
        {
          "output_type": "error",
          "ename": "KeyboardInterrupt",
          "evalue": "ignored",
          "traceback": [
            "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
            "\u001b[0;31mRuntimeError\u001b[0m                              Traceback (most recent call last)",
            "\u001b[0;32m/usr/local/lib/python3.10/dist-packages/ffcv/pipeline/allocation_query.py\u001b[0m in \u001b[0;36mallocate_query\u001b[0;34m(memory_allocation, batch_size, batches_ahead)\u001b[0m\n\u001b[1;32m     28\u001b[0m             \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 29\u001b[0;31m                 \u001b[0mpartial\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mpartial\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mpin_memory\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m     30\u001b[0m             \u001b[0;32mexcept\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
            "\u001b[0;31mRuntimeError\u001b[0m: cannot pin 'torch.cuda.LongTensor' only dense CPU tensors can be pinned",
            "\nDuring handling of the above exception, another exception occurred:\n",
            "\u001b[0;31mKeyboardInterrupt\u001b[0m                         Traceback (most recent call last)",
            "\u001b[0;32m<ipython-input-22-36904a1f2f54>\u001b[0m in \u001b[0;36m<cell line: 4>\u001b[0;34m()\u001b[0m\n\u001b[1;32m     18\u001b[0m       \u001b[0mscaler\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mGradScaler\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     19\u001b[0m       \u001b[0;32mfor\u001b[0m \u001b[0mepoch\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mrange\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mepochs\u001b[0m \u001b[0;34m+\u001b[0m \u001b[0;36m1\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 20\u001b[0;31m           \u001b[0mtrain\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmodel\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtrain_loader\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mscaler\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0moptimizer\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mepoch\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;32mlambda\u001b[0m \u001b[0mo\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mcontrastive_loss_acc\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mo\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mn_negatives\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m     21\u001b[0m           \u001b[0mscheduler\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mstep\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     22\u001b[0m       \u001b[0mtrain_acc\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mtest\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmodel\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtrain_loader\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m\"Train\"\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;32mlambda\u001b[0m \u001b[0mo\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mcontrastive_loss_acc\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mo\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mn_negatives\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
            "\u001b[0;32m<ipython-input-16-c3502dd8afcb>\u001b[0m in \u001b[0;36mtrain\u001b[0;34m(model, train_loader, scaler, optimizer, epoch, loss_acc_f)\u001b[0m\n\u001b[1;32m      5\u001b[0m   \u001b[0mlosses\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      6\u001b[0m   \u001b[0;31m# for batch in progress_bar:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 7\u001b[0;31m   \u001b[0;32mfor\u001b[0m \u001b[0mbatch\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mtrain_loader\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m      8\u001b[0m       \u001b[0moptimizer\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mzero_grad\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      9\u001b[0m       \u001b[0;32mwith\u001b[0m \u001b[0mautocast\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
            "\u001b[0;32m/usr/local/lib/python3.10/dist-packages/ffcv/loader/loader.py\u001b[0m in \u001b[0;36m__iter__\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m    224\u001b[0m             \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgenerate_code\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    225\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 226\u001b[0;31m         \u001b[0;32mreturn\u001b[0m \u001b[0mEpochIterator\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mselected_order\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    227\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    228\u001b[0m     \u001b[0;32mdef\u001b[0m \u001b[0mfilter\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mfield_name\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0mstr\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcondition\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mCallable\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mAny\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mbool\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m->\u001b[0m \u001b[0;34m'Loader'\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
            "\u001b[0;32m/usr/local/lib/python3.10/dist-packages/ffcv/loader/epoch_iterator.py\u001b[0m in \u001b[0;36m__init__\u001b[0;34m(self, loader, order)\u001b[0m\n\u001b[1;32m     63\u001b[0m                              for _ in range(self.loader.batches_ahead + 2)]\n\u001b[1;32m     64\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 65\u001b[0;31m         self.memory_allocations = self.loader.graph.allocate_memory(\n\u001b[0m\u001b[1;32m     66\u001b[0m             \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mloader\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbatch_size\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     67\u001b[0m             \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mloader\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbatches_ahead\u001b[0m \u001b[0;34m+\u001b[0m \u001b[0;36m2\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
            "\u001b[0;32m/usr/local/lib/python3.10/dist-packages/ffcv/pipeline/graph.py\u001b[0m in \u001b[0;36mallocate_memory\u001b[0;34m(self, batch_size, batches_ahead)\u001b[0m\n\u001b[1;32m    364\u001b[0m                 \u001b[0mallocated_buffer\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    365\u001b[0m                 \u001b[0;32mif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmemory_allocation\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mAllocationQuery\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 366\u001b[0;31m                     allocated_buffer = allocate_query(memory_allocation,\n\u001b[0m\u001b[1;32m    367\u001b[0m                                                                 \u001b[0mbatch_size\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    368\u001b[0m                                                                 batches_ahead)\n",
            "\u001b[0;32m/usr/local/lib/python3.10/dist-packages/ffcv/pipeline/allocation_query.py\u001b[0m in \u001b[0;36mallocate_query\u001b[0;34m(memory_allocation, batch_size, batches_ahead)\u001b[0m\n\u001b[1;32m     27\u001b[0m                               device=memory_allocation.device)\n\u001b[1;32m     28\u001b[0m             \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 29\u001b[0;31m                 \u001b[0mpartial\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mpartial\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mpin_memory\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m     30\u001b[0m             \u001b[0;32mexcept\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     31\u001b[0m                 \u001b[0;32mpass\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
            "\u001b[0;31mKeyboardInterrupt\u001b[0m: "
          ]
        }
      ],
      "source": [
        "n_runs = 10\n",
        "stats = {}\n",
        "n_negatives = 1\n",
        "for dim in [128, 256,512, 1024]:\n",
        "  stats[dim] = {}\n",
        "  test_loader = contrastive_dataloader(\"/tmp/cifar_test.beton\", cifar10_test_labels, n_samples=10000, n_negatives=n_negatives, batch_size=5000)\n",
        "  for n_samples, epochs in [(2, 100), (10, 100), (100, 100), (1000, 100), (10000, 100)]: # , (100000, 7)\n",
        "  # for n_samples, epochs in [(10000, 100)]: # , (100000, 7)\n",
        "    stats[dim][n_samples] = {'train': [], 'test': []}\n",
        "    for _ in range(n_runs):\n",
        "      train_loader = contrastive_dataloader(\"/tmp/cifar_train.beton\", cifar10_train_labels, n_samples=n_samples, n_negatives=n_negatives, batch_size=500)\n",
        "      model = models.resnet18()\n",
        "      model.fc = nn.Linear(512, dim, bias=False)\n",
        "      model = model.to(device)\n",
        "      optimizer = optim.Adadelta(model.parameters(), lr=0.1)\n",
        "      scheduler = StepLR(optimizer, step_size=0.1, gamma=0.7)\n",
        "\n",
        "      scaler = GradScaler()\n",
        "      for epoch in range(1, epochs + 1):\n",
        "          train(model, train_loader, scaler, optimizer, epoch, lambda o: contrastive_loss_acc(o, n_negatives))\n",
        "          scheduler.step()\n",
        "      train_acc = test(model, train_loader, \"Train\", lambda o: contrastive_loss_acc(o, n_negatives))\n",
        "      last_test = test(model, test_loader, \"Test\", lambda o: contrastive_loss_acc(o, n_negatives))\n",
        "      print(f\"{dim} {n_samples} Train: {train_acc} Test: {last_test}\")\n",
        "      stats[dim][n_samples]['train'].append(train_acc)\n",
        "      stats[dim][n_samples]['test'].append(last_test)\n",
        "    print(\"-----------------------------------------------\")\n",
        "print(stats)"
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "# CIFAR10 - sampling from different classes"
      ],
      "metadata": {
        "id": "Hzc01xYEjKsd"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "CIFAR_MEAN = [125.307, 122.961, 113.8575]\n",
        "CIFAR_STD = [51.5865, 50.847, 51.255]\n",
        "cifar10_train_embeddings = getembeddings(\"/tmp/cifar_train.beton\", CIFAR_MEAN, CIFAR_STD)\n",
        "cifar10_test_embeddings = getembeddings(\"/tmp/cifar_test.beton\", CIFAR_MEAN, CIFAR_STD)"
      ],
      "metadata": {
        "id": "WCn2IPPrg3Cl"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "cifar10_train_embeddings.shape, cifar10_test_embeddings.shape"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "PiGWS0KcjWLE",
        "outputId": "78a99698-2115-4499-c13f-a1c4e5ff84ab"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "execute_result",
          "data": {
            "text/plain": [
              "(torch.Size([50000, 512]), torch.Size([10000, 512]))"
            ]
          },
          "metadata": {},
          "execution_count": 22
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "stats = {}\n",
        "def run():\n",
        "  n_runs = 2\n",
        "  n_negatives = 1\n",
        "  for dim in [128, 256,512, 1024]:\n",
        "    stats[dim] = {}\n",
        "    test_loader = contrastive_dataloader_with_ground_truth(\"/tmp/cifar_test.beton\", cifar10_test_embeddings, n_samples=10000, n_negatives=n_negatives, batch_size=5000)\n",
        "    for n_samples, epochs in [(2, 100), (10, 100), (100, 100), (1000, 100), (10000, 100)]: # , (100000, 7)\n",
        "    # for n_samples, epochs in [(10000, 100)]: # , (100000, 7)\n",
        "      stats[dim][n_samples] = {'train': [], 'test': []}\n",
        "      for _ in range(n_runs):\n",
        "        train_loader = contrastive_dataloader_with_ground_truth(\"/tmp/cifar_train.beton\", cifar10_train_embeddings, n_samples=n_samples, n_negatives=n_negatives, batch_size=500)\n",
        "        model = models.resnet18()\n",
        "        model.fc = nn.Linear(512, dim, bias=False)\n",
        "        model = model.to(device)\n",
        "        optimizer = optim.Adadelta(model.parameters(), lr=0.1)\n",
        "        scheduler = StepLR(optimizer, step_size=0.1, gamma=0.7)\n",
        "\n",
        "        scaler = GradScaler()\n",
        "        for epoch in range(1, epochs + 1):\n",
        "            train(model, train_loader, scaler, optimizer, epoch, lambda o: contrastive_loss_acc(o, n_negatives))\n",
        "            scheduler.step()\n",
        "        train_acc = test(model, train_loader, \"Train\", lambda o: contrastive_loss_acc(o, n_negatives))\n",
        "        last_test = test(model, test_loader, \"Test\", lambda o: contrastive_loss_acc(o, n_negatives))\n",
        "        print(f\"{dim} {n_samples} Train: {train_acc} Test: {last_test}\")\n",
        "        stats[dim][n_samples]['train'].append(train_acc)\n",
        "        stats[dim][n_samples]['test'].append(last_test)\n",
        "      print(\"-----------------------------------------------\")\n",
        "\n",
        "run()\n",
        "print(stats)"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "kvgnfDU5lVAp",
        "outputId": "348e08a9-4676-477d-a34f-4f1450272b5a"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 14.5054, Accuracy: 53.04%)\n",
            "128 2 Train: 100.0 Test: 53.035498516900205\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 11.8435, Accuracy: 55.60%)\n",
            "128 2 Train: 100.0 Test: 55.60366894517627\n",
            "-----------------------------------------------\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.1887, Accuracy: 56.62%)\n",
            "128 10 Train: 100.0 Test: 56.61550079073224\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.4840, Accuracy: 49.14%)\n",
            "128 10 Train: 100.0 Test: 49.138225827898296\n",
            "-----------------------------------------------\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.0436, Accuracy: 56.56%)\n",
            "128 100 Train: 100.0 Test: 56.555477210453574\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.3206, Accuracy: 49.70%)\n",
            "128 100 Train: 100.0 Test: 49.69559056418283\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Test Average loss: 1.9582, Accuracy: 58.97%)\n",
            "128 1000 Train: 99.99999489103045 Test: 58.973587410790586\n",
            "Train Average loss: 0.0010, Accuracy: 100.00%)\n",
            "Test Average loss: 2.9911, Accuracy: 47.86%)\n",
            "128 1000 Train: 99.99999489103045 Test: 47.86485859325954\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0364, Accuracy: 99.01%)\n",
            "Test Average loss: 5.1642, Accuracy: 60.29%)\n",
            "128 10000 Train: 99.01243956362616 Test: 60.2898291179112\n",
            "Train Average loss: 0.0068, Accuracy: 99.82%)\n",
            "Test Average loss: 3.1707, Accuracy: 67.96%)\n",
            "128 10000 Train: 99.82223461885921 Test: 67.95575192996434\n",
            "-----------------------------------------------\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 28.1828, Accuracy: 52.12%)\n",
            "256 2 Train: 100.0 Test: 52.11798889296395\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 13.3330, Accuracy: 52.26%)\n",
            "256 2 Train: 100.0 Test: 52.25518601281303\n",
            "-----------------------------------------------\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.3563, Accuracy: 59.95%)\n",
            "256 10 Train: 100.0 Test: 59.94683418955121\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.5002, Accuracy: 60.41%)\n",
            "256 10 Train: 100.0 Test: 60.409876278468545\n",
            "-----------------------------------------------\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.2084, Accuracy: 54.16%)\n",
            "256 100 Train: 100.0 Test: 54.15880509785244\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.0692, Accuracy: 52.37%)\n",
            "256 100 Train: 100.0 Test: 52.36666032246181\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.3085, Accuracy: 96.08%)\n",
            "Test Average loss: 3.8064, Accuracy: 58.23%)\n",
            "256 1000 Train: 96.08433246612549 Test: 58.2275756767818\n",
            "Train Average loss: 0.0013, Accuracy: 99.91%)\n",
            "Test Average loss: 4.2740, Accuracy: 54.51%)\n",
            "256 1000 Train: 99.91393685340881 Test: 54.5103737286159\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0396, Accuracy: 99.08%)\n",
            "Test Average loss: 4.0787, Accuracy: 66.34%)\n",
            "256 10000 Train: 99.08156834664892 Test: 66.33510504450116\n",
            "Train Average loss: 0.0003, Accuracy: 99.99%)\n",
            "Test Average loss: 4.2930, Accuracy: 64.53%)\n",
            "256 10000 Train: 99.9901186247341 Test: 64.53009588377816\n",
            "-----------------------------------------------\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 33.0939, Accuracy: 51.19%)\n",
            "512 2 Train: 100.0 Test: 51.19190386363438\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 59.0191, Accuracy: 53.30%)\n",
            "512 2 Train: 100.0 Test: 53.30131905419486\n",
            "-----------------------------------------------\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n"
          ]
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "# Better memory"
      ],
      "metadata": {
        "id": "4MhbR2q0IZNS"
      }
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "outputId": "cb25540c-4223-4b51-9ebc-32b40bd657aa",
        "id": "1x2b043mIexJ"
      },
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Files already downloaded and verified\n"
          ]
        }
      ],
      "source": [
        "cifar10_train_dataset = datasets.CIFAR10('/tmp', train=True, download=True)\n",
        "cifar10_test_dataset = datasets.CIFAR10('/tmp', train=False)\n",
        "cifar10_train_labels = get_labels(cifar10_train_dataset)\n",
        "cifar10_test_labels = get_labels(cifar10_test_dataset)"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "all_negatives = [1, 2, 4, 8]"
      ],
      "metadata": {
        "id": "VsXm8kzdKfqE"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "# train_loaders = {n_negatives: [contrastive_dataloader(\"/tmp/cifar_train.beton\", cifar10_train_labels, n_samples=10000, n_negatives=n_negatives, batch_size=500)\n",
        "#                                for _ in range(10)]\n",
        "#                  for n_negatives in all_negatives}"
      ],
      "metadata": {
        "id": "FJ31SovJIjDi"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "# test_loaders = {n_negatives: [contrastive_dataloader(\"/tmp/cifar_test.beton\", cifar10_test_labels, n_samples=10000, n_negatives=n_negatives, batch_size=5000)\n",
        "#                                for _ in range(10)]\n",
        "#                  for n_negatives in all_negatives}"
      ],
      "metadata": {
        "id": "CroeCtLzPsun"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 693
        },
        "outputId": "77375cf6-95f3-4014-d4bf-5cf246916418",
        "id": "I66SIpexIexP"
      },
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.5044, Accuracy: 71.71%)\n",
            "128 10000 Train: 99.99999413724805 Test: 71.70725294521877\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.7397, Accuracy: 76.15%)\n",
            "128 10000 Train: 99.99999413724805 Test: 76.15331666810172\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.4191, Accuracy: 65.46%)\n",
            "128 10000 Train: 99.99999413724805 Test: 65.45618006161281\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.9688, Accuracy: 73.68%)\n",
            "128 10000 Train: 99.99999413724805 Test: 73.67946931294033\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.6445, Accuracy: 73.55%)\n",
            "128 10000 Train: 99.99999413724805 Test: 73.55084759848458\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.8597, Accuracy: 69.47%)\n",
            "128 10000 Train: 99.99999413724805 Test: 69.47350246565682\n"
          ]
        },
        {
          "output_type": "error",
          "ename": "KeyboardInterrupt",
          "evalue": "ignored",
          "traceback": [
            "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
            "\u001b[0;31mKeyboardInterrupt\u001b[0m                         Traceback (most recent call last)",
            "\u001b[0;32m<ipython-input-25-69b3cdc327ca>\u001b[0m in \u001b[0;36m<cell line: 4>\u001b[0;34m()\u001b[0m\n\u001b[1;32m     19\u001b[0m       \u001b[0mscaler\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mGradScaler\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     20\u001b[0m       \u001b[0;32mfor\u001b[0m \u001b[0mepoch\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mrange\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mepochs\u001b[0m \u001b[0;34m+\u001b[0m \u001b[0;36m1\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 21\u001b[0;31m           \u001b[0mtrain\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmodel\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtrain_loader\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mscaler\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0moptimizer\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mepoch\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mn_vals\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;32mlambda\u001b[0m \u001b[0mo\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mcontrastive_loss_acc\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mo\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mn_negatives\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m     22\u001b[0m           \u001b[0mscheduler\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mstep\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     23\u001b[0m       \u001b[0mtrain_acc\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mtest\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmodel\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtrain_loader\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m\"Train\"\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mn_vals\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;32mlambda\u001b[0m \u001b[0mo\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mcontrastive_loss_acc\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mo\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mn_negatives\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
            "\u001b[0;32m<ipython-input-15-1fcabaf5c064>\u001b[0m in \u001b[0;36mtrain\u001b[0;34m(model, train_loader, scaler, optimizer, epoch, n_vals, loss_acc_f)\u001b[0m\n\u001b[1;32m     15\u001b[0m     \u001b[0mloss\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0m_\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mloss_acc_f\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0moutputs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     16\u001b[0m     \u001b[0mlosses\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mappend\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mloss\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mdetach\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitem\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 17\u001b[0;31m     \u001b[0mscaler\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mscale\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mloss\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbackward\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m     18\u001b[0m     \u001b[0mscaler\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mstep\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0moptimizer\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     19\u001b[0m     \u001b[0mscaler\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mupdate\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
            "\u001b[0;32m/usr/local/lib/python3.10/dist-packages/torch/_tensor.py\u001b[0m in \u001b[0;36mbackward\u001b[0;34m(self, gradient, retain_graph, create_graph, inputs)\u001b[0m\n\u001b[1;32m    485\u001b[0m                 \u001b[0minputs\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0minputs\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    486\u001b[0m             )\n\u001b[0;32m--> 487\u001b[0;31m         torch.autograd.backward(\n\u001b[0m\u001b[1;32m    488\u001b[0m             \u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mgradient\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mretain_graph\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcreate_graph\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0minputs\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0minputs\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    489\u001b[0m         )\n",
            "\u001b[0;32m/usr/local/lib/python3.10/dist-packages/torch/autograd/__init__.py\u001b[0m in \u001b[0;36mbackward\u001b[0;34m(tensors, grad_tensors, retain_graph, create_graph, grad_variables, inputs)\u001b[0m\n\u001b[1;32m    198\u001b[0m     \u001b[0;31m# some Python versions print out the first line of a multi-line function\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    199\u001b[0m     \u001b[0;31m# calls in the traceback and some print out the last line\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 200\u001b[0;31m     Variable._execution_engine.run_backward(  # Calls into the C++ engine to run the backward pass\n\u001b[0m\u001b[1;32m    201\u001b[0m         \u001b[0mtensors\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mgrad_tensors_\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mretain_graph\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcreate_graph\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0minputs\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    202\u001b[0m         allow_unreachable=True, accumulate_grad=True)  # Calls into the C++ engine to run the backward pass\n",
            "\u001b[0;31mKeyboardInterrupt\u001b[0m: "
          ]
        }
      ],
      "source": [
        "n_runs = 10\n",
        "stats = {}\n",
        "n_negatives = 1\n",
        "for dim in [128, 256,512, 1024]:\n",
        "  stats[dim] = {}\n",
        "  # for n_samples, epochs in [(2, 100), (10, 100), (100, 100), (1000, 100), (10000, 100)]: # , (100000, 7)\n",
        "  for n_samples, epochs in [(10000, 100), (10000, 100), (10000, 100)]: # , (100000, 7)\n",
        "    stats[dim][n_samples] = {'train': [], 'test': []}\n",
        "    n_vals = n_samples * (2 + n_negatives)\n",
        "    for run in range(n_runs):\n",
        "      # train_loader = train_loaders[n_negatives][run]\n",
        "      # test_loader = test_loaders[n_negatives][run]\n",
        "      train_loader = contrastive_dataloader(\"/tmp/cifar_train.beton\", cifar10_train_labels, n_samples=10000, n_negatives=n_negatives, batch_size=500)\n",
        "      test_loader = contrastive_dataloader(\"/tmp/cifar_test.beton\", cifar10_test_labels, n_samples=10000, n_negatives=n_negatives, batch_size=5000)\n",
        "      model = models.resnet18()\n",
        "      model.fc = nn.Linear(512, dim, bias=False)\n",
        "      model = model.to(device)\n",
        "      optimizer = optim.Adadelta(model.parameters(), lr=0.1)\n",
        "      scheduler = StepLR(optimizer, step_size=0.1, gamma=0.7)\n",
        "\n",
        "      scaler = GradScaler()\n",
        "      for epoch in range(1, epochs + 1):\n",
        "          train(model, train_loader, scaler, optimizer, epoch, n_vals, lambda o: contrastive_loss_acc(o, n_negatives))\n",
        "          scheduler.step()\n",
        "      train_acc = test(model, train_loader, \"Train\", n_vals, lambda o: contrastive_loss_acc(o, n_negatives))\n",
        "      last_test = test(model, test_loader, \"Test\", n_vals, lambda o: contrastive_loss_acc(o, n_negatives))\n",
        "      print(f\"{dim} {n_samples} Train: {train_acc} Test: {last_test}\")\n",
        "      stats[dim][n_samples]['train'].append(train_acc)\n",
        "      stats[dim][n_samples]['test'].append(last_test)\n",
        "      gc.collect()\n",
        "    print(\"-----------------------------------------------\")"
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "# Subsample points"
      ],
      "metadata": {
        "id": "NIH3a5_Bg5qx"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "for n_points in [100, 1000, 10000]:\n",
        "  for dim in [512]:\n",
        "    for n_samples in [2, 10, 100, 1000, 10000]:\n",
        "      !python runner.py 3 {n_points} 1 {dim} {n_samples}\n",
        "      !python runner.py 4 {n_points} 1 {dim} {n_samples}"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "aXuHzeVa6c7Q",
        "outputId": "bb92a0c1-353f-484e-b1e1-852061cd864b"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "2023-05-22 05:23:56.697765: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:23:57.762358: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 2\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0015, Accuracy: 100.00%)\n",
            "100 1 512 2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.0625, Accuracy: 50.00%)\n",
            "100 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "100 1 512 2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:24:59.362510: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:25:00.431190: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 100 Negatives: 1 Dim: 512 Samples: 2\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.2578, Accuracy: 50.00%)\n",
            "100 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 14.9688, Accuracy: 0.00%)\n",
            "100 1 512 2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "100 1 512 2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "100 1 512 2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:26:06.524532: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:26:07.757811: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 10\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 11.3281, Accuracy: 50.00%)\n",
            "100 1 512 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 14.1719, Accuracy: 70.00%)\n",
            "100 1 512 10 Train: 100.0 Test: 69.9999988079071\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.5586, Accuracy: 60.00%)\n",
            "100 1 512 10 Train: 100.0 Test: 60.00000238418579\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:27:01.795006: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:27:03.342577: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 100 Negatives: 1 Dim: 512 Samples: 10\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 15.5781, Accuracy: 50.00%)\n",
            "100 1 512 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 6.6328, Accuracy: 70.00%)\n",
            "100 1 512 10 Train: 100.0 Test: 69.9999988079071\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 9.3516, Accuracy: 50.00%)\n",
            "100 1 512 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 13.0312, Accuracy: 50.00%)\n",
            "100 1 512 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:28:10.949839: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:28:12.010259: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 100\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 9.0312, Accuracy: 64.00%)\n",
            "100 1 512 100 Train: 100.0 Test: 63.999998569488525\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 10.7422, Accuracy: 61.00%)\n",
            "100 1 512 100 Train: 100.0 Test: 61.000001430511475\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 9.9375, Accuracy: 64.00%)\n",
            "100 1 512 100 Train: 100.0 Test: 63.999998569488525\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:29:07.329131: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:29:08.380841: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 100 Negatives: 1 Dim: 512 Samples: 100\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 13.2266, Accuracy: 55.00%)\n",
            "100 1 512 100 Train: 100.0 Test: 55.000001192092896\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 8.4453, Accuracy: 63.00%)\n",
            "100 1 512 100 Train: 100.0 Test: 62.99999952316284\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 13.0469, Accuracy: 68.00%)\n",
            "100 1 512 100 Train: 100.0 Test: 68.00000071525574\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 12.1250, Accuracy: 59.00%)\n",
            "100 1 512 100 Train: 100.0 Test: 58.99999737739563\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:30:16.144485: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:30:17.186477: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.1986, Accuracy: 98.62%)\n",
            "100 1 512 1000 Train: 99.99999489103045 Test: 98.62306118011475\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.1430, Accuracy: 98.54%)\n",
            "100 1 512 1000 Train: 99.99999489103045 Test: 98.53700143950326\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.3026, Accuracy: 97.07%)\n",
            "100 1 512 1000 Train: 99.99999489103045 Test: 97.07400713648114\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:31:45.488274: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:31:46.552141: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 100 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.0075, Accuracy: 94.79%)\n",
            "100 1 512 1000 Train: 99.99999489103045 Test: 94.79345594133649\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 0.3646, Accuracy: 97.76%)\n",
            "100 1 512 1000 Train: 99.99999489103045 Test: 97.76247569492885\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Test Average loss: 0.4646, Accuracy: 97.33%)\n",
            "100 1 512 1000 Train: 99.99999489103045 Test: 97.33218210084098\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.3060, Accuracy: 99.05%)\n",
            "100 1 512 1000 Train: 99.99999489103045 Test: 99.05335307121277\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:33:36.924357: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:33:38.014981: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0010, Accuracy: 99.99%)\n",
            "100 1 512 10000 Train: 99.99999413724805 Test: 99.9901186247341\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0053, Accuracy: 99.99%)\n",
            "100 1 512 10000 Train: 99.99999413724805 Test: 99.9901186247341\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0083, Accuracy: 99.96%)\n",
            "100 1 512 10000 Train: 99.99999413724805 Test: 99.96049198947969\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:39:12.128532: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:39:13.243617: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 100 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0034, Accuracy: 99.99%)\n",
            "100 1 512 10000 Train: 99.99999413724805 Test: 99.9901186247341\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "100 1 512 10000 Train: 99.99999413724805 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0002, Accuracy: 99.99%)\n",
            "Test Average loss: 0.0023, Accuracy: 99.98%)\n",
            "100 1 512 10000 Train: 99.9901186247341 Test: 99.98024311222014\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0053, Accuracy: 99.97%)\n",
            "100 1 512 10000 Train: 99.99999413724805 Test: 99.97036759970618\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:46:42.920178: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:46:44.012831: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 2\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1000 1 512 2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 85.9375, Accuracy: 50.00%)\n",
            "1000 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 17.2500, Accuracy: 0.00%)\n",
            "1000 1 512 2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:47:39.360565: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:47:40.959233: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 512 Samples: 2\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.1748, Accuracy: 50.00%)\n",
            "1000 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 35.8438, Accuracy: 50.00%)\n",
            "1000 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0005, Accuracy: 100.00%)\n",
            "1000 1 512 2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.5977, Accuracy: 50.00%)\n",
            "1000 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:48:49.019851: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:48:50.160462: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 10\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 20.9219, Accuracy: 30.00%)\n",
            "1000 1 512 10 Train: 100.0 Test: 30.000001192092896\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 7.1562, Accuracy: 50.00%)\n",
            "1000 1 512 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 152.3750, Accuracy: 60.00%)\n",
            "1000 1 512 10 Train: 100.0 Test: 60.00000238418579\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:49:45.510317: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:49:46.622236: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 512 Samples: 10\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 9.0859, Accuracy: 50.00%)\n",
            "1000 1 512 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 14.1484, Accuracy: 40.00%)\n",
            "1000 1 512 10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 13.8906, Accuracy: 30.00%)\n",
            "1000 1 512 10 Train: 100.0 Test: 30.000001192092896\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 14.8047, Accuracy: 30.00%)\n",
            "1000 1 512 10 Train: 100.0 Test: 30.000001192092896\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-22 05:50:52.276275: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:50:53.394132: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 100\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 11.4141, Accuracy: 53.00%)\n",
            "1000 1 512 100 Train: 100.0 Test: 52.99999713897705\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 13.8359, Accuracy: 53.00%)\n",
            "1000 1 512 100 Train: 100.0 Test: 52.99999713897705\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 14.4141, Accuracy: 54.00%)\n",
            "1000 1 512 100 Train: 100.0 Test: 53.999996185302734\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:51:48.728184: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:51:49.817243: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 512 Samples: 100\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 10.3750, Accuracy: 51.00%)\n",
            "1000 1 512 100 Train: 100.0 Test: 50.999999046325684\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 8.1250, Accuracy: 54.00%)\n",
            "1000 1 512 100 Train: 100.0 Test: 53.999996185302734\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 9.5547, Accuracy: 57.00%)\n",
            "1000 1 512 100 Train: 100.0 Test: 56.99999928474426\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 7.2656, Accuracy: 59.00%)\n",
            "1000 1 512 100 Train: 100.0 Test: 58.99999737739563\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:52:59.414703: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:53:00.925773: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0006, Accuracy: 100.00%)\n",
            "Test Average loss: 10.7137, Accuracy: 55.12%)\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 55.12048133781978\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 9.1814, Accuracy: 66.91%)\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 66.91049677985055\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Test Average loss: 9.4983, Accuracy: 60.15%)\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 60.154902083533145\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:54:30.801890: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:54:31.896596: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 12.8164, Accuracy: 54.00%)\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 54.00171875953674\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 7.0717, Accuracy: 59.77%)\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 59.76764048848834\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 8.2388, Accuracy: 64.07%)\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 64.07056621142796\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 7.7048, Accuracy: 56.15%)\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 56.15318162100655\n",
            "-----------------------------------------------\n",
            "2023-05-22 05:56:26.807032: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 05:56:27.906893: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0582, Accuracy: 99.66%)\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 99.66422602778576\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0441, Accuracy: 99.88%)\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 99.88148788936803\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.1771, Accuracy: 99.63%)\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 99.63459929481881\n",
            "-----------------------------------------------\n",
            "2023-05-22 06:02:30.253067: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 06:02:31.385208: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0003, Accuracy: 99.99%)\n",
            "Test Average loss: 0.0435, Accuracy: 99.61%)\n",
            "1000 1 512 10000 Train: 99.9901186247341 Test: 99.6148479766533\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.1141, Accuracy: 99.61%)\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 99.61484836750343\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.1404, Accuracy: 99.64%)\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 99.64299377847891\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0400, Accuracy: 99.63%)\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 99.63459968566895\n",
            "-----------------------------------------------\n",
            "2023-05-22 06:10:21.664403: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 06:10:23.333171: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 2\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 10.0547, Accuracy: 50.00%)\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 15.1562, Accuracy: 0.00%)\n",
            "10000 1 512 2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 27.9375, Accuracy: 50.00%)\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-22 06:11:17.972928: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 06:11:19.057756: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 10000 Negatives: 1 Dim: 512 Samples: 2\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 33.5625, Accuracy: 50.00%)\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.9482, Accuracy: 50.00%)\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0046, Accuracy: 100.00%)\n",
            "10000 1 512 2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "10000 1 512 2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "2023-05-22 06:12:28.669963: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 06:12:29.807091: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 10\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 10.8203, Accuracy: 40.00%)\n",
            "10000 1 512 10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 9.8516, Accuracy: 30.00%)\n",
            "10000 1 512 10 Train: 100.0 Test: 30.000001192092896\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 21.2344, Accuracy: 40.00%)\n",
            "10000 1 512 10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-22 06:13:23.531386: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 06:13:24.619160: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 10000 Negatives: 1 Dim: 512 Samples: 10\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 10.3203, Accuracy: 40.00%)\n",
            "10000 1 512 10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 9.2188, Accuracy: 50.00%)\n",
            "10000 1 512 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 8.5938, Accuracy: 50.00%)\n",
            "10000 1 512 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.9121, Accuracy: 60.00%)\n",
            "10000 1 512 10 Train: 100.0 Test: 60.00000238418579\n",
            "-----------------------------------------------\n",
            "2023-05-22 06:14:34.786639: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 06:14:36.098487: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 100\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 10.1562, Accuracy: 54.00%)\n",
            "10000 1 512 100 Train: 100.0 Test: 53.999996185302734\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 10.9219, Accuracy: 54.00%)\n",
            "10000 1 512 100 Train: 100.0 Test: 53.999996185302734\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 11.2578, Accuracy: 50.00%)\n",
            "10000 1 512 100 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-22 06:15:33.095530: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 06:15:34.239608: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 10000 Negatives: 1 Dim: 512 Samples: 100\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 9.6328, Accuracy: 61.00%)\n",
            "10000 1 512 100 Train: 100.0 Test: 61.000001430511475\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 15.2188, Accuracy: 47.00%)\n",
            "10000 1 512 100 Train: 100.0 Test: 46.99999988079071\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 7.7656, Accuracy: 57.00%)\n",
            "10000 1 512 100 Train: 100.0 Test: 56.99999928474426\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 11.7734, Accuracy: 54.00%)\n",
            "10000 1 512 100 Train: 100.0 Test: 53.999996185302734\n",
            "-----------------------------------------------\n",
            "2023-05-22 06:16:46.043964: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 06:16:47.208220: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0026, Accuracy: 99.91%)\n",
            "Test Average loss: 8.4933, Accuracy: 54.13%)\n",
            "10000 1 512 1000 Train: 99.91393685340881 Test: 54.13080709321159\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 7.7455, Accuracy: 56.54%)\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 56.54044491904122\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 8.3717, Accuracy: 54.99%)\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 54.99139172690255\n",
            "-----------------------------------------------\n",
            "2023-05-22 06:18:20.245295: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 06:18:21.373339: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 10000 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 6.5988, Accuracy: 58.18%)\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 58.17555785179138\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Test Average loss: 6.8554, Accuracy: 62.56%)\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 62.56454331534249\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0014, Accuracy: 99.91%)\n",
            "Test Average loss: 13.7860, Accuracy: 63.30%)\n",
            "10000 1 512 1000 Train: 99.91393685340881 Test: 63.29603961535862\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Test Average loss: 9.0379, Accuracy: 56.54%)\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 56.54044662203107\n",
            "-----------------------------------------------\n",
            "2023-05-22 06:20:21.364579: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 06:20:22.508362: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 2.6718, Accuracy: 78.29%)\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 78.29004272085722\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.6163, Accuracy: 78.00%)\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 78.00463867969201\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.9472, Accuracy: 78.43%)\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 78.42830048232781\n",
            "-----------------------------------------------\n",
            "2023-05-22 06:26:27.080724: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-22 06:26:28.214198: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 10000 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Files already downloaded and verified\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "with open(\"res.txt\", \"r\") as fin:\n",
        "  print(fin.read())"
      ],
      "metadata": {
        "id": "u8IBpL6V5F6n"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "for _ in range(3):\n",
        "  for n_points in [100, 1000, 10000]:\n",
        "    for dim in [512]:\n",
        "      for n_samples in [10 ** 5]:\n",
        "        !python runner.py 3 {n_points} 1 {dim} {n_samples}"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "c6NvB7gCuhoj",
        "outputId": "06077f5e-9997-426e-8369-ed18ebfad5b3"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "2023-05-22 15:11:33.693438: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 100000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "2023-05-22 15:57:09.078678: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 100000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1000 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1000 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1000 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "2023-05-22 16:41:52.151643: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 100000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0017, Accuracy: 99.94%)\n",
            "10000 1 512 100000 Train: 99.99999404942021 Test: 99.94074096445178\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0018, Accuracy: 99.95%)\n",
            "10000 1 512 100000 Train: 99.99999404942021 Test: 99.95061657467826\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0132, Accuracy: 99.85%)\n",
            "10000 1 512 100000 Train: 99.99999404942021 Test: 99.85037973669709\n",
            "-----------------------------------------------\n",
            "2023-05-22 17:27:19.200903: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 100000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "2023-05-22 18:10:58.474773: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 100000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1000 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0004, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1000 1 512 100000 Train: 99.9989950340581 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1000 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "2023-05-22 18:54:30.394212: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 100000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: nan, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0154, Accuracy: 99.86%)\n",
            "10000 1 512 100000 Train: 99.99699700333387 Test: 99.86173686434012\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0107, Accuracy: 99.87%)\n",
            "10000 1 512 100000 Train: 99.99999404942021 Test: 99.87013085943754\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0024, Accuracy: 99.93%)\n",
            "10000 1 512 100000 Train: 99.9989950340581 Test: 99.9308654519378\n",
            "-----------------------------------------------\n",
            "2023-05-22 19:37:59.480519: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 100000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "2023-05-22 20:21:34.444928: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 100000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1000 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1000 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1000 1 512 100000 Train: 99.9989950340581 Test: 99.99999413724805\n",
            "-----------------------------------------------\n",
            "2023-05-22 21:04:55.594227: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 100000\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0005, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0479, Accuracy: 99.87%)\n",
            "10000 1 512 100000 Train: 99.99699700333387 Test: 99.87161237685407\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0085, Accuracy: 99.88%)\n",
            "10000 1 512 100000 Train: 99.99999404942021 Test: 99.88148788936803\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0104, Accuracy: 99.93%)\n",
            "10000 1 512 100000 Train: 99.9989950340581 Test: 99.93086554965035\n",
            "-----------------------------------------------\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "with open(\"res.txt\", \"r\") as fin:\n",
        "  print(fin.read())"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "eWB_EEWM5WxB",
        "outputId": "48eabfd4-5220-48cb-fb32-83b08dea6dfe"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "1000 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "1000 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "1000 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "10000 1 512 100000 Train: 99.99999404942021 Test: 99.94074096445178\n",
            "10000 1 512 100000 Train: 99.99999404942021 Test: 99.95061657467826\n",
            "10000 1 512 100000 Train: 99.99999404942021 Test: 99.85037973669709\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "1000 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "1000 1 512 100000 Train: 99.9989950340581 Test: 99.99999413724805\n",
            "1000 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "10000 1 512 100000 Train: 99.99699700333387 Test: 99.86173686434012\n",
            "10000 1 512 100000 Train: 99.99999404942021 Test: 99.87013085943754\n",
            "10000 1 512 100000 Train: 99.9989950340581 Test: 99.9308654519378\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "100 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "1000 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "1000 1 512 100000 Train: 99.99999404942021 Test: 99.99999413724805\n",
            "1000 1 512 100000 Train: 99.9989950340581 Test: 99.99999413724805\n",
            "10000 1 512 100000 Train: 99.99699700333387 Test: 99.87161237685407\n",
            "10000 1 512 100000 Train: 99.99999404942021 Test: 99.88148788936803\n",
            "10000 1 512 100000 Train: 99.9989950340581 Test: 99.93086554965035\n",
            "\n"
          ]
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "# Fast runs"
      ],
      "metadata": {
        "id": "7pJM1JHNqf3S"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "for dim in [128, 256, 512, 1024]:\n",
        "  for n_samples in [100000]:\n",
        "    !python runner.py 3 1 {dim} {n_samples}"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "ZFDEqAhYri5x",
        "outputId": "071872d0-95d2-4702-9c0e-bad22051869d"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "2023-05-21 18:59:28.421140: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.2686, Accuracy: 88.26%)\n",
            "1 128  100000 Train: 99.9989950340581 Test: 88.26101677758354\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.2084, Accuracy: 77.93%)\n",
            "1 128  100000 Train: 99.99799601869599 Test: 77.93259961264474\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0020, Accuracy: 100.00%)\n",
            "Test Average loss: 1.5368, Accuracy: 87.50%)\n",
            "1 128  100000 Train: 99.99699700333387 Test: 87.49785338129315\n",
            "-----------------------------------------------\n",
            "2023-05-21 19:47:42.437466: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.2589, Accuracy: 87.52%)\n",
            "1 256  100000 Train: 99.99599798797178 Test: 87.5150033405849\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0003, Accuracy: 100.00%)\n",
            "Test Average loss: 1.5857, Accuracy: 84.60%)\n",
            "1 256  100000 Train: 99.99699700333387 Test: 84.59526470729283\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0024, Accuracy: 99.94%)\n",
            "Test Average loss: 1.3640, Accuracy: 87.02%)\n",
            "1 256  100000 Train: 99.94205114853322 Test: 87.01766218457904\n",
            "-----------------------------------------------\n",
            "2023-05-21 20:38:33.086968: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: nan, Accuracy: 99.99%)\n",
            "Test Average loss: 1.5350, Accuracy: 87.81%)\n",
            "1 512  100000 Train: 99.99200192652333 Test: 87.80654839106968\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0033, Accuracy: 99.94%)\n",
            "Test Average loss: 2.5504, Accuracy: 84.00%)\n",
            "1 512  100000 Train: 99.94305015401065 Test: 83.99502379553658\n",
            "-----------------------------------------------\n",
            "Train Average loss: nan, Accuracy: 99.96%)\n",
            "Test Average loss: 1.4006, Accuracy: 84.46%)\n",
            "1 512  100000 Train: 99.96402948649961 Test: 84.45806588445392\n",
            "-----------------------------------------------\n",
            "2023-05-21 21:29:02.321798: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: nan, Accuracy: 99.88%)\n",
            "Test Average loss: 1.6551, Accuracy: 84.13%)\n",
            "1 1024  100000 Train: 99.87811402697271 Test: 84.13222261837551\n",
            "-----------------------------------------------\n",
            "Train Average loss: nan, Accuracy: 100.00%)\n",
            "Test Average loss: 1.4001, Accuracy: 88.10%)\n",
            "1 1024  100000 Train: 99.99599798797178 Test: 88.09809344155448\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0115, Accuracy: 99.86%)\n",
            "Test Average loss: 1.8804, Accuracy: 86.97%)\n",
            "1 1024  100000 Train: 99.85713467471437 Test: 86.96621315819877\n",
            "-----------------------------------------------\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "for _ in range(3):\n",
        "  for dim in [128, 256, 512, 1024]:\n",
        "    for n_samples in [10 ** 6]:\n",
        "      !python runner.py 1 1 {dim} {n_samples}"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "I28QC8S3NeF4",
        "outputId": "e5441d0f-2596-4156-929e-c9696bde19da"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "2023-05-21 22:19:04.652570: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0005, Accuracy: 99.99%)\n",
            "Test Average loss: 0.8299, Accuracy: 86.08%)\n",
            "1 128  1000000 Train: 99.99359503524433 Test: 86.078713621412\n",
            "-----------------------------------------------\n",
            "2023-05-22 00:55:51.269460: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0004, Accuracy: 99.99%)\n",
            "Test Average loss: 0.8338, Accuracy: 86.17%)\n",
            "1 256  1000000 Train: 99.99259519181311 Test: 86.17303712027413\n",
            "-----------------------------------------------\n",
            "2023-05-22 03:33:54.445996: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Traceback (most recent call last):\n",
            "  File \"/content/runner.py\", line 203, in <module>\n",
            "    train(model, train_loader, scaler, optimizer, epoch, n_vals, lambda o: contrastive_loss_acc(o, n_negatives))\n",
            "  File \"/content/runner.py\", line 153, in train\n",
            "    scaler.scale(loss).backward()\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/torch/_tensor.py\", line 487, in backward\n",
            "    torch.autograd.backward(\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/torch/autograd/__init__.py\", line 200, in backward\n",
            "    Variable._execution_engine.run_backward(  # Calls into the C++ engine to run the backward pass\n",
            "KeyboardInterrupt\n",
            "^C\n",
            "Traceback (most recent call last):\n",
            "  File \"/content/runner.py\", line 16, in <module>\n",
            "    import tensorflow as tf\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/tensorflow/__init__.py\", line 37, in <module>\n",
            "    from tensorflow.python.tools import module_util as _module_util\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/tensorflow/python/__init__.py\", line 42, in <module>\n",
            "    from tensorflow.python import data\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/tensorflow/python/data/__init__.py\", line 21, in <module>\n",
            "    from tensorflow.python.data import experimental\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/tensorflow/python/data/experimental/__init__.py\", line 97, in <module>\n",
            "    from tensorflow.python.data.experimental import service\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/tensorflow/python/data/experimental/service/__init__.py\", line 419, in <module>\n",
            "    from tensorflow.python.data.experimental.ops.data_service_ops import distribute\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/tensorflow/python/data/experimental/ops/data_service_ops.py\", line 22, in <module>\n",
            "    from tensorflow.python.data.experimental.ops import compression_ops\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/tensorflow/python/data/experimental/ops/compression_ops.py\", line 16, in <module>\n",
            "    from tensorflow.python.data.util import structure\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/tensorflow/python/data/util/structure.py\", line 30, in <module>\n",
            "    from tensorflow.python.ops import resource_variable_ops\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/tensorflow/python/ops/resource_variable_ops.py\", line 41, in <module>\n",
            "    from tensorflow.python.framework import meta_graph\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/tensorflow/python/framework/meta_graph.py\", line 34, in <module>\n",
            "    from tensorflow.python.framework import importer\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/tensorflow/python/framework/importer.py\", line 24, in <module>\n",
            "    from tensorflow.python.framework import function\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/tensorflow/python/framework/function.py\", line 34, in <module>\n",
            "    from tensorflow.python.ops import variable_scope as vs\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/tensorflow/python/ops/variable_scope.py\", line 33, in <module>\n",
            "    from tensorflow.python.ops import init_ops\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/tensorflow/python/ops/init_ops.py\", line 43, in <module>\n",
            "    from tensorflow.python.ops import random_ops\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/tensorflow/python/ops/random_ops.py\", line 25, in <module>\n",
            "    from tensorflow.python.ops import control_flow_ops\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/tensorflow/python/ops/control_flow_ops.py\", line 45, in <module>\n",
            "    from tensorflow.python.ops import tensor_array_ops\n",
            "  File \"<frozen importlib._bootstrap>\", line 1027, in _find_and_load\n",
            "  File \"<frozen importlib._bootstrap>\", line 1006, in _find_and_load_unlocked\n",
            "  File \"<frozen importlib._bootstrap>\", line 688, in _load_unlocked\n",
            "  File \"<frozen importlib._bootstrap_external>\", line 879, in exec_module\n",
            "  File \"<frozen importlib._bootstrap_external>\", line 1012, in get_code\n",
            "  File \"<frozen importlib._bootstrap_external>\", line 672, in _compile_bytecode\n",
            "KeyboardInterrupt\n",
            "^C\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "for dim in [128, 256, 512, 1024]:\n",
        "  for n_samples in [2, 10, 100, 1000, 10000]:\n",
        "    for _ in range(3):\n",
        "      !python runner.py 3 1 {dim} {n_samples}"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "rAVDipI-Sddu",
        "outputId": "78b4684c-4ffc-49e6-942e-6c44c662a78f"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "2023-05-21 08:18:51.011188: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:18:52.218046: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.2773, Accuracy: 0.00%)\n",
            "1 128  2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 8.8672, Accuracy: 50.00%)\n",
            "1 128  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 10.4141, Accuracy: 50.00%)\n",
            "1 128  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "2023-05-21 08:19:45.597208: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:19:46.658536: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.4453, Accuracy: 50.00%)\n",
            "1 128  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.2812, Accuracy: 50.00%)\n",
            "1 128  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.0625, Accuracy: 50.00%)\n",
            "1 128  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 08:20:40.490713: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:20:41.546431: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.1445, Accuracy: 50.00%)\n",
            "1 128  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 7.6680, Accuracy: 50.00%)\n",
            "1 128  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.6250, Accuracy: 50.00%)\n",
            "1 128  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "2023-05-21 08:21:35.571355: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:21:37.124776: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.3770, Accuracy: 30.00%)\n",
            "1 128  10 Train: 100.0 Test: 30.000001192092896\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 7.7930, Accuracy: 30.00%)\n",
            "1 128  10 Train: 100.0 Test: 30.000001192092896\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.7891, Accuracy: 50.00%)\n",
            "1 128  10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "2023-05-21 08:22:32.820490: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:22:33.905501: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.5898, Accuracy: 40.00%)\n",
            "1 128  10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 7.2695, Accuracy: 50.00%)\n",
            "1 128  10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.8984, Accuracy: 60.00%)\n",
            "1 128  10 Train: 100.0 Test: 60.00000238418579\n",
            "-----------------------------------------------\n",
            "2023-05-21 08:23:29.707325: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:23:30.781483: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.0195, Accuracy: 90.00%)\n",
            "1 128  10 Train: 100.0 Test: 90.00000357627869\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.0781, Accuracy: 60.00%)\n",
            "1 128  10 Train: 100.0 Test: 60.00000238418579\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.0273, Accuracy: 60.00%)\n",
            "1 128  10 Train: 100.0 Test: 60.00000238418579\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 08:24:23.713321: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:24:24.807114: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.2188, Accuracy: 48.00%)\n",
            "1 128  100 Train: 100.0 Test: 47.999998927116394\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.4551, Accuracy: 58.00%)\n",
            "1 128  100 Train: 100.0 Test: 57.999998331069946\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.6797, Accuracy: 57.00%)\n",
            "1 128  100 Train: 100.0 Test: 56.99999928474426\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 08:25:17.777252: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:25:18.867225: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.6367, Accuracy: 49.00%)\n",
            "1 128  100 Train: 100.0 Test: 48.99999797344208\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.0527, Accuracy: 54.00%)\n",
            "1 128  100 Train: 100.0 Test: 53.999996185302734\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.5664, Accuracy: 55.00%)\n",
            "1 128  100 Train: 100.0 Test: 55.000001192092896\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 08:26:11.761944: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:26:12.855162: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.3711, Accuracy: 51.00%)\n",
            "1 128  100 Train: 100.0 Test: 50.999999046325684\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.9121, Accuracy: 51.00%)\n",
            "1 128  100 Train: 100.0 Test: 50.999999046325684\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.1758, Accuracy: 67.00%)\n",
            "1 128  100 Train: 100.0 Test: 66.99999570846558\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 08:27:05.907629: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:27:06.987396: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.8711, Accuracy: 55.90%)\n",
            "1 128  1000 Train: 99.99999489103045 Test: 55.900001525878906\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.6836, Accuracy: 57.10%)\n",
            "1 128  1000 Train: 99.99999489103045 Test: 57.10000395774841\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.9883, Accuracy: 57.90%)\n",
            "1 128  1000 Train: 99.99999489103045 Test: 57.90000557899475\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 08:28:32.742816: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:28:34.024242: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.7695, Accuracy: 53.90%)\n",
            "1 128  1000 Train: 99.99999489103045 Test: 53.90000343322754\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.7637, Accuracy: 54.10%)\n",
            "1 128  1000 Train: 99.99999489103045 Test: 54.100000858306885\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.7637, Accuracy: 58.30%)\n",
            "1 128  1000 Train: 99.99999489103045 Test: 58.30000042915344\n",
            "-----------------------------------------------\n",
            "2023-05-21 08:30:02.324411: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:30:03.468145: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.7109, Accuracy: 58.30%)\n",
            "1 128  1000 Train: 99.99999489103045 Test: 58.30000042915344\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.4863, Accuracy: 58.50%)\n",
            "1 128  1000 Train: 99.99999489103045 Test: 58.500003814697266\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.8789, Accuracy: 56.50%)\n",
            "1 128  1000 Train: 99.99999489103045 Test: 56.49999976158142\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 08:31:28.442245: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:31:29.527582: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.6272, Accuracy: 75.54%)\n",
            "1 128  10000 Train: 99.99999413724805 Test: 75.544502053942\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.5296, Accuracy: 69.11%)\n",
            "1 128  10000 Train: 99.99999413724805 Test: 69.11335842950004\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.4355, Accuracy: 72.53%)\n",
            "1 128  10000 Train: 99.99999413724805 Test: 72.53043907029289\n",
            "-----------------------------------------------\n",
            "2023-05-21 08:37:24.837871: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:37:25.987182: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 2.8742, Accuracy: 73.72%)\n",
            "1 128  10000 Train: 99.99999413724805 Test: 73.72234378542218\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.2207, Accuracy: 69.22%)\n",
            "1 128  10000 Train: 99.99999413724805 Test: 69.21625563076564\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.9629, Accuracy: 71.85%)\n",
            "1 128  10000 Train: 99.99999413724805 Test: 71.85302547046116\n",
            "-----------------------------------------------\n",
            "2023-05-21 08:43:24.887931: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:43:25.950800: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0132, Accuracy: 99.63%)\n",
            "Test Average loss: 3.7687, Accuracy: 68.56%)\n",
            "1 128  10000 Train: 99.63459919710628 Test: 68.55599113873073\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.5281, Accuracy: 77.19%)\n",
            "1 128  10000 Train: 99.99999413724805 Test: 77.19087430409023\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0338, Accuracy: 99.25%)\n",
            "Test Average loss: 3.1602, Accuracy: 74.90%)\n",
            "1 128  10000 Train: 99.249452938799 Test: 74.9013866697039\n",
            "-----------------------------------------------\n",
            "2023-05-21 08:49:09.607221: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:49:11.014878: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.1465, Accuracy: 50.00%)\n",
            "1 256  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.5791, Accuracy: 50.00%)\n",
            "1 256  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.8281, Accuracy: 50.00%)\n",
            "1 256  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 08:50:03.468025: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:50:05.057706: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0848, Accuracy: 100.00%)\n",
            "1 256  2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.7070, Accuracy: 50.00%)\n",
            "1 256  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.7344, Accuracy: 50.00%)\n",
            "1 256  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "2023-05-21 08:51:00.847719: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:51:01.948796: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.4492, Accuracy: 0.00%)\n",
            "1 256  2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 20.6250, Accuracy: 50.00%)\n",
            "1 256  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1 256  2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "2023-05-21 08:51:56.786131: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:51:57.851092: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.5488, Accuracy: 50.00%)\n",
            "1 256  10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 6.5547, Accuracy: 40.00%)\n",
            "1 256  10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 10.0781, Accuracy: 30.00%)\n",
            "1 256  10 Train: 100.0 Test: 30.000001192092896\n",
            "-----------------------------------------------\n",
            "2023-05-21 08:52:52.412628: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:52:53.497009: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 6.2969, Accuracy: 70.00%)\n",
            "1 256  10 Train: 100.0 Test: 69.9999988079071\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.9883, Accuracy: 60.00%)\n",
            "1 256  10 Train: 100.0 Test: 60.00000238418579\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.5000, Accuracy: 70.00%)\n",
            "1 256  10 Train: 100.0 Test: 69.9999988079071\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 08:53:45.556763: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:53:46.632780: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 8.5938, Accuracy: 60.00%)\n",
            "1 256  10 Train: 100.0 Test: 60.00000238418579\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.7578, Accuracy: 70.00%)\n",
            "1 256  10 Train: 100.0 Test: 69.9999988079071\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 9.9766, Accuracy: 50.00%)\n",
            "1 256  10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 08:54:38.679496: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:54:39.789682: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 6.2188, Accuracy: 53.00%)\n",
            "1 256  100 Train: 100.0 Test: 52.99999713897705\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.9570, Accuracy: 46.00%)\n",
            "1 256  100 Train: 100.0 Test: 45.99999785423279\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.3984, Accuracy: 58.00%)\n",
            "1 256  100 Train: 100.0 Test: 57.999998331069946\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 08:55:32.805767: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:55:33.897353: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.4336, Accuracy: 54.00%)\n",
            "1 256  100 Train: 100.0 Test: 53.999996185302734\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 9.7266, Accuracy: 42.00%)\n",
            "1 256  100 Train: 100.0 Test: 41.999998688697815\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 7.0508, Accuracy: 48.00%)\n",
            "1 256  100 Train: 100.0 Test: 47.999998927116394\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 08:56:27.025269: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:56:28.126811: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 6.3945, Accuracy: 54.00%)\n",
            "1 256  100 Train: 100.0 Test: 53.999996185302734\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.5742, Accuracy: 60.00%)\n",
            "1 256  100 Train: 100.0 Test: 59.99999642372131\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 7.3906, Accuracy: 54.00%)\n",
            "1 256  100 Train: 100.0 Test: 53.999996185302734\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 08:57:21.980951: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:57:23.041115: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 4.5352, Accuracy: 55.30%)\n",
            "1 256  1000 Train: 99.99999489103045 Test: 55.30000329017639\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.3711, Accuracy: 56.70%)\n",
            "1 256  1000 Train: 99.99999489103045 Test: 56.700003147125244\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.5820, Accuracy: 54.10%)\n",
            "1 256  1000 Train: 99.99999489103045 Test: 54.100000858306885\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 08:58:52.568819: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 08:58:53.654111: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.4961, Accuracy: 54.50%)\n",
            "1 256  1000 Train: 99.99999489103045 Test: 54.500001668930054\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.7188, Accuracy: 54.60%)\n",
            "1 256  1000 Train: 99.99999489103045 Test: 54.60000038146973\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.5625, Accuracy: 55.60%)\n",
            "1 256  1000 Train: 99.99999489103045 Test: 55.60000538825989\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 09:00:17.945059: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:00:19.218195: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.7773, Accuracy: 55.00%)\n",
            "1 256  1000 Train: 99.99999489103045 Test: 55.000001192092896\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.2344, Accuracy: 56.80%)\n",
            "1 256  1000 Train: 99.99999489103045 Test: 56.80000185966492\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.0234, Accuracy: 54.10%)\n",
            "1 256  1000 Train: 99.99999489103045 Test: 54.100000858306885\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:01:46.675809: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:01:47.755278: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0006, Accuracy: 99.99%)\n",
            "Test Average loss: 3.8211, Accuracy: 68.63%)\n",
            "1 256  10000 Train: 99.9901186247341 Test: 68.63316552979606\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.0736, Accuracy: 75.69%)\n",
            "1 256  10000 Train: 99.99999413724805 Test: 75.69027457918439\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.3502, Accuracy: 69.85%)\n",
            "1 256  10000 Train: 99.99999413724805 Test: 69.8507947581155\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:07:29.574594: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:07:30.636362: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.0248, Accuracy: 73.10%)\n",
            "1 256  10000 Train: 99.99999413724805 Test: 73.10495461736407\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 17.4143, Accuracy: 73.53%)\n",
            "1 256  10000 Train: 99.99999413724805 Test: 73.52512223379952\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0130, Accuracy: 99.79%)\n",
            "Test Average loss: 2.8496, Accuracy: 74.79%)\n",
            "1 256  10000 Train: 99.79260808131734 Test: 74.78991406304496\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:13:10.950630: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:13:12.034997: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.6247, Accuracy: 65.39%)\n",
            "1 256  10000 Train: 99.99999413724805 Test: 65.38758192743573\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.8089, Accuracy: 75.93%)\n",
            "1 256  10000 Train: 99.99999413724805 Test: 75.930369751794\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0002, Accuracy: 99.99%)\n",
            "Test Average loss: 3.3008, Accuracy: 72.44%)\n",
            "1 256  10000 Train: 99.9901186247341 Test: 72.43611557143075\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:19:00.757345: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:19:01.867673: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0673, Accuracy: 100.00%)\n",
            "1 512  2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1 512  2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 13.8828, Accuracy: 0.00%)\n",
            "1 512  2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 09:19:54.216296: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:19:55.306211: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.5474, Accuracy: 50.00%)\n",
            "1 512  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1 512  2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1 512  2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 09:20:47.639671: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:20:48.739232: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 16.5000, Accuracy: 0.00%)\n",
            "1 512  2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.2188, Accuracy: 50.00%)\n",
            "1 512  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 30.2500, Accuracy: 0.00%)\n",
            "1 512  2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 09:21:40.968143: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:21:42.069821: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 16.0625, Accuracy: 40.00%)\n",
            "1 512  10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 10.7734, Accuracy: 40.00%)\n",
            "1 512  10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 8.4375, Accuracy: 60.00%)\n",
            "1 512  10 Train: 100.0 Test: 60.00000238418579\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:22:35.736815: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:22:36.831181: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 15.9141, Accuracy: 60.00%)\n",
            "1 512  10 Train: 100.0 Test: 60.00000238418579\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 8.7812, Accuracy: 50.00%)\n",
            "1 512  10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.2051, Accuracy: 90.00%)\n",
            "1 512  10 Train: 100.0 Test: 90.00000357627869\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 09:23:29.722875: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:23:30.830752: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 7.0781, Accuracy: 80.00%)\n",
            "1 512  10 Train: 100.0 Test: 80.0000011920929\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.3672, Accuracy: 70.00%)\n",
            "1 512  10 Train: 100.0 Test: 69.9999988079071\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 23.8281, Accuracy: 30.00%)\n",
            "1 512  10 Train: 100.0 Test: 30.000001192092896\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:24:26.200014: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:24:27.765103: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 10.8594, Accuracy: 53.00%)\n",
            "1 512  100 Train: 100.0 Test: 52.99999713897705\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 9.4922, Accuracy: 58.00%)\n",
            "1 512  100 Train: 100.0 Test: 57.999998331069946\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 13.6484, Accuracy: 58.00%)\n",
            "1 512  100 Train: 100.0 Test: 57.999998331069946\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 09:25:21.660151: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:25:23.333709: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 10.2422, Accuracy: 54.00%)\n",
            "1 512  100 Train: 100.0 Test: 53.999996185302734\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 13.0156, Accuracy: 53.00%)\n",
            "1 512  100 Train: 100.0 Test: 52.99999713897705\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 13.4688, Accuracy: 57.00%)\n",
            "1 512  100 Train: 100.0 Test: 56.99999928474426\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 09:26:18.587690: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:26:19.689723: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 11.1875, Accuracy: 58.00%)\n",
            "1 512  100 Train: 100.0 Test: 57.999998331069946\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 14.6172, Accuracy: 47.00%)\n",
            "1 512  100 Train: 100.0 Test: 46.99999988079071\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 10.3438, Accuracy: 53.00%)\n",
            "1 512  100 Train: 100.0 Test: 52.99999713897705\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:27:15.647751: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:27:16.745953: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 9.0703, Accuracy: 54.00%)\n",
            "1 512  1000 Train: 99.99999489103045 Test: 54.00000214576721\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0003, Accuracy: 100.00%)\n",
            "Test Average loss: 8.3672, Accuracy: 55.60%)\n",
            "1 512  1000 Train: 99.99999489103045 Test: 55.60000538825989\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 7.7930, Accuracy: 58.30%)\n",
            "1 512  1000 Train: 99.99999489103045 Test: 58.30000042915344\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:28:46.039844: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:28:47.142852: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0013, Accuracy: 99.91%)\n",
            "Test Average loss: 8.4453, Accuracy: 57.60%)\n",
            "1 512  1000 Train: 99.91393685340881 Test: 57.600003480911255\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0024, Accuracy: 99.83%)\n",
            "Test Average loss: 8.8672, Accuracy: 56.00%)\n",
            "1 512  1000 Train: 99.82787881578717 Test: 56.00000023841858\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0005, Accuracy: 100.00%)\n",
            "Test Average loss: 8.4609, Accuracy: 54.80%)\n",
            "1 512  1000 Train: 99.99999489103045 Test: 54.80000376701355\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:30:17.092334: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:30:18.194054: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 8.2969, Accuracy: 55.40%)\n",
            "1 512  1000 Train: 99.99999489103045 Test: 55.400002002716064\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 8.9453, Accuracy: 53.60%)\n",
            "1 512  1000 Train: 99.99999489103045 Test: 53.60000133514404\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 8.5938, Accuracy: 58.00%)\n",
            "1 512  1000 Train: 99.99999489103045 Test: 58.000004291534424\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:31:45.506153: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:31:46.940610: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.8446, Accuracy: 73.10%)\n",
            "1 512  10000 Train: 99.99999413724805 Test: 73.09638006346566\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 3.1381, Accuracy: 72.53%)\n",
            "1 512  10000 Train: 99.99999413724805 Test: 72.5304399217878\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.7199, Accuracy: 76.35%)\n",
            "1 512  10000 Train: 99.99999413724805 Test: 76.35053821972438\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:37:30.279735: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:37:31.330167: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0247, Accuracy: 99.52%)\n",
            "Test Average loss: 3.6699, Accuracy: 72.53%)\n",
            "1 512  10000 Train: 99.51609275380119 Test: 72.5304399217878\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.4874, Accuracy: 68.82%)\n",
            "1 512  10000 Train: 99.99999413724805 Test: 68.82181252752032\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0214, Accuracy: 99.59%)\n",
            "Test Average loss: 3.5178, Accuracy: 76.00%)\n",
            "1 512  10000 Train: 99.58522143911142 Test: 75.998968737466\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:43:09.580867: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:43:10.661406: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0178, Accuracy: 99.70%)\n",
            "Test Average loss: 4.1696, Accuracy: 67.60%)\n",
            "1 512  10000 Train: 99.70372807784159 Test: 67.60418329920087\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.4978, Accuracy: 72.29%)\n",
            "1 512  10000 Train: 99.99999413724805 Test: 72.29034304618835\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0008, Accuracy: 99.99%)\n",
            "Test Average loss: 3.7721, Accuracy: 75.68%)\n",
            "1 512  10000 Train: 99.9901186247341 Test: 75.68169917379107\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:48:57.419222: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:48:58.450684: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1 1024  2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 14.3828, Accuracy: 50.00%)\n",
            "1 1024  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 25.0000, Accuracy: 0.00%)\n",
            "1 1024  2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 09:49:50.354346: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:49:51.406679: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 9.6875, Accuracy: 50.00%)\n",
            "1 1024  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 61.7500, Accuracy: 0.00%)\n",
            "1 1024  2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 59.3750, Accuracy: 0.00%)\n",
            "1 1024  2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 09:50:43.461740: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:50:44.560907: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 6.3125, Accuracy: 50.00%)\n",
            "1 1024  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 374.2500, Accuracy: 0.00%)\n",
            "1 1024  2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 13.2500, Accuracy: 50.00%)\n",
            "1 1024  2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:51:38.770188: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:51:39.905325: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 57.5312, Accuracy: 50.00%)\n",
            "1 1024  10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.8984, Accuracy: 80.00%)\n",
            "1 1024  10 Train: 100.0 Test: 80.0000011920929\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 32.8438, Accuracy: 80.00%)\n",
            "1 1024  10 Train: 100.0 Test: 80.0000011920929\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:52:33.896765: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:52:35.519039: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 12.3359, Accuracy: 70.00%)\n",
            "1 1024  10 Train: 100.0 Test: 69.9999988079071\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 23.3906, Accuracy: 50.00%)\n",
            "1 1024  10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 29.5156, Accuracy: 60.00%)\n",
            "1 1024  10 Train: 100.0 Test: 60.00000238418579\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:53:29.067486: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:53:30.175932: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 12.9688, Accuracy: 50.00%)\n",
            "1 1024  10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 28.4219, Accuracy: 30.00%)\n",
            "1 1024  10 Train: 100.0 Test: 30.000001192092896\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 29.9062, Accuracy: 40.00%)\n",
            "1 1024  10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:54:23.938361: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:54:25.013579: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 24.9531, Accuracy: 48.00%)\n",
            "1 1024  100 Train: 100.0 Test: 47.999998927116394\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 20.5469, Accuracy: 51.00%)\n",
            "1 1024  100 Train: 100.0 Test: 50.999999046325684\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 19.7656, Accuracy: 57.00%)\n",
            "1 1024  100 Train: 100.0 Test: 56.99999928474426\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:55:18.889386: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:55:19.944593: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 22.2188, Accuracy: 57.00%)\n",
            "1 1024  100 Train: 100.0 Test: 56.99999928474426\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 19.0000, Accuracy: 56.00%)\n",
            "1 1024  100 Train: 100.0 Test: 56.00000023841858\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 18.9531, Accuracy: 55.00%)\n",
            "1 1024  100 Train: 100.0 Test: 55.000001192092896\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 09:56:11.672889: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:56:12.703968: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 26.6250, Accuracy: 52.00%)\n",
            "1 1024  100 Train: 100.0 Test: 51.99999809265137\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 16.1875, Accuracy: 55.00%)\n",
            "1 1024  100 Train: 100.0 Test: 55.000001192092896\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 15.3203, Accuracy: 56.00%)\n",
            "1 1024  100 Train: 100.0 Test: 56.00000023841858\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 09:57:04.645179: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:57:05.687992: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0066, Accuracy: 99.91%)\n",
            "Test Average loss: 14.3359, Accuracy: 57.10%)\n",
            "1 1024  1000 Train: 99.91393685340881 Test: 57.10000395774841\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0084, Accuracy: 99.74%)\n",
            "Test Average loss: 16.4375, Accuracy: 53.00%)\n",
            "1 1024  1000 Train: 99.74182077816555 Test: 53.00000309944153\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0006, Accuracy: 100.00%)\n",
            "Test Average loss: 16.4531, Accuracy: 55.90%)\n",
            "1 1024  1000 Train: 99.99999489103045 Test: 55.900001525878906\n",
            "-----------------------------------------------\n",
            "2023-05-21 09:58:32.046066: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:58:33.605796: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0006, Accuracy: 100.00%)\n",
            "Test Average loss: 15.3828, Accuracy: 59.30%)\n",
            "1 1024  1000 Train: 99.99999489103045 Test: 59.3000054359436\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0126, Accuracy: 99.74%)\n",
            "Test Average loss: 16.3750, Accuracy: 54.30%)\n",
            "1 1024  1000 Train: 99.74182077816555 Test: 54.30000424385071\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0076, Accuracy: 99.66%)\n",
            "Test Average loss: 15.0078, Accuracy: 56.10%)\n",
            "1 1024  1000 Train: 99.65576188904899 Test: 56.10000491142273\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 09:59:56.842875: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 09:59:57.877280: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0223, Accuracy: 99.66%)\n",
            "Test Average loss: 17.2656, Accuracy: 54.10%)\n",
            "1 1024  1000 Train: 99.65576188904899 Test: 54.100000858306885\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0074, Accuracy: 99.83%)\n",
            "Test Average loss: 15.4922, Accuracy: 57.30%)\n",
            "1 1024  1000 Train: 99.82787796429226 Test: 57.30000138282776\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0051, Accuracy: 99.83%)\n",
            "Test Average loss: 23.8594, Accuracy: 60.50%)\n",
            "1 1024  1000 Train: 99.82787881578717 Test: 60.50000190734863\n",
            "-----------------------------------------------\n",
            "terminate called without an active exception\n",
            "2023-05-21 10:01:21.155870: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 10:01:22.238614: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.6951, Accuracy: 76.02%)\n",
            "1 1024  10000 Train: 99.99999413724805 Test: 76.01611954825265\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0022, Accuracy: 99.94%)\n",
            "Test Average loss: 4.8460, Accuracy: 63.57%)\n",
            "1 1024  10000 Train: 99.9407410621643 Test: 63.56971178736005\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0058, Accuracy: 99.83%)\n",
            "Test Average loss: 5.3438, Accuracy: 64.31%)\n",
            "1 1024  10000 Train: 99.83211013137317 Test: 64.30714981896537\n",
            "-----------------------------------------------\n",
            "2023-05-21 10:06:54.997261: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 10:06:56.037551: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0018, Accuracy: 99.98%)\n",
            "Test Average loss: 4.1647, Accuracy: 72.49%)\n",
            "1 1024  10000 Train: 99.98024311222014 Test: 72.48756459781102\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.4523, Accuracy: 72.55%)\n",
            "1 1024  10000 Train: 99.99999413724805 Test: 72.54758902958461\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0046, Accuracy: 99.86%)\n",
            "Test Average loss: 3.7028, Accuracy: 71.44%)\n",
            "1 1024  10000 Train: 99.86173696205263 Test: 71.44143155642918\n",
            "-----------------------------------------------\n",
            "2023-05-21 10:12:34.547439: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-21 10:12:35.577162: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Files already downloaded and verified\n",
            "Train Average loss: 0.0010, Accuracy: 99.98%)\n",
            "Test Average loss: 4.8683, Accuracy: 69.17%)\n",
            "1 1024  10000 Train: 99.98024311222014 Test: 69.17338030678886\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0165, Accuracy: 99.60%)\n",
            "Test Average loss: 4.1560, Accuracy: 70.90%)\n",
            "1 1024  10000 Train: 99.60497246413934 Test: 70.90121507644653\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 3.9392, Accuracy: 72.43%)\n",
            "1 1024  10000 Train: 99.99999413724805 Test: 72.42754016603742\n",
            "-----------------------------------------------\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "with open(\"res.txt\", \"r\") as fin:\n",
        "  print(fin.read())"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "5V-revpZYfle",
        "outputId": "1b49ef9e-9550-4319-da34-3543a81079cc"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "1 128  2 Train: 100.0 Test: 0.0\n",
            "1 128  2 Train: 100.0 Test: 50.0\n",
            "1 128  2 Train: 100.0 Test: 50.0\n",
            "1 128  2 Train: 100.0 Test: 50.0\n",
            "1 128  2 Train: 100.0 Test: 50.0\n",
            "1 128  2 Train: 100.0 Test: 50.0\n",
            "1 128  2 Train: 100.0 Test: 50.0\n",
            "1 128  2 Train: 100.0 Test: 50.0\n",
            "1 128  2 Train: 100.0 Test: 50.0\n",
            "1 128  10 Train: 100.0 Test: 30.000001192092896\n",
            "1 128  10 Train: 100.0 Test: 30.000001192092896\n",
            "1 128  10 Train: 100.0 Test: 50.0\n",
            "1 128  10 Train: 100.0 Test: 40.00000059604645\n",
            "1 128  10 Train: 100.0 Test: 50.0\n",
            "1 128  10 Train: 100.0 Test: 60.00000238418579\n",
            "1 128  10 Train: 100.0 Test: 90.00000357627869\n",
            "1 128  10 Train: 100.0 Test: 60.00000238418579\n",
            "1 128  10 Train: 100.0 Test: 60.00000238418579\n",
            "1 128  100 Train: 100.0 Test: 47.999998927116394\n",
            "1 128  100 Train: 100.0 Test: 57.999998331069946\n",
            "1 128  100 Train: 100.0 Test: 56.99999928474426\n",
            "1 128  100 Train: 100.0 Test: 48.99999797344208\n",
            "1 128  100 Train: 100.0 Test: 53.999996185302734\n",
            "1 128  100 Train: 100.0 Test: 55.000001192092896\n",
            "1 128  100 Train: 100.0 Test: 50.999999046325684\n",
            "1 128  100 Train: 100.0 Test: 50.999999046325684\n",
            "1 128  100 Train: 100.0 Test: 66.99999570846558\n",
            "1 128  1000 Train: 99.99999489103045 Test: 55.900001525878906\n",
            "1 128  1000 Train: 99.99999489103045 Test: 57.10000395774841\n",
            "1 128  1000 Train: 99.99999489103045 Test: 57.90000557899475\n",
            "1 128  1000 Train: 99.99999489103045 Test: 53.90000343322754\n",
            "1 128  1000 Train: 99.99999489103045 Test: 54.100000858306885\n",
            "1 128  1000 Train: 99.99999489103045 Test: 58.30000042915344\n",
            "1 128  1000 Train: 99.99999489103045 Test: 58.30000042915344\n",
            "1 128  1000 Train: 99.99999489103045 Test: 58.500003814697266\n",
            "1 128  1000 Train: 99.99999489103045 Test: 56.49999976158142\n",
            "1 128  10000 Train: 99.99999413724805 Test: 75.544502053942\n",
            "1 128  10000 Train: 99.99999413724805 Test: 69.11335842950004\n",
            "1 128  10000 Train: 99.99999413724805 Test: 72.53043907029289\n",
            "1 128  10000 Train: 99.99999413724805 Test: 73.72234378542218\n",
            "1 128  10000 Train: 99.99999413724805 Test: 69.21625563076564\n",
            "1 128  10000 Train: 99.99999413724805 Test: 71.85302547046116\n",
            "1 128  10000 Train: 99.63459919710628 Test: 68.55599113873073\n",
            "1 128  10000 Train: 99.99999413724805 Test: 77.19087430409023\n",
            "1 128  10000 Train: 99.249452938799 Test: 74.9013866697039\n",
            "1 256  2 Train: 100.0 Test: 50.0\n",
            "1 256  2 Train: 100.0 Test: 50.0\n",
            "1 256  2 Train: 100.0 Test: 50.0\n",
            "1 256  2 Train: 100.0 Test: 100.0\n",
            "1 256  2 Train: 100.0 Test: 50.0\n",
            "1 256  2 Train: 100.0 Test: 50.0\n",
            "1 256  2 Train: 100.0 Test: 0.0\n",
            "1 256  2 Train: 100.0 Test: 50.0\n",
            "1 256  2 Train: 100.0 Test: 100.0\n",
            "1 256  10 Train: 100.0 Test: 50.0\n",
            "1 256  10 Train: 100.0 Test: 40.00000059604645\n",
            "1 256  10 Train: 100.0 Test: 30.000001192092896\n",
            "1 256  10 Train: 100.0 Test: 69.9999988079071\n",
            "1 256  10 Train: 100.0 Test: 60.00000238418579\n",
            "1 256  10 Train: 100.0 Test: 69.9999988079071\n",
            "1 256  10 Train: 100.0 Test: 60.00000238418579\n",
            "1 256  10 Train: 100.0 Test: 69.9999988079071\n",
            "1 256  10 Train: 100.0 Test: 50.0\n",
            "1 256  100 Train: 100.0 Test: 52.99999713897705\n",
            "1 256  100 Train: 100.0 Test: 45.99999785423279\n",
            "1 256  100 Train: 100.0 Test: 57.999998331069946\n",
            "1 256  100 Train: 100.0 Test: 53.999996185302734\n",
            "1 256  100 Train: 100.0 Test: 41.999998688697815\n",
            "1 256  100 Train: 100.0 Test: 47.999998927116394\n",
            "1 256  100 Train: 100.0 Test: 53.999996185302734\n",
            "1 256  100 Train: 100.0 Test: 59.99999642372131\n",
            "1 256  100 Train: 100.0 Test: 53.999996185302734\n",
            "1 256  1000 Train: 99.99999489103045 Test: 55.30000329017639\n",
            "1 256  1000 Train: 99.99999489103045 Test: 56.700003147125244\n",
            "1 256  1000 Train: 99.99999489103045 Test: 54.100000858306885\n",
            "1 256  1000 Train: 99.99999489103045 Test: 54.500001668930054\n",
            "1 256  1000 Train: 99.99999489103045 Test: 54.60000038146973\n",
            "1 256  1000 Train: 99.99999489103045 Test: 55.60000538825989\n",
            "1 256  1000 Train: 99.99999489103045 Test: 55.000001192092896\n",
            "1 256  1000 Train: 99.99999489103045 Test: 56.80000185966492\n",
            "1 256  1000 Train: 99.99999489103045 Test: 54.100000858306885\n",
            "1 256  10000 Train: 99.9901186247341 Test: 68.63316552979606\n",
            "1 256  10000 Train: 99.99999413724805 Test: 75.69027457918439\n",
            "1 256  10000 Train: 99.99999413724805 Test: 69.8507947581155\n",
            "1 256  10000 Train: 99.99999413724805 Test: 73.10495461736407\n",
            "1 256  10000 Train: 99.99999413724805 Test: 73.52512223379952\n",
            "1 256  10000 Train: 99.79260808131734 Test: 74.78991406304496\n",
            "1 256  10000 Train: 99.99999413724805 Test: 65.38758192743573\n",
            "1 256  10000 Train: 99.99999413724805 Test: 75.930369751794\n",
            "1 256  10000 Train: 99.9901186247341 Test: 72.43611557143075\n",
            "1 512  2 Train: 100.0 Test: 100.0\n",
            "1 512  2 Train: 100.0 Test: 100.0\n",
            "1 512  2 Train: 100.0 Test: 0.0\n",
            "1 512  2 Train: 100.0 Test: 50.0\n",
            "1 512  2 Train: 100.0 Test: 100.0\n",
            "1 512  2 Train: 100.0 Test: 100.0\n",
            "1 512  2 Train: 100.0 Test: 0.0\n",
            "1 512  2 Train: 100.0 Test: 50.0\n",
            "1 512  2 Train: 100.0 Test: 0.0\n",
            "1 512  10 Train: 100.0 Test: 40.00000059604645\n",
            "1 512  10 Train: 100.0 Test: 40.00000059604645\n",
            "1 512  10 Train: 100.0 Test: 60.00000238418579\n",
            "1 512  10 Train: 100.0 Test: 60.00000238418579\n",
            "1 512  10 Train: 100.0 Test: 50.0\n",
            "1 512  10 Train: 100.0 Test: 90.00000357627869\n",
            "1 512  10 Train: 100.0 Test: 80.0000011920929\n",
            "1 512  10 Train: 100.0 Test: 69.9999988079071\n",
            "1 512  10 Train: 100.0 Test: 30.000001192092896\n",
            "1 512  100 Train: 100.0 Test: 52.99999713897705\n",
            "1 512  100 Train: 100.0 Test: 57.999998331069946\n",
            "1 512  100 Train: 100.0 Test: 57.999998331069946\n",
            "1 512  100 Train: 100.0 Test: 53.999996185302734\n",
            "1 512  100 Train: 100.0 Test: 52.99999713897705\n",
            "1 512  100 Train: 100.0 Test: 56.99999928474426\n",
            "1 512  100 Train: 100.0 Test: 57.999998331069946\n",
            "1 512  100 Train: 100.0 Test: 46.99999988079071\n",
            "1 512  100 Train: 100.0 Test: 52.99999713897705\n",
            "1 512  1000 Train: 99.99999489103045 Test: 54.00000214576721\n",
            "1 512  1000 Train: 99.99999489103045 Test: 55.60000538825989\n",
            "1 512  1000 Train: 99.99999489103045 Test: 58.30000042915344\n",
            "1 512  1000 Train: 99.91393685340881 Test: 57.600003480911255\n",
            "1 512  1000 Train: 99.82787881578717 Test: 56.00000023841858\n",
            "1 512  1000 Train: 99.99999489103045 Test: 54.80000376701355\n",
            "1 512  1000 Train: 99.99999489103045 Test: 55.400002002716064\n",
            "1 512  1000 Train: 99.99999489103045 Test: 53.60000133514404\n",
            "1 512  1000 Train: 99.99999489103045 Test: 58.000004291534424\n",
            "1 512  10000 Train: 99.99999413724805 Test: 73.09638006346566\n",
            "1 512  10000 Train: 99.99999413724805 Test: 72.5304399217878\n",
            "1 512  10000 Train: 99.99999413724805 Test: 76.35053821972438\n",
            "1 512  10000 Train: 99.51609275380119 Test: 72.5304399217878\n",
            "1 512  10000 Train: 99.99999413724805 Test: 68.82181252752032\n",
            "1 512  10000 Train: 99.58522143911142 Test: 75.998968737466\n",
            "1 512  10000 Train: 99.70372807784159 Test: 67.60418329920087\n",
            "1 512  10000 Train: 99.99999413724805 Test: 72.29034304618835\n",
            "1 512  10000 Train: 99.9901186247341 Test: 75.68169917379107\n",
            "1 1024  2 Train: 100.0 Test: 100.0\n",
            "1 1024  2 Train: 100.0 Test: 50.0\n",
            "1 1024  2 Train: 100.0 Test: 0.0\n",
            "1 1024  2 Train: 100.0 Test: 50.0\n",
            "1 1024  2 Train: 100.0 Test: 0.0\n",
            "1 1024  2 Train: 100.0 Test: 0.0\n",
            "1 1024  2 Train: 100.0 Test: 50.0\n",
            "1 1024  2 Train: 100.0 Test: 0.0\n",
            "1 1024  2 Train: 100.0 Test: 50.0\n",
            "1 1024  10 Train: 100.0 Test: 50.0\n",
            "1 1024  10 Train: 100.0 Test: 80.0000011920929\n",
            "1 1024  10 Train: 100.0 Test: 80.0000011920929\n",
            "1 1024  10 Train: 100.0 Test: 69.9999988079071\n",
            "1 1024  10 Train: 100.0 Test: 50.0\n",
            "1 1024  10 Train: 100.0 Test: 60.00000238418579\n",
            "1 1024  10 Train: 100.0 Test: 50.0\n",
            "1 1024  10 Train: 100.0 Test: 30.000001192092896\n",
            "1 1024  10 Train: 100.0 Test: 40.00000059604645\n",
            "1 1024  100 Train: 100.0 Test: 47.999998927116394\n",
            "1 1024  100 Train: 100.0 Test: 50.999999046325684\n",
            "1 1024  100 Train: 100.0 Test: 56.99999928474426\n",
            "1 1024  100 Train: 100.0 Test: 56.99999928474426\n",
            "1 1024  100 Train: 100.0 Test: 56.00000023841858\n",
            "1 1024  100 Train: 100.0 Test: 55.000001192092896\n",
            "1 1024  100 Train: 100.0 Test: 51.99999809265137\n",
            "1 1024  100 Train: 100.0 Test: 55.000001192092896\n",
            "1 1024  100 Train: 100.0 Test: 56.00000023841858\n",
            "1 1024  1000 Train: 99.91393685340881 Test: 57.10000395774841\n",
            "1 1024  1000 Train: 99.74182077816555 Test: 53.00000309944153\n",
            "1 1024  1000 Train: 99.99999489103045 Test: 55.900001525878906\n",
            "1 1024  1000 Train: 99.99999489103045 Test: 59.3000054359436\n",
            "1 1024  1000 Train: 99.74182077816555 Test: 54.30000424385071\n",
            "1 1024  1000 Train: 99.65576188904899 Test: 56.10000491142273\n",
            "1 1024  1000 Train: 99.65576188904899 Test: 54.100000858306885\n",
            "1 1024  1000 Train: 99.82787796429226 Test: 57.30000138282776\n",
            "1 1024  1000 Train: 99.82787881578717 Test: 60.50000190734863\n",
            "1 1024  10000 Train: 99.99999413724805 Test: 76.01611954825265\n",
            "1 1024  10000 Train: 99.9407410621643 Test: 63.56971178736005\n",
            "1 1024  10000 Train: 99.83211013137317 Test: 64.30714981896537\n",
            "1 1024  10000 Train: 99.98024311222014 Test: 72.48756459781102\n",
            "1 1024  10000 Train: 99.99999413724805 Test: 72.54758902958461\n",
            "1 1024  10000 Train: 99.86173696205263 Test: 71.44143155642918\n",
            "1 1024  10000 Train: 99.98024311222014 Test: 69.17338030678886\n",
            "1 1024  10000 Train: 99.60497246413934 Test: 70.90121507644653\n",
            "1 1024  10000 Train: 99.99999413724805 Test: 72.42754016603742\n",
            "\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [],
      "metadata": {
        "id": "rfHkL-VliCT_"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "markdown",
      "source": [
        "# Prepare Imagenet"
      ],
      "metadata": {
        "id": "trcZ0mZEXLu3"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "!wget -nc https://image-net.org/data/ILSVRC/2012/ILSVRC2012_img_val.tar --no-check-certificate"
      ],
      "metadata": {
        "id": "GqeuZgOzXNb8",
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "outputId": "759f63cf-15ae-4d0c-8a02-4c3139380bb3"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "--2023-05-24 12:08:13--  https://image-net.org/data/ILSVRC/2012/ILSVRC2012_img_val.tar\n",
            "Resolving image-net.org (image-net.org)... 171.64.68.16\n",
            "Connecting to image-net.org (image-net.org)|171.64.68.16|:443... connected.\n",
            "HTTP request sent, awaiting response... 200 OK\n",
            "Length: 6744924160 (6.3G) [application/x-tar]\n",
            "Saving to: ‘ILSVRC2012_img_val.tar’\n",
            "\n",
            "ILSVRC2012_img_val. 100%[===================>]   6.28G  9.64MB/s    in 10m 49s \n",
            "\n",
            "2023-05-24 12:19:03 (9.91 MB/s) - ‘ILSVRC2012_img_val.tar’ saved [6744924160/6744924160]\n",
            "\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "val_fixed_code =\\\n",
        "\"\"\"\n",
        "#!/usr/bin/env bash\n",
        "\n",
        "#train_tar=\"${1:-ILSVRC2012_img_train.tar}\"\n",
        "val_tar=\"${2:-ILSVRC2012_img_val.tar}\"\n",
        "\n",
        "#mkdir -p train\n",
        "mkdir -p val\n",
        "\n",
        "#echo \"Extracting training set ... (might take a while)\"\n",
        "#tar -xf \"${train_tar}\" -C train\n",
        "\n",
        "#echo \"Extracting training categories ...\"\n",
        "#cd train\n",
        "#find . -name \"*.tar\" | xargs -n1 -P8 -I {} bash -c 'mkdir -p \"${1%.tar}\"; tar -xf \"${1}\" -C \"${1%.tar}\"; rm -f \"${1}\"' -- {}\n",
        "#cd ..\n",
        "\n",
        "echo \"Extracting validation set ...\"\n",
        "tar -xf \"${val_tar}\" -C val\n",
        "\n",
        "echo \"Restructuring validation ...\"\n",
        "cd val\n",
        "\n",
        "# Python like zip from two streams\n",
        "function zip34() { while read word3 <&3; do read word4 <&4 ; echo $word3 $word4 ; done }\n",
        "\n",
        "wget https://raw.githubusercontent.com/tensorflow/models/master/research/slim/datasets/imagenet_2012_validation_synset_labels.txt\n",
        "find . -name \"*.JPEG\" | sort > images.txt\n",
        "zip34 3<images.txt 4<imagenet_2012_validation_synset_labels.txt | xargs -n2 -P8 bash -c 'mkdir -p $2; mv $1 $2' argv0\n",
        "\n",
        "cd ..\n",
        "\n",
        "#echo \"train:\" $(find train -name \"*.JPEG\" | wc -l) \"images\"\n",
        "echo \"val:\" $(find val -name \"*.JPEG\" | wc -l) \"images\"\n",
        "\"\"\"\n",
        "\n",
        "with open(\"prepare_val_fixed.sh\", 'w') as fout:\n",
        "  print(val_fixed_code, file=fout)"
      ],
      "metadata": {
        "id": "un5KekAonbLX"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "!bash prepare_val_fixed.sh"
      ],
      "metadata": {
        "id": "18B41B_wXOEp",
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "outputId": "02bb81a2-6fca-4ed5-c5e7-ab3447e59f1d"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Extracting validation set ...\n",
            "Restructuring validation ...\n",
            "--2023-05-24 12:19:29--  https://raw.githubusercontent.com/tensorflow/models/master/research/slim/datasets/imagenet_2012_validation_synset_labels.txt\n",
            "Resolving raw.githubusercontent.com (raw.githubusercontent.com)... 185.199.108.133, 185.199.110.133, 185.199.111.133, ...\n",
            "Connecting to raw.githubusercontent.com (raw.githubusercontent.com)|185.199.108.133|:443... connected.\n",
            "HTTP request sent, awaiting response... 200 OK\n",
            "Length: 500000 (488K) [text/plain]\n",
            "Saving to: ‘imagenet_2012_validation_synset_labels.txt’\n",
            "\n",
            "imagenet_2012_valid 100%[===================>] 488.28K  --.-KB/s    in 0.04s   \n",
            "\n",
            "2023-05-24 12:19:29 (10.7 MB/s) - ‘imagenet_2012_validation_synset_labels.txt’ saved [500000/500000]\n",
            "\n",
            "val: 50000 images\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "!mkdir data"
      ],
      "metadata": {
        "id": "KWLLAzn5XSU4"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "!mv val data/"
      ],
      "metadata": {
        "id": "bHQHZYtKXpPA"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "!wget -P data/ https://image-net.org/data/ILSVRC/2012/ILSVRC2012_devkit_t12.tar.gz ILSVRC2012_devkit_t12.tar.gz"
      ],
      "metadata": {
        "id": "1nGbRdaGXsbp",
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "outputId": "38e6f2d3-fd26-402b-816a-5e696a772e12"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "--2023-05-24 12:20:39--  https://image-net.org/data/ILSVRC/2012/ILSVRC2012_devkit_t12.tar.gz\n",
            "Resolving image-net.org (image-net.org)... 171.64.68.16\n",
            "Connecting to image-net.org (image-net.org)|171.64.68.16|:443... connected.\n",
            "HTTP request sent, awaiting response... 200 OK\n",
            "Length: 2568145 (2.4M) [application/x-gzip]\n",
            "Saving to: ‘data/ILSVRC2012_devkit_t12.tar.gz’\n",
            "\n",
            "ILSVRC2012_devkit_t 100%[===================>]   2.45M  2.37MB/s    in 1.0s    \n",
            "\n",
            "2023-05-24 12:20:41 (2.37 MB/s) - ‘data/ILSVRC2012_devkit_t12.tar.gz’ saved [2568145/2568145]\n",
            "\n",
            "--2023-05-24 12:20:41--  http://ilsvrc2012_devkit_t12.tar.gz/\n",
            "Resolving ilsvrc2012_devkit_t12.tar.gz (ilsvrc2012_devkit_t12.tar.gz)... failed: Name or service not known.\n",
            "wget: unable to resolve host address ‘ilsvrc2012_devkit_t12.tar.gz’\n",
            "FINISHED --2023-05-24 12:20:41--\n",
            "Total wall clock time: 1.6s\n",
            "Downloaded: 1 files, 2.4M in 1.0s (2.37 MB/s)\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "my_dataset = datasets.ImageFolder(root=\"data/val\")\n",
        "\n",
        "writer = DatasetWriter(\"/tmp/imagenet_val\", {\n",
        "    'image': RGBImageField(write_mode=\"smart\",\n",
        "                            max_resolution=500,\n",
        "                            compress_probability=0.5,\n",
        "                            jpeg_quality=0.9),\n",
        "    'label': IntField(),\n",
        "}, num_workers=2)\n",
        "\n",
        "writer.from_indexed_dataset(my_dataset, chunksize=100)"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "kvIdBxy6qrbP",
        "outputId": "924abc1b-bbf3-4768-a4d3-11bfd9ff5fc7"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "100%|██████████| 50000/50000 [07:33<00:00, 110.31it/s]\n"
          ]
        }
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "ACsIEbMOiKzm"
      },
      "source": [
        "# Imagenet embeddings"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "IMAGENET_MEAN = np.array([0.485, 0.456, 0.406]) * 255\n",
        "IMAGENET_STD = np.array([0.229, 0.224, 0.225]) * 255\n",
        "DEFAULT_CROP_RATIO = 224/256"
      ],
      "metadata": {
        "id": "7rFSTcCUpJ6S"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "def create_val_loader(val_dataset, batch_size, resolution):\n",
        "  this_device = f'cuda:0'\n",
        "  val_path = Path(val_dataset)\n",
        "  assert val_path.is_file()\n",
        "  res_tuple = (resolution, resolution)\n",
        "  cropper = CenterCropRGBImageDecoder(res_tuple, ratio=DEFAULT_CROP_RATIO)\n",
        "  image_pipeline = [\n",
        "      cropper,\n",
        "      ToTensor(),\n",
        "      ToDevice(torch.device(this_device), non_blocking=True),\n",
        "      ToTorchImage(),\n",
        "      NormalizeImage(IMAGENET_MEAN, IMAGENET_STD, np.float16)\n",
        "  ]\n",
        "\n",
        "  label_pipeline = [\n",
        "      IntDecoder(),\n",
        "      ToTensor(),\n",
        "      Squeeze(),\n",
        "      ToDevice(torch.device(this_device),\n",
        "      non_blocking=True)\n",
        "  ]\n",
        "\n",
        "  loader = Loader(val_dataset,\n",
        "                  batch_size=batch_size,\n",
        "                  num_workers=2,\n",
        "                  order=OrderOption.SEQUENTIAL,\n",
        "                  drop_last=False,\n",
        "                  pipelines={\n",
        "                      'image': image_pipeline,\n",
        "                      'label': label_pipeline\n",
        "                  })\n",
        "  return loader"
      ],
      "metadata": {
        "id": "ie9efQabpTAL"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "loader = create_val_loader(\"/tmp/imagenet_val\", 500, 160)"
      ],
      "metadata": {
        "id": "7PShaYFMqJLq"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "def get_imagenet_embeddings(loader):\n",
        "  model = models.resnet18(weights=models.ResNet18_Weights.IMAGENET1K_V1).to(device)\n",
        "  model.fc = nn.Identity()\n",
        "  model.eval()\n",
        "  res = []\n",
        "  with torch.no_grad():\n",
        "    for batch in loader:\n",
        "        with autocast():\n",
        "          res.append(get_outputs(model, batch).detach().cpu())\n",
        "  return torch.cat(res).float()"
      ],
      "metadata": {
        "id": "RZWGNA0lwscu"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "imagenet_embeddings = get_imagenet_embeddings(loader)"
      ],
      "metadata": {
        "id": "2QB6nXMhw6wo",
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "outputId": "c1538ac4-514b-446e-e9c3-86f5a68bd712"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "Downloading: \"https://download.pytorch.org/models/resnet18-f37072fd.pth\" to /root/.cache/torch/hub/checkpoints/resnet18-f37072fd.pth\n",
            "100%|██████████| 44.7M/44.7M [00:00<00:00, 243MB/s]\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "print(imagenet_embeddings.shape)\n",
        "torch.save(imagenet_embeddings, \"imagenet_embeddings.pt\")"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "sOUKA2oOyKyN",
        "outputId": "39e0b88f-6132-4818-d157-f0852808a727"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "torch.Size([50000, 512])\n"
          ]
        }
      ]
    },
    {
      "cell_type": "markdown",
      "source": [
        "# Imagenet code"
      ],
      "metadata": {
        "id": "cfdDNLecyS2x"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "imagenet_code = \\\n",
        "\"\"\"\n",
        "from __future__ import print_function\n",
        "import torch\n",
        "import torch.nn as nn\n",
        "import torch.nn.functional as F\n",
        "import torch.optim as optim\n",
        "from torchvision import datasets, transforms, models\n",
        "from torch.optim.lr_scheduler import StepLR\n",
        "from tqdm import tqdm\n",
        "from torch.utils.data import DataLoader, Dataset, Subset\n",
        "import random\n",
        "import matplotlib.pyplot as plt\n",
        "import numpy as np\n",
        "import math\n",
        "from collections import OrderedDict\n",
        "import tensorflow as tf\n",
        "from PIL import Image\n",
        "import os\n",
        "import itertools\n",
        "from typing import List\n",
        "from torch.cuda.amp import GradScaler, autocast\n",
        "\n",
        "from ffcv.fields import IntField, RGBImageField\n",
        "from ffcv.fields.decoders import IntDecoder, SimpleRGBImageDecoder\n",
        "from ffcv.loader import Loader, OrderOption\n",
        "from ffcv.pipeline.operation import Operation\n",
        "from ffcv.transforms import RandomHorizontalFlip, Cutout, \\\n",
        "    RandomTranslate, Convert, ToDevice, ToTensor, ToTorchImage\n",
        "from ffcv.transforms.common import Squeeze\n",
        "from ffcv.writer import DatasetWriter\n",
        "import gc\n",
        "import sys\n",
        "from ffcv.transforms import ToTensor, ToDevice, Squeeze, NormalizeImage, \\\n",
        "    RandomHorizontalFlip, ToTorchImage\n",
        "from ffcv.fields.rgb_image import CenterCropRGBImageDecoder, \\\n",
        "    RandomResizedCropRGBImageDecoder\n",
        "from ffcv.fields.basics import IntDecoder\n",
        "from pathlib import Path\n",
        "\n",
        "import traceback\n",
        "import sys\n",
        "\n",
        "n_runs, n_points, n_negatives, dim, n_samples = [int(x) for x in sys.argv[1:]]\n",
        "print(f\"Runs: {n_runs} Points: {n_points} Negatives: {n_negatives} Dim: {dim} Samples: {n_samples}\")\n",
        "\n",
        "device = torch.device(\"cuda\")\n",
        "torch.manual_seed(318946379189643)\n",
        "\n",
        "\n",
        "\n",
        "def get_labels(dataset):\n",
        "  return torch.tensor(dataset.targets).tolist()\n",
        "  # return [label for (_, label) in dataset]\n",
        "\n",
        "\n",
        "def generate_until(gen_f, pred):\n",
        "  while True:\n",
        "    res = gen_f()\n",
        "    if pred(res):\n",
        "      return res\n",
        "\n",
        "\n",
        "def gen_order_with_ground_truth(embeddings, *, allowed_indices, n_samples, n_negatives):\n",
        "    order = []\n",
        "    for _ in range(n_samples):\n",
        "      cur = random.sample(allowed_indices, k=n_negatives + 2)\n",
        "      a, *candidates = cur\n",
        "      a_emb = embeddings[a]\n",
        "      similarities = a_emb @ embeddings[candidates].T\n",
        "      best = torch.argmax(similarities)\n",
        "      candidates[0], candidates[best] = candidates[best], candidates[0]\n",
        "      order += [a] + candidates\n",
        "    return order\n",
        "\n",
        "\n",
        "def contrastive_dataloader_with_ground_truth(dataset_path, embeddings, *, allowed_indices, n_samples, n_negatives, batch_size):\n",
        "    resolution = 160\n",
        "\n",
        "    order = gen_order_with_ground_truth(embeddings, allowed_indices=allowed_indices, n_samples=n_samples, n_negatives=n_negatives)\n",
        "\n",
        "    IMAGENET_MEAN = np.array([0.485, 0.456, 0.406]) * 255\n",
        "    IMAGENET_STD = np.array([0.229, 0.224, 0.225]) * 255\n",
        "    DEFAULT_CROP_RATIO = 224/256\n",
        "    this_device = f'cuda:0'\n",
        "    res_tuple = (resolution, resolution)\n",
        "    cropper = CenterCropRGBImageDecoder(res_tuple, ratio=DEFAULT_CROP_RATIO)\n",
        "    image_pipeline = [\n",
        "        cropper,\n",
        "        ToTensor(),\n",
        "        ToDevice(torch.device(this_device), non_blocking=True),\n",
        "        ToTorchImage(),\n",
        "        NormalizeImage(IMAGENET_MEAN, IMAGENET_STD, np.float16)\n",
        "    ]\n",
        "\n",
        "    label_pipeline = [\n",
        "        IntDecoder(),\n",
        "        ToTensor(),\n",
        "        Squeeze(),\n",
        "        ToDevice(torch.device(this_device),\n",
        "        non_blocking=True)\n",
        "    ]\n",
        "    batch_size = batch_size - batch_size % (n_negatives + 2)\n",
        "\n",
        "    loader = Loader(\"/tmp/imagenet_val\",\n",
        "                    batch_size=batch_size,\n",
        "                    num_workers=2,\n",
        "                    order=OrderOption.SEQUENTIAL,\n",
        "                    indices=order,\n",
        "                    drop_last=False,\n",
        "                    pipelines={\n",
        "                        'image': image_pipeline,\n",
        "                        'label': label_pipeline\n",
        "                    })\n",
        "    return loader\n",
        "\n",
        "def get_outputs(model, batch):\n",
        "  return model(batch[0].to(device))\n",
        "\n",
        "\n",
        "logsoftmax = nn.LogSoftmax(1)\n",
        "\n",
        "\n",
        "\n",
        "def contrastive_loss_acc(outputs, n_negatives):\n",
        "  assert outputs.shape[0] % (n_negatives + 2) == 0, (outputs.shape[0], n_negatives + 2)\n",
        "  # print(outputs.shape[0] / (n_negatives + 2))\n",
        "  tuples_sep = outputs.reshape([outputs.shape[0] // (n_negatives + 2), n_negatives + 2] + list(outputs.shape[1:]))\n",
        "  anchor = tuples_sep[:, :1]\n",
        "  candidates = tuples_sep[:, 1:]\n",
        "  inner_products = (anchor * candidates).sum(dim=-1)\n",
        "  # print(anchor.shape, candidates.shape, inner_products.shape)\n",
        "  softmax = logsoftmax(inner_products)\n",
        "  loss = torch.mean(-softmax[:, 0])\n",
        "  acc = torch.mean((softmax.argmax(dim=1) == 0).float())\n",
        "  return loss, acc\n",
        "\n",
        "\n",
        "def train(model, train_loader, scaler, optimizer, epoch, n_vals, loss_acc_f):\n",
        "  model.train()\n",
        "  n_batches = len(train_loader)\n",
        "  # progress_bar = tqdm(train_loader, position=0, leave=True, miniters=10)\n",
        "  losses = []\n",
        "  # for batch in progress_bar:\n",
        "\n",
        "  for i, batch in enumerate(train_loader):\n",
        "    optimizer.zero_grad()\n",
        "    with autocast():\n",
        "      outputs = get_outputs(model, batch)\n",
        "    n_vals -= outputs.shape[0]\n",
        "    if n_vals < 0:\n",
        "      outputs = outputs[:n_vals]\n",
        "    loss, _ = loss_acc_f(outputs)\n",
        "    losses.append(loss.detach().item())\n",
        "    scaler.scale(loss).backward()\n",
        "    scaler.step(optimizer)\n",
        "    scaler.update()\n",
        "    if n_vals < 0:\n",
        "      break\n",
        "    # progress_bar.set_description(f'Train Epoch: {epoch} [{len(losses)}/{n_batches} ({100. * len(losses) / n_batches:.0f}%)]\\tLoss: {np.mean(losses):.6f}', refresh=False)\n",
        "\n",
        "\n",
        "def test(model, test_loader, msg, n_vals, loss_acc_f):\n",
        "  model.eval()\n",
        "  test_loss = []\n",
        "  correct = []\n",
        "  with torch.no_grad():\n",
        "    for batch in test_loader:\n",
        "      with autocast():\n",
        "        outputs = get_outputs(model, batch)\n",
        "      n_vals -= outputs.shape[0]\n",
        "      if n_vals < 0:\n",
        "        outputs = outputs[:n_vals]\n",
        "      loss, acc = loss_acc_f(outputs)\n",
        "      test_loss.append(loss.detach().item())\n",
        "      correct.append(acc.detach().item())\n",
        "      if n_vals < 0:\n",
        "        break\n",
        "\n",
        "  print(f'{msg} Average loss: {np.mean(test_loss):.4f}, Accuracy: {100. * np.mean(correct):.2f}%)')\n",
        "  return 100 * np.mean(correct)\n",
        "\n",
        "\n",
        "embeddings = torch.load(\"imagenet_embeddings.pt\")\n",
        "\n",
        "n_vals = n_samples * (2 + n_negatives)\n",
        "epochs = 100\n",
        "init_n_points = embeddings.shape[0]\n",
        "for run in range(n_runs):\n",
        "# train_loader = train_loaders[n_negatives][run]\n",
        "# test_loader = test_loaders[n_negatives][run]\n",
        "  allowed_indices = random.sample(range(init_n_points), k=n_points)\n",
        "  train_loader = contrastive_dataloader_with_ground_truth(\"/tmp/imagenet_val\", embeddings, allowed_indices=allowed_indices, n_samples=n_samples, n_negatives=n_negatives, batch_size=500)\n",
        "  test_loader = contrastive_dataloader_with_ground_truth(\"/tmp/imagenet_val\", embeddings, allowed_indices=allowed_indices, n_samples=10000, n_negatives=n_negatives, batch_size=1000)\n",
        "  model = models.resnet18()\n",
        "  model.fc = nn.Linear(512, dim, bias=False)\n",
        "  model = model.to(device)\n",
        "  optimizer = optim.Adadelta(model.parameters(), lr=0.1)\n",
        "  scheduler = StepLR(optimizer, step_size=0.1, gamma=0.7)\n",
        "\n",
        "  scaler = GradScaler()\n",
        "  for epoch in range(1, epochs + 1):\n",
        "      train(model, train_loader, scaler, optimizer, epoch, n_vals, lambda o: contrastive_loss_acc(o, n_negatives))\n",
        "      scheduler.step()\n",
        "  train_acc = test(model, train_loader, \"Train\", n_vals, lambda o: contrastive_loss_acc(o, n_negatives))\n",
        "  last_test = test(model, test_loader, \"Test\", n_vals, lambda o: contrastive_loss_acc(o, n_negatives))\n",
        "  print(f\"{n_points} {n_negatives} {dim} {n_samples} Train: {train_acc} Test: {last_test}\")\n",
        "  with open(\"res_imagenet_dif_classes.txt\", \"a\") as fout:\n",
        "    print(f\"{n_points} {n_negatives} {dim} {n_samples} Train: {train_acc} Test: {last_test}\", file=fout)\n",
        "  # gc.collect()\n",
        "  print(\"-----------------------------------------------\")\n",
        "\"\"\""
      ],
      "metadata": {
        "id": "O9Otu1ZUzTjr"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "with open(\"runner_imagenet.py\", 'w') as fout:\n",
        "  print(imagenet_code, file=fout)"
      ],
      "metadata": {
        "id": "ddkE13s5yVr_"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "markdown",
      "source": [
        "# Run imagenet"
      ],
      "metadata": {
        "id": "NjvQhTJ8yyXs"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "for n_points in [10000]:\n",
        "  for dim in [512]:\n",
        "    for n_samples in [2, 10, 100, 1000]:\n",
        "      !python runner_imagenet.py 3 {n_points} 1 {dim} {n_samples}\n",
        "      !python runner_imagenet.py 3 {n_points} 1 {dim} {n_samples}\n",
        "      !python runner_imagenet.py 4 {n_points} 1 {dim} {n_samples}"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "AAe2gGo4Ukgb",
        "outputId": "2a396913-8607-4e80-8ea5-85667a5c7620"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "2023-05-23 18:41:16.409750: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 28.0938, Accuracy: 50.00%)\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f9b6e976b00; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 16.2500, Accuracy: 50.00%)\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-23 18:45:08.254085: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.0020, Accuracy: 50.00%)\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fa4042f6c20; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 21.3750, Accuracy: 50.00%)\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-23 18:48:37.263136: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 10000 Negatives: 1 Dim: 512 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 19.1562, Accuracy: 0.00%)\n",
            "10000 1 512 2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f27bcc16c40; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.8457, Accuracy: 50.00%)\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-23 18:51:46.434486: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 8.6328, Accuracy: 20.00%)\n",
            "10000 1 512 10 Train: 100.0 Test: 20.000000298023224\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 6.5078, Accuracy: 40.00%)\n",
            "10000 1 512 10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-23 18:54:57.618131: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.4844, Accuracy: 50.00%)\n",
            "10000 1 512 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fc15dc46a80; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.2773, Accuracy: 50.00%)\n",
            "10000 1 512 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fba16d447a0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-23 18:58:11.961297: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 10000 Negatives: 1 Dim: 512 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 7.1133, Accuracy: 70.00%)\n",
            "10000 1 512 10 Train: 100.0 Test: 69.9999988079071\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f0c7f5d2840; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.2227, Accuracy: 50.00%)\n",
            "10000 1 512 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f054fc24400; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-23 19:01:24.284093: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.9287, Accuracy: 44.00%)\n",
            "10000 1 512 100 Train: 100.0 Test: 43.99999976158142\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f273fa3b180; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.5820, Accuracy: 46.00%)\n",
            "10000 1 512 100 Train: 100.0 Test: 45.99999785423279\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-23 19:05:38.675553: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.3350, Accuracy: 52.00%)\n",
            "10000 1 512 100 Train: 100.0 Test: 51.99999809265137\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fa880dfab60; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.7471, Accuracy: 37.00%)\n",
            "10000 1 512 100 Train: 100.0 Test: 37.00000047683716\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-23 19:09:56.643763: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 10000 Negatives: 1 Dim: 512 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.2891, Accuracy: 54.00%)\n",
            "10000 1 512 100 Train: 100.0 Test: 53.999996185302734\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f02f3656ac0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.2100, Accuracy: 58.00%)\n",
            "10000 1 512 100 Train: 100.0 Test: 57.999998331069946\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-23 19:14:17.726271: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.3247, Accuracy: 67.72%)\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 67.71771758794785\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fb0d176ed80; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.3887, Accuracy: 43.24%)\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 43.24324429035187\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fa98bc66080; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-23 19:43:35.093360: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Test Average loss: 1.1738, Accuracy: 68.32%)\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 68.31831932067871\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f2db17faba0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.1873, Accuracy: 70.05%)\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 70.04504650831223\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-23 20:13:07.036059: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 10000 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.3789, Accuracy: 66.67%)\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 66.66666865348816\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.1768, Accuracy: 67.64%)\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 67.64264404773712\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0003, Accuracy: 100.00%)\n",
            "^C\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "with open(\"res_imagenet_dif_classes.txt\", \"r\") as fin:\n",
        "  print(fin.read())"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "lY2sGS7RVTqx",
        "outputId": "b5656a30-088c-43d3-e44a-4623bee89424"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "10000 1 512 2 Train: 100.0 Test: 0.0\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "10000 1 512 10 Train: 100.0 Test: 20.000000298023224\n",
            "10000 1 512 10 Train: 100.0 Test: 40.00000059604645\n",
            "10000 1 512 10 Train: 100.0 Test: 50.0\n",
            "10000 1 512 10 Train: 100.0 Test: 50.0\n",
            "10000 1 512 10 Train: 100.0 Test: 69.9999988079071\n",
            "10000 1 512 10 Train: 100.0 Test: 50.0\n",
            "10000 1 512 100 Train: 100.0 Test: 43.99999976158142\n",
            "10000 1 512 100 Train: 100.0 Test: 45.99999785423279\n",
            "10000 1 512 100 Train: 100.0 Test: 51.99999809265137\n",
            "10000 1 512 100 Train: 100.0 Test: 37.00000047683716\n",
            "10000 1 512 100 Train: 100.0 Test: 53.999996185302734\n",
            "10000 1 512 100 Train: 100.0 Test: 57.999998331069946\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 67.71771758794785\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 43.24324429035187\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 68.31831932067871\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 70.04504650831223\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 66.66666865348816\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 67.64264404773712\n",
            "\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "for _ in range(3):\n",
        "  for n_points in [1000, 10000]:\n",
        "    for dim in [512]:\n",
        "      for n_samples in [10000]:\n",
        "        !python runner_imagenet.py 3 {n_points} 1 {dim} {n_samples}"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "oRshXOc1VTJj",
        "outputId": "3f09478c-03aa-488e-9db1-521db1e0a431"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "2023-05-23 20:42:33.602250: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.3820, Accuracy: 74.05%)\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 74.04921285567745\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f0a999a04c0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0073, Accuracy: 99.71%)\n",
            "Test Average loss: 2.4789, Accuracy: 75.58%)\n",
            "1000 1 512 10000 Train: 99.71360349264302 Test: 75.57590065463897\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f0a18818f00; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.5357, Accuracy: 72.00%)\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 71.99942085050768\n",
            "-----------------------------------------------\n",
            "2023-05-23 22:22:27.609403: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.1253, Accuracy: 63.99%)\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 63.99108959782508\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f21aec369a0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.0730, Accuracy: 63.90%)\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 63.8971249903402\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f2143cbf2e0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Exception ignored in: <finalize object at 0x7f1a7f2b65e0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.9783, Accuracy: 65.69%)\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 65.68827090724822\n",
            "-----------------------------------------------\n",
            "2023-05-24 00:03:27.320116: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Train Average loss: 0.0104, Accuracy: 99.76%)\n",
            "Test Average loss: 2.3699, Accuracy: 73.41%)\n",
            "1000 1 512 10000 Train: 99.76298125063788 Test: 73.41277022515574\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fef0c6483a0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.1642, Accuracy: 97.50%)\n",
            "Test Average loss: 3.1062, Accuracy: 73.29%)\n",
            "1000 1 512 10000 Train: 97.4999970099965 Test: 73.28974335424363\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fee8b4c0d80; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0110, Accuracy: 99.64%)\n",
            "Test Average loss: 2.4394, Accuracy: 72.85%)\n",
            "1000 1 512 10000 Train: 99.64447500275784 Test: 72.84801121680967\n",
            "-----------------------------------------------\n",
            "2023-05-24 01:47:40.729613: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Train Average loss: 0.0034, Accuracy: 99.91%)\n",
            "Test Average loss: 3.1650, Accuracy: 63.51%)\n",
            "10000 1 512 10000 Train: 99.91111432919737 Test: 63.50963980920853\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f6b13256a80; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 3.1183, Accuracy: 64.81%)\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 64.8077126472227\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f6a962f73a0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.9389, Accuracy: 64.39%)\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 64.38826091827885\n",
            "-----------------------------------------------\n",
            "2023-05-24 03:30:53.946637: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.4003, Accuracy: 74.60%)\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 74.60428399424399\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f16599ac4e0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.3080, Accuracy: 74.48%)\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 74.48222637176514\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f15d87ccf20; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.2510, Accuracy: 74.03%)\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 74.02983826975668\n",
            "-----------------------------------------------\n",
            "2023-05-24 05:15:43.381019: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10000 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.1163, Accuracy: 63.95%)\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 63.949434603414225\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fcb42c36a20; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.1978, Accuracy: 64.56%)\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 64.555848029352\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fcac5ab7380; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.1750, Accuracy: 63.89%)\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 63.89131315292851\n",
            "-----------------------------------------------\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "with open(\"res_imagenet_dif_classes.txt\", \"r\") as fin:\n",
        "  print(fin.read())"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "BC5e2gA4VpBw",
        "outputId": "9419140d-821f-479e-9bc7-0a889e63843a"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "10000 1 512 2 Train: 100.0 Test: 0.0\n",
            "10000 1 512 2 Train: 100.0 Test: 50.0\n",
            "10000 1 512 10 Train: 100.0 Test: 20.000000298023224\n",
            "10000 1 512 10 Train: 100.0 Test: 40.00000059604645\n",
            "10000 1 512 10 Train: 100.0 Test: 50.0\n",
            "10000 1 512 10 Train: 100.0 Test: 50.0\n",
            "10000 1 512 10 Train: 100.0 Test: 69.9999988079071\n",
            "10000 1 512 10 Train: 100.0 Test: 50.0\n",
            "10000 1 512 100 Train: 100.0 Test: 43.99999976158142\n",
            "10000 1 512 100 Train: 100.0 Test: 45.99999785423279\n",
            "10000 1 512 100 Train: 100.0 Test: 51.99999809265137\n",
            "10000 1 512 100 Train: 100.0 Test: 37.00000047683716\n",
            "10000 1 512 100 Train: 100.0 Test: 53.999996185302734\n",
            "10000 1 512 100 Train: 100.0 Test: 57.999998331069946\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 67.71771758794785\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 43.24324429035187\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 68.31831932067871\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 70.04504650831223\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 66.66666865348816\n",
            "10000 1 512 1000 Train: 99.99999489103045 Test: 67.64264404773712\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 74.04921285567745\n",
            "1000 1 512 10000 Train: 99.71360349264302 Test: 75.57590065463897\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 71.99942085050768\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 63.99108959782508\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 63.8971249903402\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 65.68827090724822\n",
            "1000 1 512 10000 Train: 99.76298125063788 Test: 73.41277022515574\n",
            "1000 1 512 10000 Train: 97.4999970099965 Test: 73.28974335424363\n",
            "1000 1 512 10000 Train: 99.64447500275784 Test: 72.84801121680967\n",
            "10000 1 512 10000 Train: 99.91111432919737 Test: 63.50963980920853\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 64.8077126472227\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 64.38826091827885\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 74.60428399424399\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 74.48222637176514\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 74.02983826975668\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 63.949434603414225\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 64.555848029352\n",
            "10000 1 512 10000 Train: 99.99999413724805 Test: 63.89131315292851\n",
            "\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "for n_points in [10, 100, 1000, 10000]:\n",
        "  for dim in [512]:\n",
        "    for n_samples in [2, 10, 100, 1000, 10000]:\n",
        "      !python runner_imagenet.py 3 {n_points} 1 {dim} {n_samples}\n",
        "      !python runner_imagenet.py 3 {n_points} 1 {dim} {n_samples}\n",
        "      !python runner_imagenet.py 4 {n_points} 1 {dim} {n_samples}"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "1UPS_th9w9Kn",
        "outputId": "994026d1-f267-4634-ea85-471770a2374c"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "2023-05-23 00:24:47.793170: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 00:24:50.086351: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10 Negatives: 1 Dim: 512 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 18.8125, Accuracy: 0.00%)\n",
            "10 1 512 2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 00:26:23.447329: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 00:26:25.490146: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10 Negatives: 1 Dim: 512 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.7510, Accuracy: 50.00%)\n",
            "10 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 00:28:10.150918: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 00:28:12.319310: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 10 Negatives: 1 Dim: 512 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "10 1 512 2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 00:29:56.010221: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 00:29:58.030778: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10 Negatives: 1 Dim: 512 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.2969, Accuracy: 70.00%)\n",
            "10 1 512 10 Train: 100.0 Test: 69.9999988079071\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 00:31:45.020376: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 00:31:47.015424: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10 Negatives: 1 Dim: 512 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.8809, Accuracy: 70.00%)\n",
            "10 1 512 10 Train: 100.0 Test: 69.9999988079071\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 00:33:33.004813: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 00:33:35.417335: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 10 Negatives: 1 Dim: 512 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 12.9062, Accuracy: 40.00%)\n",
            "10 1 512 10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 00:35:23.645256: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 00:35:26.034151: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10 Negatives: 1 Dim: 512 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0005, Accuracy: 100.00%)\n",
            "Test Average loss: 0.5718, Accuracy: 88.00%)\n",
            "10 1 512 100 Train: 100.0 Test: 87.99999952316284\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 00:37:47.143019: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 00:37:49.161560: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10 Negatives: 1 Dim: 512 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.5591, Accuracy: 88.00%)\n",
            "Test Average loss: 1.4619, Accuracy: 75.00%)\n",
            "10 1 512 100 Train: 87.99999952316284 Test: 75.0\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 00:40:07.591067: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 00:40:09.762112: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 10 Negatives: 1 Dim: 512 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0043, Accuracy: 100.00%)\n",
            "Test Average loss: 0.4216, Accuracy: 92.00%)\n",
            "10 1 512 100 Train: 100.0 Test: 91.99999570846558\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 00:42:29.388548: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 00:42:31.387726: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Train Average loss: 0.0079, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0017, Accuracy: 100.00%)\n",
            "10 1 512 1000 Train: 99.99999489103045 Test: 100.0\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 00:49:39.668237: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 00:49:41.665716: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Train Average loss: 0.3255, Accuracy: 90.49%)\n",
            "Test Average loss: 0.1755, Accuracy: 94.37%)\n",
            "10 1 512 1000 Train: 90.49053021839687 Test: 94.36937123537064\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 00:57:10.560634: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 00:57:12.566786: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 10 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Train Average loss: 0.0017, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0188, Accuracy: 99.70%)\n",
            "10 1 512 1000 Train: 99.99999489103045 Test: 99.69969987869263\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 01:04:17.378139: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 01:04:19.366257: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "10 1 512 10000 Train: 99.99999413724805 Test: 100.0\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Exception ignored in: <finalize object at 0x7fdf1eae8b20; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Exception ignored in: <finalize object at 0x7fde77c21560; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Test Average loss: 0.0001, Accuracy: 100.00%)\n",
            "10 1 512 10000 Train: 99.99999413724805 Test: 100.0\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Exception ignored in: <finalize object at 0x7fd7b2d04dc0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Exception ignored in: <finalize object at 0x7fd769fc0880; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Test Average loss: 0.0003, Accuracy: 100.00%)\n",
            "10 1 512 10000 Train: 99.99999413724805 Test: 100.0\n",
            "-----------------------------------------------\n",
            "2023-05-23 04:02:35.593637: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 04:02:37.383443: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 10 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "10 1 512 10000 Train: 99.99999413724805 Test: 100.0\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Exception ignored in: <finalize object at 0x7f219fddcb00; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Exception ignored in: <finalize object at 0x7f213f4bd540; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "10 1 512 10000 Train: 99.99999413724805 Test: 100.0\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Exception ignored in: <finalize object at 0x7f1a2e7ace00; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Exception ignored in: <finalize object at 0x7f19e5854860; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "10 1 512 10000 Train: 99.99999413724805 Test: 100.0\n",
            "-----------------------------------------------\n",
            "2023-05-23 07:02:17.230134: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 07:02:19.055016: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 10 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "10 1 512 10000 Train: 99.99999413724805 Test: 100.0\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Exception ignored in: <finalize object at 0x7f6d852a4b80; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Exception ignored in: <finalize object at 0x7f6cc0d095c0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "10 1 512 10000 Train: 99.99999413724805 Test: 100.0\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Exception ignored in: <finalize object at 0x7f6606180e20; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Exception ignored in: <finalize object at 0x7f65bcb7c8c0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "10 1 512 10000 Train: 99.99999413724805 Test: 100.0\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Exception ignored in: <finalize object at 0x7f6d7d8d1a60; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Exception ignored in: <finalize object at 0x7f6cc10262a0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "10 1 512 10000 Train: 99.99999413724805 Test: 100.0\n",
            "-----------------------------------------------\n",
            "2023-05-23 10:49:14.695202: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 10:49:15.976054: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 17.1562, Accuracy: 50.00%)\n",
            "100 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 10:51:03.570955: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 10:51:06.046704: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.8711, Accuracy: 0.00%)\n",
            "100 1 512 2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 10:52:58.534881: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 10:53:01.180581: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 100 Negatives: 1 Dim: 512 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.0938, Accuracy: 50.00%)\n",
            "100 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 10:54:50.304340: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 10:54:52.756856: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.4414, Accuracy: 80.00%)\n",
            "100 1 512 10 Train: 100.0 Test: 80.0000011920929\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 10:56:43.593652: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 10:56:46.181885: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.2539, Accuracy: 40.00%)\n",
            "100 1 512 10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 10:58:39.933724: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 10:58:42.188197: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 100 Negatives: 1 Dim: 512 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 8.6719, Accuracy: 30.00%)\n",
            "100 1 512 10 Train: 100.0 Test: 30.000001192092896\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 11:00:35.349863: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 11:00:37.559579: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.5840, Accuracy: 72.00%)\n",
            "100 1 512 100 Train: 100.0 Test: 71.99999690055847\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 11:03:05.721396: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 11:03:07.922614: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.3379, Accuracy: 61.00%)\n",
            "100 1 512 100 Train: 100.0 Test: 61.000001430511475\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 11:05:34.028434: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 11:05:36.566897: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 100 Negatives: 1 Dim: 512 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.7939, Accuracy: 57.00%)\n",
            "100 1 512 100 Train: 100.0 Test: 56.99999928474426\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 11:08:03.323467: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 11:08:05.585837: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Train Average loss: 0.0296, Accuracy: 99.48%)\n",
            "Test Average loss: 1.5420, Accuracy: 82.58%)\n",
            "100 1 512 1000 Train: 99.48364496231079 Test: 82.58258402347565\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 11:15:56.578995: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 11:15:59.171702: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Train Average loss: 0.0006, Accuracy: 100.00%)\n",
            "Test Average loss: 0.8455, Accuracy: 84.76%)\n",
            "100 1 512 1000 Train: 99.99999489103045 Test: 84.7597599029541\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 11:23:36.073000: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 11:23:38.363849: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 100 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.5683, Accuracy: 78.90%)\n",
            "100 1 512 1000 Train: 99.99999489103045 Test: 78.90390455722809\n",
            "-----------------------------------------------\n",
            "^C\n",
            "2023-05-23 11:31:30.553224: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 11:31:32.866063: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Train Average loss: 0.2697, Accuracy: 93.43%)\n",
            "Test Average loss: 0.7698, Accuracy: 85.70%)\n",
            "100 1 512 10000 Train: 93.43274411607962 Test: 85.6960210107988\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.4197, Accuracy: 90.56%)\n",
            "Exception ignored in: <finalize object at 0x7f4e213340a0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Exception ignored in: <finalize object at 0x7f4dba53a180; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Test Average loss: 0.9092, Accuracy: 84.23%)\n",
            "100 1 512 10000 Train: 90.55747243224597 Test: 84.22648752889326\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.2729, Accuracy: 93.34%)\n",
            "Exception ignored in: <finalize object at 0x7f4699769680; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Exception ignored in: <finalize object at 0x7f4698321fc0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Test Average loss: 0.7197, Accuracy: 86.17%)\n",
            "100 1 512 10000 Train: 93.34386430802893 Test: 86.17068894447819\n",
            "-----------------------------------------------\n",
            "2023-05-23 14:29:48.158471: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "2023-05-23 14:29:50.068494: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 100 Negatives: 1 Dim: 512 Samples: 10000\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "with open(\"res_imagenet_dif_classes.txt\", \"r\") as fin:\n",
        "  print(fin.read())"
      ],
      "metadata": {
        "id": "YX-MMwkQ0mFD"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [],
      "metadata": {
        "id": "JvqdIznaeRWv"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "markdown",
      "source": [
        "## dimensions"
      ],
      "metadata": {
        "id": "zwPt9IoPp9iF"
      }
    },
    {
      "cell_type": "code",
      "source": [
        "for n_points in [1000]:\n",
        "  for dim in [128, 256, 512, 1024]:\n",
        "    for n_samples in [2, 10, 100, 1000]:\n",
        "      !python runner_imagenet.py 3 {n_points} 1 {dim} {n_samples}\n",
        "      !python runner_imagenet.py 3 {n_points} 1 {dim} {n_samples}\n",
        "      !python runner_imagenet.py 4 {n_points} 1 {dim} {n_samples}"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "pf_bc5zDp_mO",
        "outputId": "1b9d7b98-2241-44ef-a287-89ded4614a99"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "2023-05-24 12:30:42.101018: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 128 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.7227, Accuracy: 50.00%)\n",
            "1000 1 128 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f0dcfbfc500; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.3809, Accuracy: 50.00%)\n",
            "1000 1 128 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f0698db9320; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 12:34:31.200355: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 128 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.4326, Accuracy: 0.00%)\n",
            "1000 1 128 2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fd140370920; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.2617, Accuracy: 50.00%)\n",
            "1000 1 128 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 12:38:02.917856: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 128 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.7256, Accuracy: 50.00%)\n",
            "1000 1 128 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fc7f16b06a0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1000 1 128 2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 12:41:33.730355: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 128 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.4619, Accuracy: 40.00%)\n",
            "1000 1 128 10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.1768, Accuracy: 30.00%)\n",
            "1000 1 128 10 Train: 100.0 Test: 30.000001192092896\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 12:44:51.293071: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 128 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.9980, Accuracy: 60.00%)\n",
            "1000 1 128 10 Train: 100.0 Test: 60.00000238418579\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f6fdd6307c0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.4673, Accuracy: 60.00%)\n",
            "1000 1 128 10 Train: 100.0 Test: 60.00000238418579\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f6897aa8be0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 12:48:12.279804: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 128 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.7090, Accuracy: 60.00%)\n",
            "1000 1 128 10 Train: 100.0 Test: 60.00000238418579\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.8477, Accuracy: 60.00%)\n",
            "1000 1 128 10 Train: 100.0 Test: 60.00000238418579\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 12:51:32.429834: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 128 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.2246, Accuracy: 54.00%)\n",
            "1000 1 128 100 Train: 100.0 Test: 53.999996185302734\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f42799bcb40; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.2490, Accuracy: 65.00%)\n",
            "1000 1 128 100 Train: 100.0 Test: 64.99999761581421\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 12:56:09.368250: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 128 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Test Average loss: 1.1240, Accuracy: 54.00%)\n",
            "1000 1 128 100 Train: 100.0 Test: 53.999996185302734\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f040ccc4ac0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Test Average loss: 1.0273, Accuracy: 55.00%)\n",
            "1000 1 128 100 Train: 100.0 Test: 55.000001192092896\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 13:00:46.698258: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 128 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Test Average loss: 1.1094, Accuracy: 52.00%)\n",
            "1000 1 128 100 Train: 100.0 Test: 51.99999809265137\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fad4fbd06a0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Test Average loss: 1.0947, Accuracy: 53.00%)\n",
            "1000 1 128 100 Train: 100.0 Test: 52.99999713897705\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 13:05:11.358699: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 128 Samples: 1000\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.3157, Accuracy: 75.38%)\n",
            "1000 1 128 1000 Train: 99.99999489103045 Test: 75.37537664175034\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Test Average loss: 1.3458, Accuracy: 73.87%)\n",
            "1000 1 128 1000 Train: 99.99999489103045 Test: 73.87387454509735\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0062, Accuracy: 99.66%)\n",
            "^C\n",
            "2023-05-24 13:18:29.938487: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 128 Samples: 1000\n",
            "Train Average loss: 0.0065, Accuracy: 100.00%)\n",
            "Test Average loss: 1.7581, Accuracy: 48.72%)\n",
            "1000 1 128 1000 Train: 99.99999489103045 Test: 48.723725974559784\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f4f8eb5c620; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Test Average loss: 1.4904, Accuracy: 74.85%)\n",
            "1000 1 128 1000 Train: 99.99999489103045 Test: 74.84984993934631\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0003, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 13:31:17.625473: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 128 Samples: 1000\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Test Average loss: 5.5620, Accuracy: 49.70%)\n",
            "1000 1 128 1000 Train: 99.99999489103045 Test: 49.699701368808746\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fa6df8f04c0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.3217, Accuracy: 76.13%)\n",
            "1000 1 128 1000 Train: 99.99999489103045 Test: 76.12612694501877\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f9fa9bca040; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0318, Accuracy: 96.43%)\n",
            "^C\n",
            "2023-05-24 13:43:58.754839: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 256 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.9736, Accuracy: 50.00%)\n",
            "1000 1 256 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f73735a83c0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0283, Accuracy: 100.00%)\n",
            "1000 1 256 2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 13:47:11.777080: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 256 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.4746, Accuracy: 50.00%)\n",
            "1000 1 256 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f8a70e745e0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.6436, Accuracy: 50.00%)\n",
            "1000 1 256 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f832b32efe0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 13:50:23.726623: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 256 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 4.9961, Accuracy: 50.00%)\n",
            "1000 1 256 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fb198f4c5c0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 21.9062, Accuracy: 50.00%)\n",
            "1000 1 256 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7faa5352ca20; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 13:53:33.578957: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 256 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 6.6367, Accuracy: 40.00%)\n",
            "1000 1 256 10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f1483cd8480; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.7480, Accuracy: 50.00%)\n",
            "1000 1 256 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 13:56:48.743148: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 256 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.0859, Accuracy: 50.00%)\n",
            "1000 1 256 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f2d828f4600; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 6.4531, Accuracy: 40.00%)\n",
            "1000 1 256 10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f263cd30a00; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 14:00:00.463711: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 256 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.2734, Accuracy: 50.00%)\n",
            "1000 1 256 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f8ee455c600; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 6.3984, Accuracy: 40.00%)\n",
            "1000 1 256 10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 14:03:26.756152: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 256 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.7100, Accuracy: 49.00%)\n",
            "1000 1 256 100 Train: 100.0 Test: 48.99999797344208\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f5014e90880; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 2.1621, Accuracy: 51.00%)\n",
            "1000 1 256 100 Train: 100.0 Test: 50.999999046325684\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f48cf26cc60; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 14:07:42.873978: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 256 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.1826, Accuracy: 49.00%)\n",
            "1000 1 256 100 Train: 100.0 Test: 48.99999797344208\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f17ed9d84e0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.7432, Accuracy: 59.00%)\n",
            "1000 1 256 100 Train: 100.0 Test: 58.99999737739563\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f10a7d988e0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 14:12:02.503518: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 256 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.0176, Accuracy: 59.00%)\n",
            "1000 1 256 100 Train: 100.0 Test: 58.99999737739563\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fa9d220c420; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.1924, Accuracy: 55.00%)\n",
            "1000 1 256 100 Train: 100.0 Test: 55.000001192092896\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 14:16:36.863768: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 256 Samples: 1000\n",
            "Train Average loss: 0.0020, Accuracy: 100.00%)\n",
            "Test Average loss: 1.4268, Accuracy: 74.10%)\n",
            "1000 1 256 1000 Train: 99.99999489103045 Test: 74.09909963607788\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fb724ba89c0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Test Average loss: 1.3405, Accuracy: 73.87%)\n",
            "1000 1 256 1000 Train: 99.99999489103045 Test: 73.87387603521347\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0311, Accuracy: 96.43%)\n",
            "^C\n",
            "2023-05-24 14:29:30.763199: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 256 Samples: 1000\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.2924, Accuracy: 74.25%)\n",
            "1000 1 256 1000 Train: 99.99999489103045 Test: 74.24924969673157\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f53e3c40a20; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0003, Accuracy: 100.00%)\n",
            "Test Average loss: 1.3132, Accuracy: 73.05%)\n",
            "1000 1 256 1000 Train: 99.99999489103045 Test: 73.04804921150208\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 14:42:19.467616: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 256 Samples: 1000\n",
            "Train Average loss: 0.0003, Accuracy: 100.00%)\n",
            "Test Average loss: 1.3572, Accuracy: 73.87%)\n",
            "1000 1 256 1000 Train: 99.99999489103045 Test: 73.87387603521347\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0003, Accuracy: 100.00%)\n",
            "Test Average loss: 2.4443, Accuracy: 49.85%)\n",
            "1000 1 256 1000 Train: 99.99999489103045 Test: 49.84985142946243\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 14:55:12.225907: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0005, Accuracy: 100.00%)\n",
            "1000 1 512 2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f623fe5c480; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 16.8438, Accuracy: 0.00%)\n",
            "1000 1 512 2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 14:58:23.638223: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 15.9688, Accuracy: 50.00%)\n",
            "1000 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f3808474640; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1000 1 512 2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f30c28694e0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 15:01:32.575611: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 512 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.6709, Accuracy: 50.00%)\n",
            "1000 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 19.4375, Accuracy: 50.00%)\n",
            "1000 1 512 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 15:04:42.345994: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.0605, Accuracy: 50.00%)\n",
            "1000 1 512 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 14.0234, Accuracy: 50.00%)\n",
            "1000 1 512 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 15:08:10.537831: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.1094, Accuracy: 50.00%)\n",
            "1000 1 512 10 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fae0164c500; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 18.9531, Accuracy: 40.00%)\n",
            "1000 1 512 10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fa6c5add320; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 15:11:30.793952: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 512 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.3291, Accuracy: 80.00%)\n",
            "1000 1 512 10 Train: 100.0 Test: 80.0000011920929\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fd68f670600; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.5664, Accuracy: 70.00%)\n",
            "1000 1 512 10 Train: 100.0 Test: 69.9999988079071\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fcf59ad1480; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 15:14:41.950110: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.2598, Accuracy: 52.00%)\n",
            "1000 1 512 100 Train: 100.0 Test: 51.99999809265137\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f534a224800; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.6289, Accuracy: 41.00%)\n",
            "1000 1 512 100 Train: 100.0 Test: 40.99999964237213\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 15:19:02.401628: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.4912, Accuracy: 61.00%)\n",
            "1000 1 512 100 Train: 100.0 Test: 61.000001430511475\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f2b61d044a0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.0938, Accuracy: 46.00%)\n",
            "1000 1 512 100 Train: 100.0 Test: 45.99999785423279\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 15:23:22.690495: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 512 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.6719, Accuracy: 55.00%)\n",
            "1000 1 512 100 Train: 100.0 Test: 55.000001192092896\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f235a77c660; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.5342, Accuracy: 54.00%)\n",
            "1000 1 512 100 Train: 100.0 Test: 53.999996185302734\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 15:27:45.731188: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Train Average loss: 0.0009, Accuracy: 100.00%)\n",
            "Test Average loss: 1.1107, Accuracy: 75.98%)\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 75.97597688436508\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7efb18a28860; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0003, Accuracy: 100.00%)\n",
            "Test Average loss: 3.6838, Accuracy: 49.55%)\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 49.54955130815506\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 15:40:50.075636: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.1719, Accuracy: 73.65%)\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 73.64865094423294\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fd7035203e0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0004, Accuracy: 100.00%)\n",
            "Test Average loss: 1.7173, Accuracy: 50.00%)\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 50.00000149011612\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 15:53:51.706879: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 512 Samples: 1000\n",
            "Train Average loss: 0.0015, Accuracy: 100.00%)\n",
            "Test Average loss: 1.1013, Accuracy: 73.87%)\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 73.87387454509735\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f8098a4c720; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 1.0793, Accuracy: 75.75%)\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 75.75075179338455\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f7952e2a1c0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0003, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 16:07:04.998858: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 1024 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 7.3750, Accuracy: 50.00%)\n",
            "1000 1 1024 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7ff328c78360; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 19.9375, Accuracy: 50.00%)\n",
            "1000 1 1024 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7febe2f0ad60; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 16:10:19.515545: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 1024 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0000, Accuracy: 100.00%)\n",
            "1000 1 1024 2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f5ec12c0340; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 0.0155, Accuracy: 100.00%)\n",
            "1000 1 1024 2 Train: 100.0 Test: 100.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 16:13:34.352828: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 1024 Samples: 2\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 8.0625, Accuracy: 0.00%)\n",
            "1000 1 1024 2 Train: 100.0 Test: 0.0\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fb8d89103c0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 5.3750, Accuracy: 50.00%)\n",
            "1000 1 1024 2 Train: 100.0 Test: 50.0\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 16:16:48.355349: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 1024 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 8.7969, Accuracy: 30.00%)\n",
            "1000 1 1024 10 Train: 100.0 Test: 30.000001192092896\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f32d0aa4700; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 1.3867, Accuracy: 70.00%)\n",
            "1000 1 1024 10 Train: 100.0 Test: 69.9999988079071\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 16:20:02.946255: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 1024 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 7.8203, Accuracy: 40.00%)\n",
            "1000 1 1024 10 Train: 100.0 Test: 40.00000059604645\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f7701a68540; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.3105, Accuracy: 70.00%)\n",
            "1000 1 1024 10 Train: 100.0 Test: 69.9999988079071\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 16:23:23.422677: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 1024 Samples: 10\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 10.3672, Accuracy: 20.00%)\n",
            "1000 1 1024 10 Train: 100.0 Test: 20.000000298023224\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fc46e6e4740; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.9961, Accuracy: 70.00%)\n",
            "1000 1 1024 10 Train: 100.0 Test: 69.9999988079071\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fbd28ca4b20; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 16:26:34.202429: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 1024 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.2734, Accuracy: 57.00%)\n",
            "1000 1 1024 100 Train: 100.0 Test: 56.99999928474426\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f7e38f90a60; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.5957, Accuracy: 55.00%)\n",
            "1000 1 1024 100 Train: 100.0 Test: 55.000001192092896\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f76f3344de0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 16:31:05.048913: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 1024 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.0391, Accuracy: 46.00%)\n",
            "1000 1 1024 100 Train: 100.0 Test: 45.99999785423279\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.2676, Accuracy: 58.00%)\n",
            "1000 1 1024 100 Train: 100.0 Test: 57.999998331069946\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 16:35:45.004061: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 1024 Samples: 100\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 3.0293, Accuracy: 47.00%)\n",
            "1000 1 1024 100 Train: 100.0 Test: 46.99999988079071\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f1221fb06a0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.6426, Accuracy: 47.00%)\n",
            "1000 1 1024 100 Train: 100.0 Test: 46.99999988079071\n",
            "-----------------------------------------------\n",
            "/usr/local/lib/python3.10/dist-packages/torch/optim/lr_scheduler.py:139: UserWarning: Detected call of `lr_scheduler.step()` before `optimizer.step()`. In PyTorch 1.1.0 and later, you should call them in the opposite order: `optimizer.step()` before `lr_scheduler.step()`.  Failure to do this will result in PyTorch skipping the first value of the learning rate schedule. See more details at https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate\n",
            "  warnings.warn(\"Detected call of `lr_scheduler.step()` before `optimizer.step()`. \"\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 16:40:04.959640: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 1024 Samples: 1000\n",
            "Train Average loss: 0.0004, Accuracy: 100.00%)\n",
            "Test Average loss: 2.0710, Accuracy: 49.55%)\n",
            "1000 1 1024 1000 Train: 99.99999489103045 Test: 49.54955130815506\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fb5f3c64a40; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0004, Accuracy: 100.00%)\n",
            "Test Average loss: 2.2742, Accuracy: 46.77%)\n",
            "1000 1 1024 1000 Train: 99.99999489103045 Test: 46.77177220582962\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 16:53:19.020749: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 1024 Samples: 1000\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Test Average loss: 1.8589, Accuracy: 48.72%)\n",
            "1000 1 1024 1000 Train: 99.99999489103045 Test: 48.723724484443665\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f99dedec4a0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0005, Accuracy: 100.00%)\n",
            "Test Average loss: 1.0450, Accuracy: 72.30%)\n",
            "1000 1 1024 1000 Train: 99.99999489103045 Test: 72.29730039834976\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "^C\n",
            "2023-05-24 17:06:28.255078: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 1024 Samples: 1000\n",
            "Train Average loss: 0.0004, Accuracy: 100.00%)\n",
            "Test Average loss: 1.0735, Accuracy: 76.80%)\n",
            "1000 1 1024 1000 Train: 99.99999489103045 Test: 76.80180221796036\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f3a320e48c0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "Test Average loss: 1.0948, Accuracy: 73.50%)\n",
            "1000 1 1024 1000 Train: 99.99999489103045 Test: 73.49850088357925\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0002, Accuracy: 100.00%)\n",
            "^C\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "with open(\"res_imagenet_dif_classes.txt\", \"r\") as fin:\n",
        "  print(fin.read())"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "zh85qREAqFu_",
        "outputId": "02226252-7271-499f-c1cf-bc5d3573504a"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "1000 1 128 2 Train: 100.0 Test: 50.0\n",
            "1000 1 128 2 Train: 100.0 Test: 50.0\n",
            "1000 1 128 2 Train: 100.0 Test: 0.0\n",
            "1000 1 128 2 Train: 100.0 Test: 50.0\n",
            "1000 1 128 2 Train: 100.0 Test: 50.0\n",
            "1000 1 128 2 Train: 100.0 Test: 100.0\n",
            "1000 1 128 10 Train: 100.0 Test: 40.00000059604645\n",
            "1000 1 128 10 Train: 100.0 Test: 30.000001192092896\n",
            "1000 1 128 10 Train: 100.0 Test: 60.00000238418579\n",
            "1000 1 128 10 Train: 100.0 Test: 60.00000238418579\n",
            "1000 1 128 10 Train: 100.0 Test: 60.00000238418579\n",
            "1000 1 128 10 Train: 100.0 Test: 60.00000238418579\n",
            "1000 1 128 100 Train: 100.0 Test: 53.999996185302734\n",
            "1000 1 128 100 Train: 100.0 Test: 64.99999761581421\n",
            "1000 1 128 100 Train: 100.0 Test: 53.999996185302734\n",
            "1000 1 128 100 Train: 100.0 Test: 55.000001192092896\n",
            "1000 1 128 100 Train: 100.0 Test: 51.99999809265137\n",
            "1000 1 128 100 Train: 100.0 Test: 52.99999713897705\n",
            "1000 1 128 1000 Train: 99.99999489103045 Test: 75.37537664175034\n",
            "1000 1 128 1000 Train: 99.99999489103045 Test: 73.87387454509735\n",
            "1000 1 128 1000 Train: 99.99999489103045 Test: 48.723725974559784\n",
            "1000 1 128 1000 Train: 99.99999489103045 Test: 74.84984993934631\n",
            "1000 1 128 1000 Train: 99.99999489103045 Test: 49.699701368808746\n",
            "1000 1 128 1000 Train: 99.99999489103045 Test: 76.12612694501877\n",
            "1000 1 256 2 Train: 100.0 Test: 50.0\n",
            "1000 1 256 2 Train: 100.0 Test: 100.0\n",
            "1000 1 256 2 Train: 100.0 Test: 50.0\n",
            "1000 1 256 2 Train: 100.0 Test: 50.0\n",
            "1000 1 256 2 Train: 100.0 Test: 50.0\n",
            "1000 1 256 2 Train: 100.0 Test: 50.0\n",
            "1000 1 256 10 Train: 100.0 Test: 40.00000059604645\n",
            "1000 1 256 10 Train: 100.0 Test: 50.0\n",
            "1000 1 256 10 Train: 100.0 Test: 50.0\n",
            "1000 1 256 10 Train: 100.0 Test: 40.00000059604645\n",
            "1000 1 256 10 Train: 100.0 Test: 50.0\n",
            "1000 1 256 10 Train: 100.0 Test: 40.00000059604645\n",
            "1000 1 256 100 Train: 100.0 Test: 48.99999797344208\n",
            "1000 1 256 100 Train: 100.0 Test: 50.999999046325684\n",
            "1000 1 256 100 Train: 100.0 Test: 48.99999797344208\n",
            "1000 1 256 100 Train: 100.0 Test: 58.99999737739563\n",
            "1000 1 256 100 Train: 100.0 Test: 58.99999737739563\n",
            "1000 1 256 100 Train: 100.0 Test: 55.000001192092896\n",
            "1000 1 256 1000 Train: 99.99999489103045 Test: 74.09909963607788\n",
            "1000 1 256 1000 Train: 99.99999489103045 Test: 73.87387603521347\n",
            "1000 1 256 1000 Train: 99.99999489103045 Test: 74.24924969673157\n",
            "1000 1 256 1000 Train: 99.99999489103045 Test: 73.04804921150208\n",
            "1000 1 256 1000 Train: 99.99999489103045 Test: 73.87387603521347\n",
            "1000 1 256 1000 Train: 99.99999489103045 Test: 49.84985142946243\n",
            "1000 1 512 2 Train: 100.0 Test: 100.0\n",
            "1000 1 512 2 Train: 100.0 Test: 0.0\n",
            "1000 1 512 2 Train: 100.0 Test: 50.0\n",
            "1000 1 512 2 Train: 100.0 Test: 100.0\n",
            "1000 1 512 2 Train: 100.0 Test: 50.0\n",
            "1000 1 512 2 Train: 100.0 Test: 50.0\n",
            "1000 1 512 10 Train: 100.0 Test: 50.0\n",
            "1000 1 512 10 Train: 100.0 Test: 50.0\n",
            "1000 1 512 10 Train: 100.0 Test: 50.0\n",
            "1000 1 512 10 Train: 100.0 Test: 40.00000059604645\n",
            "1000 1 512 10 Train: 100.0 Test: 80.0000011920929\n",
            "1000 1 512 10 Train: 100.0 Test: 69.9999988079071\n",
            "1000 1 512 100 Train: 100.0 Test: 51.99999809265137\n",
            "1000 1 512 100 Train: 100.0 Test: 40.99999964237213\n",
            "1000 1 512 100 Train: 100.0 Test: 61.000001430511475\n",
            "1000 1 512 100 Train: 100.0 Test: 45.99999785423279\n",
            "1000 1 512 100 Train: 100.0 Test: 55.000001192092896\n",
            "1000 1 512 100 Train: 100.0 Test: 53.999996185302734\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 75.97597688436508\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 49.54955130815506\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 73.64865094423294\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 50.00000149011612\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 73.87387454509735\n",
            "1000 1 512 1000 Train: 99.99999489103045 Test: 75.75075179338455\n",
            "1000 1 1024 2 Train: 100.0 Test: 50.0\n",
            "1000 1 1024 2 Train: 100.0 Test: 50.0\n",
            "1000 1 1024 2 Train: 100.0 Test: 100.0\n",
            "1000 1 1024 2 Train: 100.0 Test: 100.0\n",
            "1000 1 1024 2 Train: 100.0 Test: 0.0\n",
            "1000 1 1024 2 Train: 100.0 Test: 50.0\n",
            "1000 1 1024 10 Train: 100.0 Test: 30.000001192092896\n",
            "1000 1 1024 10 Train: 100.0 Test: 69.9999988079071\n",
            "1000 1 1024 10 Train: 100.0 Test: 40.00000059604645\n",
            "1000 1 1024 10 Train: 100.0 Test: 69.9999988079071\n",
            "1000 1 1024 10 Train: 100.0 Test: 20.000000298023224\n",
            "1000 1 1024 10 Train: 100.0 Test: 69.9999988079071\n",
            "1000 1 1024 100 Train: 100.0 Test: 56.99999928474426\n",
            "1000 1 1024 100 Train: 100.0 Test: 55.000001192092896\n",
            "1000 1 1024 100 Train: 100.0 Test: 45.99999785423279\n",
            "1000 1 1024 100 Train: 100.0 Test: 57.999998331069946\n",
            "1000 1 1024 100 Train: 100.0 Test: 46.99999988079071\n",
            "1000 1 1024 100 Train: 100.0 Test: 46.99999988079071\n",
            "1000 1 1024 1000 Train: 99.99999489103045 Test: 49.54955130815506\n",
            "1000 1 1024 1000 Train: 99.99999489103045 Test: 46.77177220582962\n",
            "1000 1 1024 1000 Train: 99.99999489103045 Test: 48.723724484443665\n",
            "1000 1 1024 1000 Train: 99.99999489103045 Test: 72.29730039834976\n",
            "1000 1 1024 1000 Train: 99.99999489103045 Test: 76.80180221796036\n",
            "1000 1 1024 1000 Train: 99.99999489103045 Test: 73.49850088357925\n",
            "\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "for n_points in [1000]:\n",
        "  for dim in [128, 256, 512, 1024]:\n",
        "    for n_samples in [10000]:\n",
        "      !python runner_imagenet.py 3 {n_points} 1 {dim} {n_samples}\n",
        "      !python runner_imagenet.py 3 {n_points} 1 {dim} {n_samples}\n",
        "      !python runner_imagenet.py 4 {n_points} 1 {dim} {n_samples}"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "a67f_ulCqD5f",
        "outputId": "ea917969-0a1b-41fc-ab7c-bc6e151d5d06"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "2023-05-24 17:18:57.029190: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 128 Samples: 10000\n",
            "Train Average loss: 0.0129, Accuracy: 99.59%)\n",
            "Test Average loss: 2.5403, Accuracy: 73.72%)\n",
            "1000 1 128 10000 Train: 99.5852216345365 Test: 73.71985085548893\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fe5feff86a0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.3597, Accuracy: 74.49%)\n",
            "1000 1 128 10000 Train: 99.99999413724805 Test: 74.49481987184093\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fe58de490c0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Exception ignored in: <finalize object at 0x7fdec93ddfa0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0173, Accuracy: 99.47%)\n",
            "Test Average loss: 2.6936, Accuracy: 72.73%)\n",
            "1000 1 128 10000 Train: 99.46671480038127 Test: 72.72886057053843\n",
            "-----------------------------------------------\n",
            "2023-05-24 18:53:20.296736: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 128 Samples: 10000\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.3128, Accuracy: 74.63%)\n",
            "1000 1 128 10000 Train: 99.99999413724805 Test: 74.62656401818798\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f30bf594d00; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0185, Accuracy: 99.41%)\n",
            "Test Average loss: 2.4756, Accuracy: 73.87%)\n",
            "1000 1 128 10000 Train: 99.407461627585 Test: 73.86806395746046\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f3054611720; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.3958, Accuracy: 73.57%)\n",
            "1000 1 128 10000 Train: 99.99999413724805 Test: 73.57163890715567\n",
            "-----------------------------------------------\n",
            "2023-05-24 20:28:14.160644: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 128 Samples: 10000\n",
            "Train Average loss: 0.0001, Accuracy: 100.00%)\n",
            "Test Average loss: 2.4238, Accuracy: 72.85%)\n",
            "1000 1 128 10000 Train: 99.99999413724805 Test: 72.85091742392508\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f7e8effc6c0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.3980, Accuracy: 74.08%)\n",
            "1000 1 128 10000 Train: 99.99999413724805 Test: 74.08408676424334\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f7e1dd8d0e0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0118, Accuracy: 99.69%)\n",
            "Test Average loss: 2.4782, Accuracy: 71.86%)\n",
            "1000 1 128 10000 Train: 99.69385256532763 Test: 71.86380182543108\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f7759515300; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Exception ignored in: <finalize object at 0x7f7e8fb42820; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Exception ignored in: <finalize object at 0x7f7e8f74ffe0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0083, Accuracy: 99.77%)\n",
            "Test Average loss: 2.4700, Accuracy: 73.35%)\n",
            "1000 1 128 10000 Train: 99.77285715400195 Test: 73.35174102937022\n",
            "-----------------------------------------------\n",
            "2023-05-24 22:35:21.207979: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 256 Samples: 10000\n",
            "Train Average loss: 0.0035, Accuracy: 99.89%)\n",
            "Test Average loss: 2.4616, Accuracy: 72.94%)\n",
            "1000 1 256 10000 Train: 99.89136349959452 Test: 72.94488222368301\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fb2b8e1c820; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0018, Accuracy: 99.93%)\n",
            "Test Average loss: 2.3685, Accuracy: 75.72%)\n",
            "1000 1 256 10000 Train: 99.9308654519378 Test: 75.71830134237966\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fb237c85240; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0209, Accuracy: 99.46%)\n",
            "Test Average loss: 2.4639, Accuracy: 74.56%)\n",
            "1000 1 256 10000 Train: 99.45683919015478 Test: 74.55584887535342\n",
            "-----------------------------------------------\n",
            "2023-05-25 00:11:48.957375: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 256 Samples: 10000\n",
            "Train Average loss: 0.0078, Accuracy: 99.73%)\n",
            "Test Average loss: 2.2611, Accuracy: 74.05%)\n",
            "1000 1 256 10000 Train: 99.73335481080852 Test: 74.05211906279287\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fca1cfc8a00; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.1525, Accuracy: 75.52%)\n",
            "1000 1 256 10000 Train: 99.99999413724805 Test: 75.5216529292445\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7fc99be41440; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.0916, Accuracy: 75.95%)\n",
            "1000 1 256 10000 Train: 99.99999413724805 Test: 75.9469170724192\n",
            "-----------------------------------------------\n",
            "2023-05-25 01:49:33.904084: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 256 Samples: 10000\n",
            "Train Average loss: 0.0016, Accuracy: 99.95%)\n",
            "Test Average loss: 2.5167, Accuracy: 73.74%)\n",
            "1000 1 256 10000 Train: 99.95061657467826 Test: 73.74213126397902\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.2917, Accuracy: 75.14%)\n",
            "1000 1 256 10000 Train: 99.99999413724805 Test: 75.13707510886654\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0171, Accuracy: 99.70%)\n",
            "Test Average loss: 2.4782, Accuracy: 73.54%)\n",
            "1000 1 256 10000 Train: 99.70372798012906 Test: 73.53579671152175\n",
            "-----------------------------------------------\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.3699, Accuracy: 74.31%)\n",
            "1000 1 256 10000 Train: 99.99999413724805 Test: 74.31367097362396\n",
            "-----------------------------------------------\n",
            "2023-05-25 03:58:14.246148: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.5138, Accuracy: 73.97%)\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 73.96784155599534\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f8153ca4560; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0243, Accuracy: 99.41%)\n",
            "Test Average loss: 2.4043, Accuracy: 74.28%)\n",
            "1000 1 512 10000 Train: 99.40746113902233 Test: 74.28460967156195\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f80d2ad8fa0; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.4424, Accuracy: 74.53%)\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 74.5306622597479\n",
            "-----------------------------------------------\n",
            "2023-05-25 05:38:14.505947: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 3 Points: 1000 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Train Average loss: 0.0259, Accuracy: 99.31%)\n",
            "Test Average loss: 2.5017, Accuracy: 73.30%)\n",
            "1000 1 512 10000 Train: 99.30870581845768 Test: 73.29652482463467\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f3ab30e0540; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0090, Accuracy: 99.82%)\n",
            "Test Average loss: 2.4531, Accuracy: 73.09%)\n",
            "1000 1 512 10000 Train: 99.82223481428429 Test: 73.09406418954173\n",
            "-----------------------------------------------\n",
            "Exception ignored in: <finalize object at 0x7f3a35e68f60; dead>\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/lib/python3.10/weakref.py\", line 591, in __call__\n",
            "    return info.func(*info.args, **(info.kwargs or {}))\n",
            "  File \"/usr/local/lib/python3.10/dist-packages/numba/core/dispatcher.py\", line 312, in finalizer\n",
            "    for cres in overloads.values():\n",
            "KeyError: (array(uint8, 1d, C), array(uint8, 1d, C), uint32, uint32, uint32, uint32, Literal[int](0), Literal[int](0), Literal[int](1), Literal[int](1), Literal[bool](False), Literal[bool](False))\n",
            "Train Average loss: 0.0034, Accuracy: 99.94%)\n",
            "Test Average loss: 2.5753, Accuracy: 72.70%)\n",
            "1000 1 512 10000 Train: 99.9407410621643 Test: 72.69592342838165\n",
            "-----------------------------------------------\n",
            "2023-05-25 07:17:19.808421: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
            "Runs: 4 Points: 1000 Negatives: 1 Dim: 512 Samples: 10000\n",
            "Train Average loss: 0.0000, Accuracy: 100.00%)\n",
            "Test Average loss: 2.3791, Accuracy: 75.05%)\n",
            "1000 1 512 10000 Train: 99.99999413724805 Test: 75.0527972175229\n",
            "-----------------------------------------------\n"
          ]
        }
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "with open(\"res_imagenet_dif_classes.txt\", \"r\") as fin:\n",
        "  print(fin.read())"
      ],
      "metadata": {
        "id": "9zuxzq_PqGWY"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [],
      "metadata": {
        "id": "5t6VKVc2qJcz"
      },
      "execution_count": null,
      "outputs": []
    }
  ],
  "metadata": {
    "accelerator": "GPU",
    "colab": {
      "provenance": [],
      "gpuType": "V100",
      "toc_visible": true,
      "machine_shape": "hm"
    },
    "gpuClass": "standard",
    "kernelspec": {
      "display_name": "Python 3",
      "name": "python3"
    },
    "language_info": {
      "name": "python"
    }
  },
  "nbformat": 4,
  "nbformat_minor": 0
}