{
  "cells": [
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "zIS27VaNbX0L"
      },
      "source": [
        "# **Loading full-tuned model**"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 1,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "F2l9MJsZyznV",
        "outputId": "7c7fb865-2360-4909-ec92-4ecf555befe3"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "py38_cu102_pyt181\n"
          ]
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages/tqdm/auto.py:22: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
            "  from .autonotebook import tqdm as notebook_tqdm\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Looking in links: https://dl.fbaipublicfiles.com/vissl/packaging/apexwheels/py38_cu102_pyt181/download.html\n",
            "Requirement already satisfied: apex in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (0.1)\n",
            "Cloning into 'vissl'...\n",
            "remote: Enumerating objects: 12020, done.\u001b[K\n",
            "remote: Counting objects: 100% (616/616), done.\u001b[K\n",
            "remote: Compressing objects: 100% (260/260), done.\u001b[K\n",
            "remote: Total 12020 (delta 377), reused 551 (delta 345), pack-reused 11404\u001b[K\n",
            "Receiving objects: 100% (12020/12020), 18.44 MiB | 836.00 KiB/s, done.\n",
            "Resolving deltas: 100% (8430/8430), done.\n",
            "/home/erik/Documents/UCPH/AdversarialTransfer/vissl\n",
            "Note: switching to 'v0.1.6'.\n",
            "\n",
            "You are in 'detached HEAD' state. You can look around, make experimental\n",
            "changes and commit them, and you can discard any commits you make in this\n",
            "state without impacting any branches by switching back to a branch.\n",
            "\n",
            "If you want to create a new branch to retain commits you create, you may\n",
            "do so (now or later) by using -c with the switch command. Example:\n",
            "\n",
            "  git switch -c <new-branch-name>\n",
            "\n",
            "Or undo this operation with:\n",
            "\n",
            "  git switch -\n",
            "\n",
            "Turn off this advice by setting config variable advice.detachedHead to false\n",
            "\n",
            "HEAD is now at dac766a @allow-large-files [vissl][PR] V0.1.6 build fairscale pip pckg @allow-large-files (#465)\n",
            "Switched to a new branch 'v0.1.6'\n",
            "Collecting cython==0.29.22\n",
            "  Downloading Cython-0.29.22-cp38-cp38-manylinux1_x86_64.whl (1.9 MB)\n",
            "Collecting fvcore==0.1.3.post20210317\n",
            "  Downloading fvcore-0.1.3.post20210317.tar.gz (47 kB)\n",
            "  Preparing metadata (setup.py) ... \u001b[?25ldone\n",
            "\u001b[?25hRequirement already satisfied: iopath==0.1.9 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from -r requirements.txt (line 5)) (0.1.9)\n",
            "Collecting hydra-core==1.0.7\n",
            "  Downloading hydra_core-1.0.7-py3-none-any.whl (123 kB)\n",
            "Collecting numpy==1.19.5\n",
            "  Downloading numpy-1.19.5-cp38-cp38-manylinux2010_x86_64.whl (14.9 MB)\n",
            "Collecting parameterized==0.7.4\n",
            "  Downloading parameterized-0.7.4-py2.py3-none-any.whl (25 kB)\n",
            "Collecting scikit-learn==0.24.1\n",
            "  Downloading scikit_learn-0.24.1-cp38-cp38-manylinux2010_x86_64.whl (24.9 MB)\n",
            "Collecting submitit==1.3.3\n",
            "  Downloading submitit-1.3.3.tar.gz (54 kB)\n",
            "  Installing build dependencies ... \u001b[?25ldone\n",
            "\u001b[?25h  Getting requirements to build wheel ... \u001b[?25ldone\n",
            "\u001b[?25h  Preparing metadata (pyproject.toml) ... \u001b[?25ldone\n",
            "\u001b[?25hCollecting tabulate==0.8.9\n",
            "  Downloading tabulate-0.8.9-py3-none-any.whl (25 kB)\n",
            "Requirement already satisfied: yacs>=0.1.6 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore==0.1.3.post20210317->-r requirements.txt (line 4)) (0.1.8)\n",
            "Requirement already satisfied: pyyaml>=5.1 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore==0.1.3.post20210317->-r requirements.txt (line 4)) (6.0)\n",
            "Requirement already satisfied: tqdm in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore==0.1.3.post20210317->-r requirements.txt (line 4)) (4.64.1)\n",
            "Requirement already satisfied: termcolor>=1.1 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore==0.1.3.post20210317->-r requirements.txt (line 4)) (2.2.0)\n",
            "Requirement already satisfied: Pillow in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore==0.1.3.post20210317->-r requirements.txt (line 4)) (9.2.0)\n",
            "Requirement already satisfied: portalocker in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from iopath==0.1.9->-r requirements.txt (line 5)) (2.7.0)\n",
            "Requirement already satisfied: importlib-resources in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from hydra-core==1.0.7->-r requirements.txt (line 6)) (5.10.2)\n",
            "Collecting antlr4-python3-runtime==4.8\n",
            "  Downloading antlr4-python3-runtime-4.8.tar.gz (112 kB)\n",
            "  Preparing metadata (setup.py) ... \u001b[?25ldone\n",
            "\u001b[?25hCollecting omegaconf<2.1,>=2.0.5\n",
            "  Downloading omegaconf-2.0.6-py3-none-any.whl (36 kB)\n",
            "Requirement already satisfied: joblib>=0.11 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from scikit-learn==0.24.1->-r requirements.txt (line 9)) (1.2.0)\n",
            "Requirement already satisfied: scipy>=0.19.1 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from scikit-learn==0.24.1->-r requirements.txt (line 9)) (1.9.3)\n",
            "Requirement already satisfied: threadpoolctl>=2.0.0 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from scikit-learn==0.24.1->-r requirements.txt (line 9)) (3.1.0)\n",
            "Collecting cloudpickle>=1.2.1\n",
            "  Downloading cloudpickle-2.2.1-py3-none-any.whl (25 kB)\n",
            "Requirement already satisfied: typing-extensions>=3.7.4.2 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from submitit==1.3.3->-r requirements.txt (line 10)) (4.3.0)\n",
            "Requirement already satisfied: zipp>=3.1.0 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from importlib-resources->hydra-core==1.0.7->-r requirements.txt (line 6)) (3.13.0)\n",
            "Building wheels for collected packages: fvcore, submitit, antlr4-python3-runtime\n",
            "  Building wheel for fvcore (setup.py) ... \u001b[?25ldone\n",
            "\u001b[?25h  Created wheel for fvcore: filename=fvcore-0.1.3.post20210317-py3-none-any.whl size=58518 sha256=0f1c043d0cc35635121d835ca012004c4c978327c4006d285e447ec978288f05\n",
            "  Stored in directory: /home/erik/.cache/pip/wheels/19/65/1b/67f264eee136ba1a866c47cc5af6934e423ee209b7c62c2352\n",
            "  Building wheel for submitit (pyproject.toml) ... \u001b[?25ldone\n",
            "\u001b[?25h  Created wheel for submitit: filename=submitit-1.3.3-py3-none-any.whl size=66061 sha256=57b040a902ac9f969c2986a73124b895c0e140b3e69df9610f8bb9ba586403c6\n",
            "  Stored in directory: /home/erik/.cache/pip/wheels/d4/3b/dc/34a0c899f3148c2fdcf9c2fc857643780000cef5de2c627477\n",
            "  Building wheel for antlr4-python3-runtime (setup.py) ... \u001b[?25ldone\n",
            "\u001b[?25h  Created wheel for antlr4-python3-runtime: filename=antlr4_python3_runtime-4.8-py3-none-any.whl size=141210 sha256=6a63122976c3fab419c5c21b7453e79e6f6cb98b54e88e9941a5c1ea107e077d\n",
            "  Stored in directory: /home/erik/.cache/pip/wheels/c8/d0/ab/d43c02eaddc5b9004db86950802442ad9a26f279c619e28da0\n",
            "Successfully built fvcore submitit antlr4-python3-runtime\n",
            "Installing collected packages: tabulate, parameterized, antlr4-python3-runtime, omegaconf, numpy, cython, cloudpickle, submitit, hydra-core, fvcore, scikit-learn\n",
            "  Attempting uninstall: tabulate\n",
            "    Found existing installation: tabulate 0.9.0\n",
            "    Uninstalling tabulate-0.9.0:\n",
            "      Successfully uninstalled tabulate-0.9.0\n",
            "  Attempting uninstall: parameterized\n",
            "    Found existing installation: parameterized 0.8.1\n",
            "    Uninstalling parameterized-0.8.1:\n",
            "      Successfully uninstalled parameterized-0.8.1\n",
            "  Attempting uninstall: antlr4-python3-runtime\n",
            "    Found existing installation: antlr4-python3-runtime 4.9.3\n",
            "    Uninstalling antlr4-python3-runtime-4.9.3:\n",
            "      Successfully uninstalled antlr4-python3-runtime-4.9.3\n",
            "  Attempting uninstall: omegaconf\n",
            "    Found existing installation: omegaconf 2.3.0\n",
            "    Uninstalling omegaconf-2.3.0:\n",
            "      Successfully uninstalled omegaconf-2.3.0\n",
            "  Attempting uninstall: numpy\n",
            "    Found existing installation: numpy 1.23.3\n",
            "    Uninstalling numpy-1.23.3:\n",
            "      Successfully uninstalled numpy-1.23.3\n",
            "  Attempting uninstall: hydra-core\n",
            "    Found existing installation: hydra-core 1.3.1\n",
            "    Uninstalling hydra-core-1.3.1:\n",
            "      Successfully uninstalled hydra-core-1.3.1\n",
            "  Attempting uninstall: fvcore\n",
            "    Found existing installation: fvcore 0.1.5.post20221221\n",
            "    Uninstalling fvcore-0.1.5.post20221221:\n",
            "      Successfully uninstalled fvcore-0.1.5.post20221221\n",
            "  Attempting uninstall: scikit-learn\n",
            "    Found existing installation: scikit-learn 1.2.0\n",
            "    Uninstalling scikit-learn-1.2.0:\n",
            "      Successfully uninstalled scikit-learn-1.2.0\n",
            "\u001b[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. This behaviour is the source of the following dependency conflicts.\n",
            "matplotlib 3.7.0 requires numpy>=1.20, but you have numpy 1.19.5 which is incompatible.\u001b[0m\u001b[31m\n",
            "\u001b[0mSuccessfully installed antlr4-python3-runtime-4.8 cloudpickle-2.2.1 cython-0.29.22 fvcore-0.1.3.post20210317 hydra-core-1.0.7 numpy-1.19.5 omegaconf-2.0.6 parameterized-0.7.4 scikit-learn-0.24.1 submitit-1.3.3 tabulate-0.8.9\n",
            "Collecting opencv-python\n",
            "  Downloading opencv_python-4.7.0.68-cp37-abi3-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (61.8 MB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m61.8/61.8 MB\u001b[0m \u001b[31m888.0 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:02\u001b[0m\n",
            "\u001b[?25hRequirement already satisfied: numpy>=1.17.0 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from opencv-python) (1.19.5)\n",
            "Installing collected packages: opencv-python\n",
            "Successfully installed opencv-python-4.7.0.68\n",
            "\u001b[33mWARNING: Skipping classy_vision as it is not installed.\u001b[0m\u001b[33m\n",
            "\u001b[0mCollecting classy-vision@ https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d\n",
            "  Downloading https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d\n",
            "\u001b[2K     \u001b[32m\\\u001b[0m \u001b[32m1.3 MB\u001b[0m \u001b[31m860.3 kB/s\u001b[0m \u001b[33m0:00:01\u001b[0m0m\n",
            "\u001b[?25h  Preparing metadata (setup.py) ... \u001b[?25ldone\n",
            "\u001b[?25hRequirement already satisfied: fvcore>=0.1.3 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from classy-vision@ https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d) (0.1.3.post20210317)\n",
            "Collecting setuptools<58\n",
            "  Downloading setuptools-57.5.0-py3-none-any.whl (819 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m819.3/819.3 kB\u001b[0m \u001b[31m938.8 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
            "\u001b[?25hRequirement already satisfied: torch>=1.6 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from classy-vision@ https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d) (1.8.1)\n",
            "Requirement already satisfied: torchvision>=0.7 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from classy-vision@ https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d) (0.9.1)\n",
            "Requirement already satisfied: wheel in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from classy-vision@ https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d) (0.37.1)\n",
            "Requirement already satisfied: termcolor>=1.1 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore>=0.1.3->classy-vision@ https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d) (2.2.0)\n",
            "Requirement already satisfied: pyyaml>=5.1 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore>=0.1.3->classy-vision@ https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d) (6.0)\n",
            "Requirement already satisfied: numpy in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore>=0.1.3->classy-vision@ https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d) (1.19.5)\n",
            "Requirement already satisfied: tabulate in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore>=0.1.3->classy-vision@ https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d) (0.8.9)\n",
            "Requirement already satisfied: iopath>=0.1.2 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore>=0.1.3->classy-vision@ https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d) (0.1.9)\n",
            "Requirement already satisfied: yacs>=0.1.6 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore>=0.1.3->classy-vision@ https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d) (0.1.8)\n",
            "Requirement already satisfied: Pillow in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore>=0.1.3->classy-vision@ https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d) (9.2.0)\n",
            "Requirement already satisfied: tqdm in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore>=0.1.3->classy-vision@ https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d) (4.64.1)\n",
            "Requirement already satisfied: typing_extensions in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from torch>=1.6->classy-vision@ https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d) (4.3.0)\n",
            "Requirement already satisfied: portalocker in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from iopath>=0.1.2->fvcore>=0.1.3->classy-vision@ https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d) (2.7.0)\n",
            "Building wheels for collected packages: classy-vision\n",
            "  Building wheel for classy-vision (setup.py) ... \u001b[?25ldone\n",
            "\u001b[?25h  Created wheel for classy-vision: filename=classy_vision-0.7.0.dev0-py3-none-any.whl size=361410 sha256=259bf3bd4740d13d0e1ad44f257d9776ee899463fba7c1e17aeb3a1cce4bf67d\n",
            "  Stored in directory: /tmp/pip-ephem-wheel-cache-5ngoxai_/wheels/87/15/48/332729b7c650b41d36ba9a508ec64a145fcebcb9f439b4ec2d\n",
            "Successfully built classy-vision\n",
            "Installing collected packages: setuptools, classy-vision\n",
            "  Attempting uninstall: setuptools\n",
            "    Found existing installation: setuptools 63.4.1\n",
            "    Uninstalling setuptools-63.4.1:\n",
            "      Successfully uninstalled setuptools-63.4.1\n",
            "Successfully installed classy-vision-0.7.0.dev0 setuptools-57.5.0\n",
            "\u001b[33mWARNING: Skipping fairscale as it is not installed.\u001b[0m\u001b[33m\n",
            "\u001b[0mCollecting fairscale@ https://github.com/facebookresearch/fairscale/tarball/df7db85cef7f9c30a5b821007754b96eb1f977b6\n",
            "  Downloading https://github.com/facebookresearch/fairscale/tarball/df7db85cef7f9c30a5b821007754b96eb1f977b6\n",
            "\u001b[2K     \u001b[32m-\u001b[0m \u001b[32m932.5 kB\u001b[0m \u001b[31m868.1 kB/s\u001b[0m \u001b[33m0:00:01\u001b[0m\n",
            "\u001b[?25h  Installing build dependencies ... \u001b[?25ldone\n",
            "\u001b[?25h  Getting requirements to build wheel ... \u001b[?25ldone\n",
            "\u001b[?25h  Installing backend dependencies ... \u001b[?25ldone\n",
            "\u001b[?25h  Preparing metadata (pyproject.toml) ... \u001b[?25ldone\n",
            "\u001b[?25hRequirement already satisfied: torch>=1.6.0 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fairscale@ https://github.com/facebookresearch/fairscale/tarball/df7db85cef7f9c30a5b821007754b96eb1f977b6) (1.8.1)\n",
            "Requirement already satisfied: typing_extensions in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from torch>=1.6.0->fairscale@ https://github.com/facebookresearch/fairscale/tarball/df7db85cef7f9c30a5b821007754b96eb1f977b6) (4.3.0)\n",
            "Requirement already satisfied: numpy in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from torch>=1.6.0->fairscale@ https://github.com/facebookresearch/fairscale/tarball/df7db85cef7f9c30a5b821007754b96eb1f977b6) (1.19.5)\n",
            "Building wheels for collected packages: fairscale\n",
            "  Building wheel for fairscale (pyproject.toml) ... \u001b[?25ldone\n",
            "\u001b[?25h  Created wheel for fairscale: filename=fairscale-0.3.7-py3-none-any.whl size=229079 sha256=f55bb54b65be3e313eca1ae06e32466e025080535a1bd97797ab201474b46f04\n",
            "  Stored in directory: /tmp/pip-ephem-wheel-cache-ohika4jg/wheels/b3/74/d2/f18349146b066675584ce1075487bbf224abd981195b4baf3f\n",
            "Successfully built fairscale\n",
            "Installing collected packages: fairscale\n",
            "Successfully installed fairscale-0.3.7\n",
            "Obtaining file:///home/erik/Documents/UCPH/AdversarialTransfer/vissl\n",
            "  Preparing metadata (setup.py) ... \u001b[?25ldone\n",
            "\u001b[?25hRequirement already satisfied: cython==0.29.22 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from vissl==0.1.6) (0.29.22)\n",
            "Requirement already satisfied: fvcore==0.1.3.post20210317 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from vissl==0.1.6) (0.1.3.post20210317)\n",
            "Requirement already satisfied: iopath==0.1.9 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from vissl==0.1.6) (0.1.9)\n",
            "Requirement already satisfied: hydra-core==1.0.7 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from vissl==0.1.6) (1.0.7)\n",
            "Requirement already satisfied: numpy==1.19.5 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from vissl==0.1.6) (1.19.5)\n",
            "Requirement already satisfied: parameterized==0.7.4 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from vissl==0.1.6) (0.7.4)\n",
            "Requirement already satisfied: scikit-learn==0.24.1 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from vissl==0.1.6) (0.24.1)\n",
            "Requirement already satisfied: submitit==1.3.3 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from vissl==0.1.6) (1.3.3)\n",
            "Requirement already satisfied: tabulate==0.8.9 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from vissl==0.1.6) (0.8.9)\n",
            "Collecting black==19.3b0\n",
            "  Downloading black-19.3b0-py36-none-any.whl (89 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m89.9/89.9 kB\u001b[0m \u001b[31m809.4 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting sphinx\n",
            "  Downloading sphinx-6.1.3-py3-none-any.whl (3.0 MB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m3.0/3.0 MB\u001b[0m \u001b[31m921.9 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
            "\u001b[?25hCollecting isort==5.7.0\n",
            "  Downloading isort-5.7.0-py3-none-any.whl (104 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m104.2/104.2 kB\u001b[0m \u001b[31m820.4 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting flake8==3.8.1\n",
            "  Downloading flake8-3.8.1-py2.py3-none-any.whl (72 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m72.5/72.5 kB\u001b[0m \u001b[31m829.3 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting flake8-bugbear\n",
            "  Downloading flake8_bugbear-23.2.13-py3-none-any.whl (27 kB)\n",
            "Collecting flake8-comprehensions\n",
            "  Downloading flake8_comprehensions-3.10.1-py3-none-any.whl (7.3 kB)\n",
            "Collecting pre-commit\n",
            "  Downloading pre_commit-3.0.4-py2.py3-none-any.whl (202 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m202.2/202.2 kB\u001b[0m \u001b[31m929.5 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting nbconvert\n",
            "  Downloading nbconvert-7.2.9-py3-none-any.whl (274 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m274.9/274.9 kB\u001b[0m \u001b[31m930.9 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting bs4\n",
            "  Downloading bs4-0.0.1.tar.gz (1.1 kB)\n",
            "  Preparing metadata (setup.py) ... \u001b[?25ldone\n",
            "\u001b[?25hCollecting faiss-gpu\n",
            "  Downloading faiss_gpu-1.7.2-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (85.5 MB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m85.5/85.5 MB\u001b[0m \u001b[31m913.3 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:03\u001b[0m\n",
            "\u001b[?25hCollecting pycocotools>=2.0.1\n",
            "  Downloading pycocotools-2.0.6.tar.gz (24 kB)\n",
            "  Installing build dependencies ... \u001b[?25ldone\n",
            "\u001b[?25h  Getting requirements to build wheel ... \u001b[?25ldone\n",
            "\u001b[?25h  Preparing metadata (pyproject.toml) ... \u001b[?25ldone\n",
            "\u001b[?25hCollecting tensorboard>=1.15\n",
            "  Downloading tensorboard-2.12.0-py3-none-any.whl (5.6 MB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m5.6/5.6 MB\u001b[0m \u001b[31m882.3 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
            "\u001b[?25hCollecting toml>=0.9.4\n",
            "  Downloading toml-0.10.2-py2.py3-none-any.whl (16 kB)\n",
            "Collecting click>=6.5\n",
            "  Using cached click-8.1.3-py3-none-any.whl (96 kB)\n",
            "Collecting appdirs\n",
            "  Downloading appdirs-1.4.4-py2.py3-none-any.whl (9.6 kB)\n",
            "Collecting attrs>=18.1.0\n",
            "  Downloading attrs-22.2.0-py3-none-any.whl (60 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m60.0/60.0 kB\u001b[0m \u001b[31m627.1 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting pyflakes<2.3.0,>=2.2.0\n",
            "  Downloading pyflakes-2.2.0-py2.py3-none-any.whl (66 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m67.0/67.0 kB\u001b[0m \u001b[31m608.8 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting pycodestyle<2.7.0,>=2.6.0a1\n",
            "  Downloading pycodestyle-2.6.0-py2.py3-none-any.whl (41 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m41.4/41.4 kB\u001b[0m \u001b[31m806.1 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m:--:--\u001b[0m\n",
            "\u001b[?25hCollecting mccabe<0.7.0,>=0.6.0\n",
            "  Downloading mccabe-0.6.1-py2.py3-none-any.whl (8.6 kB)\n",
            "Requirement already satisfied: pyyaml>=5.1 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore==0.1.3.post20210317->vissl==0.1.6) (6.0)\n",
            "Requirement already satisfied: yacs>=0.1.6 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore==0.1.3.post20210317->vissl==0.1.6) (0.1.8)\n",
            "Requirement already satisfied: tqdm in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore==0.1.3.post20210317->vissl==0.1.6) (4.64.1)\n",
            "Requirement already satisfied: termcolor>=1.1 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore==0.1.3.post20210317->vissl==0.1.6) (2.2.0)\n",
            "Requirement already satisfied: Pillow in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from fvcore==0.1.3.post20210317->vissl==0.1.6) (9.2.0)\n",
            "Requirement already satisfied: antlr4-python3-runtime==4.8 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from hydra-core==1.0.7->vissl==0.1.6) (4.8)\n",
            "Requirement already satisfied: omegaconf<2.1,>=2.0.5 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from hydra-core==1.0.7->vissl==0.1.6) (2.0.6)\n",
            "Requirement already satisfied: importlib-resources in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from hydra-core==1.0.7->vissl==0.1.6) (5.10.2)\n",
            "Requirement already satisfied: portalocker in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from iopath==0.1.9->vissl==0.1.6) (2.7.0)\n",
            "Requirement already satisfied: threadpoolctl>=2.0.0 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from scikit-learn==0.24.1->vissl==0.1.6) (3.1.0)\n",
            "Requirement already satisfied: joblib>=0.11 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from scikit-learn==0.24.1->vissl==0.1.6) (1.2.0)\n",
            "Requirement already satisfied: scipy>=0.19.1 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from scikit-learn==0.24.1->vissl==0.1.6) (1.9.3)\n",
            "Requirement already satisfied: typing-extensions>=3.7.4.2 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from submitit==1.3.3->vissl==0.1.6) (4.3.0)\n",
            "Requirement already satisfied: cloudpickle>=1.2.1 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from submitit==1.3.3->vissl==0.1.6) (2.2.1)\n",
            "Requirement already satisfied: matplotlib>=2.1.0 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from pycocotools>=2.0.1->vissl==0.1.6) (3.7.0)\n",
            "Requirement already satisfied: wheel>=0.26 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from tensorboard>=1.15->vissl==0.1.6) (0.37.1)\n",
            "Collecting google-auth<3,>=1.6.3\n",
            "  Downloading google_auth-2.16.0-py2.py3-none-any.whl (177 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m177.8/177.8 kB\u001b[0m \u001b[31m774.3 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting werkzeug>=1.0.1\n",
            "  Using cached Werkzeug-2.2.2-py3-none-any.whl (232 kB)\n",
            "Collecting requests<3,>=2.21.0\n",
            "  Downloading requests-2.28.2-py3-none-any.whl (62 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m62.8/62.8 kB\u001b[0m \u001b[31m783.7 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m0:01\u001b[0m\n",
            "\u001b[?25hRequirement already satisfied: setuptools>=41.0.0 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from tensorboard>=1.15->vissl==0.1.6) (57.5.0)\n",
            "Collecting markdown>=2.6.8\n",
            "  Using cached Markdown-3.4.1-py3-none-any.whl (93 kB)\n",
            "Collecting grpcio>=1.48.2\n",
            "  Downloading grpcio-1.51.1-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (4.8 MB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m4.8/4.8 MB\u001b[0m \u001b[31m919.6 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
            "\u001b[?25hCollecting tensorboard-plugin-wit>=1.6.0\n",
            "  Using cached tensorboard_plugin_wit-1.8.1-py3-none-any.whl (781 kB)\n",
            "Collecting protobuf>=3.19.6\n",
            "  Downloading protobuf-4.21.12-cp37-abi3-manylinux2014_x86_64.whl (409 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m409.8/409.8 kB\u001b[0m \u001b[31m931.4 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
            "\u001b[?25hCollecting tensorboard-data-server<0.8.0,>=0.7.0\n",
            "  Downloading tensorboard_data_server-0.7.0-py3-none-manylinux2014_x86_64.whl (6.6 MB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m6.6/6.6 MB\u001b[0m \u001b[31m919.9 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
            "\u001b[?25hCollecting google-auth-oauthlib<0.5,>=0.4.1\n",
            "  Using cached google_auth_oauthlib-0.4.6-py2.py3-none-any.whl (18 kB)\n",
            "Collecting absl-py>=0.4\n",
            "  Downloading absl_py-1.4.0-py3-none-any.whl (126 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m126.5/126.5 kB\u001b[0m \u001b[31m874.4 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting beautifulsoup4\n",
            "  Downloading beautifulsoup4-4.11.2-py3-none-any.whl (129 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m129.4/129.4 kB\u001b[0m \u001b[31m893.7 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting tinycss2\n",
            "  Downloading tinycss2-1.2.1-py3-none-any.whl (21 kB)\n",
            "Collecting markupsafe>=2.0\n",
            "  Downloading MarkupSafe-2.1.2-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (25 kB)\n",
            "Requirement already satisfied: jupyter-core>=4.7 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from nbconvert->vissl==0.1.6) (5.2.0)\n",
            "Collecting nbclient>=0.5.0\n",
            "  Downloading nbclient-0.7.2-py3-none-any.whl (71 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m72.0/72.0 kB\u001b[0m \u001b[31m851.6 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hRequirement already satisfied: packaging in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from nbconvert->vissl==0.1.6) (23.0)\n",
            "Collecting mistune<3,>=2.0.3\n",
            "  Downloading mistune-2.0.5-py2.py3-none-any.whl (24 kB)\n",
            "Collecting jinja2>=3.0\n",
            "  Using cached Jinja2-3.1.2-py3-none-any.whl (133 kB)\n",
            "Collecting nbformat>=5.1\n",
            "  Downloading nbformat-5.7.3-py3-none-any.whl (78 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m78.1/78.1 kB\u001b[0m \u001b[31m865.8 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting pandocfilters>=1.4.1\n",
            "  Downloading pandocfilters-1.5.0-py2.py3-none-any.whl (8.7 kB)\n",
            "Collecting bleach\n",
            "  Downloading bleach-6.0.0-py3-none-any.whl (162 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m162.5/162.5 kB\u001b[0m \u001b[31m827.0 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting defusedxml\n",
            "  Downloading defusedxml-0.7.1-py2.py3-none-any.whl (25 kB)\n",
            "Requirement already satisfied: pygments>=2.4.1 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from nbconvert->vissl==0.1.6) (2.14.0)\n",
            "Requirement already satisfied: traitlets>=5.0 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from nbconvert->vissl==0.1.6) (5.9.0)\n",
            "Requirement already satisfied: importlib-metadata>=3.6 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from nbconvert->vissl==0.1.6) (6.0.0)\n",
            "Collecting jupyterlab-pygments\n",
            "  Downloading jupyterlab_pygments-0.2.2-py2.py3-none-any.whl (21 kB)\n",
            "Collecting nodeenv>=0.11.1\n",
            "  Downloading nodeenv-1.7.0-py2.py3-none-any.whl (21 kB)\n",
            "Collecting cfgv>=2.0.0\n",
            "  Downloading cfgv-3.3.1-py2.py3-none-any.whl (7.3 kB)\n",
            "Collecting virtualenv>=20.10.0\n",
            "  Downloading virtualenv-20.19.0-py3-none-any.whl (8.7 MB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m8.7/8.7 MB\u001b[0m \u001b[31m921.3 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
            "\u001b[?25hCollecting identify>=1.0.0\n",
            "  Downloading identify-2.5.18-py2.py3-none-any.whl (98 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m98.8/98.8 kB\u001b[0m \u001b[31m889.2 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting docutils<0.20,>=0.18\n",
            "  Downloading docutils-0.19-py3-none-any.whl (570 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m570.5/570.5 kB\u001b[0m \u001b[31m899.9 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting babel>=2.9\n",
            "  Downloading Babel-2.11.0-py3-none-any.whl (9.5 MB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m9.5/9.5 MB\u001b[0m \u001b[31m925.3 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
            "\u001b[?25hCollecting imagesize>=1.3\n",
            "  Downloading imagesize-1.4.1-py2.py3-none-any.whl (8.8 kB)\n",
            "Collecting sphinxcontrib-serializinghtml>=1.1.5\n",
            "  Downloading sphinxcontrib_serializinghtml-1.1.5-py2.py3-none-any.whl (94 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m94.0/94.0 kB\u001b[0m \u001b[31m784.4 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting snowballstemmer>=2.0\n",
            "  Downloading snowballstemmer-2.2.0-py2.py3-none-any.whl (93 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m93.0/93.0 kB\u001b[0m \u001b[31m921.7 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting sphinxcontrib-devhelp\n",
            "  Downloading sphinxcontrib_devhelp-1.0.2-py2.py3-none-any.whl (84 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m84.7/84.7 kB\u001b[0m \u001b[31m931.5 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting sphinxcontrib-qthelp\n",
            "  Downloading sphinxcontrib_qthelp-1.0.3-py2.py3-none-any.whl (90 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m90.6/90.6 kB\u001b[0m \u001b[31m934.8 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting sphinxcontrib-applehelp\n",
            "  Downloading sphinxcontrib_applehelp-1.0.4-py3-none-any.whl (120 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m120.6/120.6 kB\u001b[0m \u001b[31m950.7 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting alabaster<0.8,>=0.7\n",
            "  Downloading alabaster-0.7.13-py3-none-any.whl (13 kB)\n",
            "Collecting sphinxcontrib-jsmath\n",
            "  Downloading sphinxcontrib_jsmath-1.0.1-py2.py3-none-any.whl (5.1 kB)\n",
            "Collecting sphinxcontrib-htmlhelp>=2.0.0\n",
            "  Downloading sphinxcontrib_htmlhelp-2.0.1-py3-none-any.whl (99 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m99.8/99.8 kB\u001b[0m \u001b[31m956.9 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting pytz>=2015.7\n",
            "  Downloading pytz-2022.7.1-py2.py3-none-any.whl (499 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m499.4/499.4 kB\u001b[0m \u001b[31m937.0 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting rsa<5,>=3.1.4\n",
            "  Using cached rsa-4.9-py3-none-any.whl (34 kB)\n",
            "Collecting pyasn1-modules>=0.2.1\n",
            "  Using cached pyasn1_modules-0.2.8-py2.py3-none-any.whl (155 kB)\n",
            "Requirement already satisfied: six>=1.9.0 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from google-auth<3,>=1.6.3->tensorboard>=1.15->vissl==0.1.6) (1.16.0)\n",
            "Collecting cachetools<6.0,>=2.0.0\n",
            "  Downloading cachetools-5.3.0-py3-none-any.whl (9.3 kB)\n",
            "Collecting requests-oauthlib>=0.7.0\n",
            "  Using cached requests_oauthlib-1.3.1-py2.py3-none-any.whl (23 kB)\n",
            "Requirement already satisfied: zipp>=0.5 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from importlib-metadata>=3.6->nbconvert->vissl==0.1.6) (3.13.0)\n",
            "Requirement already satisfied: platformdirs>=2.5 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from jupyter-core>=4.7->nbconvert->vissl==0.1.6) (3.0.0)\n",
            "Collecting matplotlib>=2.1.0\n",
            "  Downloading matplotlib-3.6.3-cp38-cp38-manylinux_2_12_x86_64.manylinux2010_x86_64.whl (9.4 MB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m9.4/9.4 MB\u001b[0m \u001b[31m922.5 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
            "\u001b[?25hRequirement already satisfied: python-dateutil>=2.7 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from matplotlib>=2.1.0->pycocotools>=2.0.1->vissl==0.1.6) (2.8.2)\n",
            "Requirement already satisfied: fonttools>=4.22.0 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from matplotlib>=2.1.0->pycocotools>=2.0.1->vissl==0.1.6) (4.38.0)\n",
            "Requirement already satisfied: contourpy>=1.0.1 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from matplotlib>=2.1.0->pycocotools>=2.0.1->vissl==0.1.6) (1.0.7)\n",
            "Requirement already satisfied: pyparsing>=2.2.1 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from matplotlib>=2.1.0->pycocotools>=2.0.1->vissl==0.1.6) (3.0.9)\n",
            "Requirement already satisfied: kiwisolver>=1.0.1 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from matplotlib>=2.1.0->pycocotools>=2.0.1->vissl==0.1.6) (1.4.4)\n",
            "Requirement already satisfied: cycler>=0.10 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from matplotlib>=2.1.0->pycocotools>=2.0.1->vissl==0.1.6) (0.11.0)\n",
            "Requirement already satisfied: jupyter-client>=6.1.12 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from nbclient>=0.5.0->nbconvert->vissl==0.1.6) (8.0.2)\n",
            "Collecting jsonschema>=2.6\n",
            "  Downloading jsonschema-4.17.3-py3-none-any.whl (90 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m90.4/90.4 kB\u001b[0m \u001b[31m904.1 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting fastjsonschema\n",
            "  Downloading fastjsonschema-2.16.2-py3-none-any.whl (22 kB)\n",
            "Collecting idna<4,>=2.5\n",
            "  Using cached idna-3.4-py3-none-any.whl (61 kB)\n",
            "Collecting charset-normalizer<4,>=2\n",
            "  Downloading charset_normalizer-3.0.1-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (195 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m195.4/195.4 kB\u001b[0m \u001b[31m837.2 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting urllib3<1.27,>=1.21.1\n",
            "  Downloading urllib3-1.26.14-py2.py3-none-any.whl (140 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m140.6/140.6 kB\u001b[0m \u001b[31m887.8 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hRequirement already satisfied: certifi>=2017.4.17 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from requests<3,>=2.21.0->tensorboard>=1.15->vissl==0.1.6) (2022.12.7)\n",
            "Collecting distlib<1,>=0.3.6\n",
            "  Downloading distlib-0.3.6-py2.py3-none-any.whl (468 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m468.5/468.5 kB\u001b[0m \u001b[31m935.0 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting filelock<4,>=3.4.1\n",
            "  Downloading filelock-3.9.0-py3-none-any.whl (9.7 kB)\n",
            "Collecting soupsieve>1.2\n",
            "  Using cached soupsieve-2.3.2.post1-py3-none-any.whl (37 kB)\n",
            "Collecting webencodings\n",
            "  Downloading webencodings-0.5.1-py2.py3-none-any.whl (11 kB)\n",
            "Collecting pyrsistent!=0.17.0,!=0.17.1,!=0.17.2,>=0.14.0\n",
            "  Downloading pyrsistent-0.19.3-py3-none-any.whl (57 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m57.5/57.5 kB\u001b[0m \u001b[31m979.4 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hCollecting pkgutil-resolve-name>=1.3.10\n",
            "  Using cached pkgutil_resolve_name-1.3.10-py3-none-any.whl (4.7 kB)\n",
            "Requirement already satisfied: pyzmq>=23.0 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from jupyter-client>=6.1.12->nbclient>=0.5.0->nbconvert->vissl==0.1.6) (25.0.0)\n",
            "Requirement already satisfied: tornado>=6.2 in /home/erik/anaconda3/envs/vissl_env/lib/python3.8/site-packages (from jupyter-client>=6.1.12->nbclient>=0.5.0->nbconvert->vissl==0.1.6) (6.2)\n",
            "Collecting pyasn1<0.5.0,>=0.4.6\n",
            "  Using cached pyasn1-0.4.8-py2.py3-none-any.whl (77 kB)\n",
            "Collecting oauthlib>=3.0.0\n",
            "  Downloading oauthlib-3.2.2-py3-none-any.whl (151 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m151.7/151.7 kB\u001b[0m \u001b[31m938.8 kB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
            "\u001b[?25hBuilding wheels for collected packages: pycocotools, bs4\n",
            "  Building wheel for pycocotools (pyproject.toml) ... \u001b[?25ldone\n",
            "\u001b[?25h  Created wheel for pycocotools: filename=pycocotools-2.0.6-cp38-cp38-linux_x86_64.whl size=425703 sha256=7f6caf17fefe208a32c8d88e4215692d5529f1087fce03ce2ea13c0f8683144c\n",
            "  Stored in directory: /home/erik/.cache/pip/wheels/3e/08/ac/58126fe59992032701437336493f6132e1b72381a62d00b595\n",
            "  Building wheel for bs4 (setup.py) ... \u001b[?25ldone\n",
            "\u001b[?25h  Created wheel for bs4: filename=bs4-0.0.1-py3-none-any.whl size=1272 sha256=18cd3dea37707295ff9338b5632d0e24babc46849277e8debbaa8ba2b98f2131\n",
            "  Stored in directory: /home/erik/.cache/pip/wheels/75/78/21/68b124549c9bdc94f822c02fb9aa3578a669843f9767776bca\n",
            "Successfully built pycocotools bs4\n",
            "Installing collected packages: webencodings, tensorboard-plugin-wit, snowballstemmer, pytz, pyasn1, mistune, mccabe, fastjsonschema, faiss-gpu, distlib, charset-normalizer, appdirs, urllib3, toml, tinycss2, tensorboard-data-server, sphinxcontrib-serializinghtml, sphinxcontrib-qthelp, sphinxcontrib-jsmath, sphinxcontrib-htmlhelp, sphinxcontrib-devhelp, sphinxcontrib-applehelp, soupsieve, rsa, pyrsistent, pyflakes, pycodestyle, pyasn1-modules, protobuf, pkgutil-resolve-name, pandocfilters, oauthlib, nodeenv, markupsafe, jupyterlab-pygments, isort, imagesize, idna, identify, grpcio, filelock, docutils, defusedxml, click, cfgv, cachetools, bleach, babel, attrs, alabaster, absl-py, werkzeug, virtualenv, requests, matplotlib, markdown, jsonschema, jinja2, google-auth, flake8, black, beautifulsoup4, vissl, sphinx, requests-oauthlib, pycocotools, pre-commit, nbformat, flake8-comprehensions, flake8-bugbear, bs4, nbclient, google-auth-oauthlib, tensorboard, nbconvert\n",
            "  Attempting uninstall: matplotlib\n",
            "    Found existing installation: matplotlib 3.7.0\n",
            "    Uninstalling matplotlib-3.7.0:\n",
            "      Successfully uninstalled matplotlib-3.7.0\n",
            "  Attempting uninstall: vissl\n",
            "    Found existing installation: vissl 0.1.6\n",
            "    Uninstalling vissl-0.1.6:\n",
            "      Successfully uninstalled vissl-0.1.6\n",
            "  Running setup.py develop for vissl\n",
            "Successfully installed absl-py-1.4.0 alabaster-0.7.13 appdirs-1.4.4 attrs-22.2.0 babel-2.11.0 beautifulsoup4-4.11.2 black-19.3b0 bleach-6.0.0 bs4-0.0.1 cachetools-5.3.0 cfgv-3.3.1 charset-normalizer-3.0.1 click-8.1.3 defusedxml-0.7.1 distlib-0.3.6 docutils-0.19 faiss-gpu-1.7.2 fastjsonschema-2.16.2 filelock-3.9.0 flake8-3.8.1 flake8-bugbear-23.2.13 flake8-comprehensions-3.10.1 google-auth-2.16.0 google-auth-oauthlib-0.4.6 grpcio-1.51.1 identify-2.5.18 idna-3.4 imagesize-1.4.1 isort-5.7.0 jinja2-3.1.2 jsonschema-4.17.3 jupyterlab-pygments-0.2.2 markdown-3.4.1 markupsafe-2.1.2 matplotlib-3.6.3 mccabe-0.6.1 mistune-2.0.5 nbclient-0.7.2 nbconvert-7.2.9 nbformat-5.7.3 nodeenv-1.7.0 oauthlib-3.2.2 pandocfilters-1.5.0 pkgutil-resolve-name-1.3.10 pre-commit-3.0.4 protobuf-4.21.12 pyasn1-0.4.8 pyasn1-modules-0.2.8 pycocotools-2.0.6 pycodestyle-2.6.0 pyflakes-2.2.0 pyrsistent-0.19.3 pytz-2022.7.1 requests-2.28.2 requests-oauthlib-1.3.1 rsa-4.9 snowballstemmer-2.2.0 soupsieve-2.3.2.post1 sphinx-6.1.3 sphinxcontrib-applehelp-1.0.4 sphinxcontrib-devhelp-1.0.2 sphinxcontrib-htmlhelp-2.0.1 sphinxcontrib-jsmath-1.0.1 sphinxcontrib-qthelp-1.0.3 sphinxcontrib-serializinghtml-1.1.5 tensorboard-2.12.0 tensorboard-data-server-0.7.0 tensorboard-plugin-wit-1.8.1 tinycss2-1.2.1 toml-0.10.2 urllib3-1.26.14 virtualenv-20.19.0 vissl-0.1.6 webencodings-0.5.1 werkzeug-2.2.2\n"
          ]
        }
      ],
      "source": [
        "# Install pytorch version 1.8\n",
        "# !pip install torch==1.8.0+cu101 torchvision==0.9.0+cu101 -f https://download.pytorch.org/whl/torch_stable.html\n",
        "\n",
        "# install Apex by checking system settings: cuda version, pytorch version, and python version\n",
        "import sys\n",
        "import torch\n",
        "version_str=\"\".join([\n",
        "    f\"py3{sys.version_info.minor}_cu\",\n",
        "    torch.version.cuda.replace(\".\",\"\"),\n",
        "    f\"_pyt{torch.__version__[0:5:2]}\"\n",
        "])\n",
        "print(version_str)\n",
        "\n",
        "# install apex (pre-compiled with optimizer C++ extensions and CUDA kernels)\n",
        "!pip install apex -f https://dl.fbaipublicfiles.com/vissl/packaging/apexwheels/{version_str}/download.html\n",
        "\n",
        "# # clone vissl repository and checkout latest version.\n",
        "!git clone --recursive https://github.com/facebookresearch/vissl.git\n",
        "\n",
        "%cd vissl/\n",
        "\n",
        "!git checkout v0.1.6\n",
        "!git checkout -b v0.1.6\n",
        "\n",
        "# install vissl dependencies\n",
        "!pip install --progress-bar off -r requirements.txt\n",
        "!pip install opencv-python\n",
        "\n",
        "# update classy vision install to commit compatible with v0.1.6\n",
        "!pip uninstall -y classy_vision\n",
        "!pip install classy-vision@https://github.com/facebookresearch/ClassyVision/tarball/4785d5ee19d3bcedd5b28c1eb51ea1f59188b54d\n",
        "\n",
        "# Update fairscale to commit compatible with v0.1.6\n",
        "!pip uninstall -y fairscale\n",
        "!pip install fairscale@https://github.com/facebookresearch/fairscale/tarball/df7db85cef7f9c30a5b821007754b96eb1f977b6\n",
        "\n",
        "# install vissl dev mode (e stands for editable)\n",
        "!pip install -e .[dev]"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 1,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "6SoUkgnwyU3G",
        "outputId": "448a9e55-6fc3-4d78-e4d9-29d5010ad982"
      },
      "outputs": [
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "/home/erik/anaconda3/envs/env_ats/lib/python3.8/site-packages/tqdm/auto.py:22: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
            "  from .autonotebook import tqdm as notebook_tqdm\n",
            "** fvcore version of PathManager will be deprecated soon. **\n",
            "** Please migrate to the version in iopath repo. **\n",
            "https://github.com/facebookresearch/iopath \n",
            "\n"
          ]
        }
      ],
      "source": [
        "import os\n",
        "from PIL import Image\n",
        "\n",
        "import numpy as np\n",
        "import matplotlib.pyplot as plt\n",
        "from omegaconf import OmegaConf\n",
        "\n",
        "import apex\n",
        "import vissl\n",
        "import yaml\n",
        "from vissl.utils.hydra_config import AttrDict\n",
        "from vissl.utils.hydra_config import compose_hydra_configuration, convert_to_attrdict\n",
        "from vissl.models import build_model\n",
        "from vissl.utils.checkpoint import init_model_from_consolidated_weights\n",
        "\n",
        "import torch\n",
        "import torch.nn as nn\n",
        "import torchvision.transforms as transforms\n",
        "import torch.nn.functional as F\n",
        "from torchvision.datasets import MNIST\n",
        "from vissl.utils.io import save_file\n",
        "from classy_vision.generic.util import load_checkpoint\n",
        "\n",
        "from torch.utils.data import DataLoader\n",
        "from vissl.data.ssl_transforms.mnist_img_pil_to_rgb_mode import MNISTImgPil2RGB\n",
        "from vissl.models.base_ssl_model import BaseSSLMultiInputOutputModel\n",
        "import torchvision.transforms as vision_transforms\n",
        "from tqdm import tqdm\n",
        "\n",
        "\n",
        "plt.rcParams[\"savefig.bbox\"] = 'tight'\n",
        "device = torch.device(\"cuda:0\" if torch.cuda.is_available() else \"cpu\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "ycV_MQ6HyVwL"
      },
      "outputs": [],
      "source": [
        "# Downloadng configs and backbone.\n",
        "!wget -q -O /content/resnet50-19c8e357.pth https://download.pytorch.org/models/resnet50-19c8e357.pth > /dev/null\n",
        "!wget -q -O configs/config/benchmark/linear_image_classification/mnist/eval_resnet_8gpu_transfer_mnist_linear.yaml https://raw.githubusercontent.com/facebookresearch/vissl/main/configs/config/benchmark/linear_image_classification/mnist/eval_resnet_8gpu_transfer_mnist_linear.yaml"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 20,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 379,
          "referenced_widgets": [
            "04ed3be3e4ee4a8b8169e46e1680d149",
            "b457bc23a8e64915baf0ba3c2a6b47fd",
            "d9553549b2d345049e107ec6f784f18b",
            "8f3d7ac36d934bf3b5866872410298eb",
            "86a29711e44a4cf3b495d5b5889a59e7",
            "d9bad2ff744e486aab9f90d9ae6b309e",
            "efefeefc09464cd883d5b10927c6d49b",
            "7dbb7fe18d0f4aed8f72eaaea1ee67a8",
            "82daabde61c945309fb19be31a7ef7d5",
            "5f94b05328da4e23adc15f7f6eb4e937",
            "fbf834b6b8564382b09cfe3b82dfd28c",
            "7280424dedbb407e8ac139f9adbf60a8",
            "97889e1a72d149479b042b4b24cdef3d",
            "486af1494c654b9b917d5f67a33f8f18",
            "75a3d4f67843440491448f273df1392a",
            "d10bd232bca94aa686ea6be815cd3948",
            "ff53d6bf93034731a3f36eedb3bbf6a4",
            "6b657966bd90498dac074b3f8d9ee6d1",
            "13be9d99438d4e91b8fb0935feeb04d6",
            "169ffc9494474b17b93ebf8467993673",
            "ac99589b5ed04cef8fb0cfd651686525",
            "5402033b366e4fbbaea81cf8faf8eccf",
            "9faf373ea16e487a8d7545efbe5ff404",
            "35b9c446ca3f44fd93025b18ad6e07cd",
            "9fea91ddc0154270a1fc79cd68217766",
            "f88e1a88b4264fac8bb02b17b32a9f47",
            "33cbf5dbac8c45c0bb6a9a44028e4ea3",
            "d18449be12ec4a61acd4b5f22e6f9b75",
            "6064004fabc648d0b5b035274d5c3425",
            "58474f7c3b064736b1792d0dadc0b3fc",
            "01fbe0cab1144cd3a3946b487da67a76",
            "fb0390b8a3384a68be7b0dc5a35093f3",
            "b239237acd33488ca73c46163688249f",
            "1987475dc3e147c195f7ac285657fa2b",
            "103c139cbdfe4b3b85e0a9a5514a6f9f",
            "4ce75f7cd5614e43b14f7ce27d7d8808",
            "6974105051a3492585f5e5d8f47a702e",
            "b4c3831ca0c841f4b4a9ad718e0f222f",
            "4d20a6f8e0444109a59f967c52f54401",
            "0ea01ccede9e4b5c9da043e764b8ff33",
            "707369e8ef3d4e7c8add8703e90a5f1c",
            "b5e2ab3980f34a9db83e9dfc37234ec5",
            "f95058a5b1624167832c9c339f3a0074",
            "1a3ce30907f7454d84516066700749a3"
          ]
        },
        "id": "MkSoRV2hFTUF",
        "outputId": "8b3d0723-7183-4a8f-f304-242eba5024b8"
      },
      "outputs": [],
      "source": [
        "# Preparing MNIST.\n",
        "\n",
        "ROOT = \"ats/data/\"  # Where to save data.\n",
        "_ = MNIST(root=ROOT, train=True, download=True)\n",
        "LABEL2IDX = {str(i): i for i in range(10)}\n",
        "N_CLASSES = len(LABEL2IDX)\n",
        "IDX2LABEL = {v: k for k, v in LABEL2IDX.items()}\n",
        "\n",
        "json_data = {\n",
        "    \"MNIST\": {\n",
        "      \"train\": [\n",
        "        ROOT, \"<unused>\"\n",
        "      ],\n",
        "      \"val\": [\n",
        "        ROOT, \"<unused>\"\n",
        "      ]\n",
        "    }\n",
        "}\n",
        "\n",
        "save_file(json_data, \"configs/config/dataset_catalog.json\", append_to_json=False)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 6,
      "metadata": {},
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "/home/erik/Documents/UCPH/AdversarialTransfer\n"
          ]
        }
      ],
      "source": [
        "!pwd"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "_bhczvjUGSQ6",
        "outputId": "edbae9e2-28ea-41fd-feca-52a5938701f9"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "** fvcore version of PathManager will be deprecated soon. **\n",
            "** Please migrate to the version in iopath repo. **\n",
            "https://github.com/facebookresearch/iopath \n",
            "\n",
            "####### overrides: ['hydra.verbose=true', 'config=benchmark/linear_image_classification/mnist/eval_resnet_8gpu_transfer_mnist_linear.yaml', 'config.DATA.TRAIN.DATA_SOURCES=[torchvision_dataset]', 'config.DATA.TRAIN.LABEL_SOURCES=[torchvision_dataset]', 'config.DATA.TRAIN.DATASET_NAMES=[MNIST]', 'config.DATA.TRAIN.DATA_PATHS=[/content/data/]', 'config.DATA.TEST.DATA_SOURCES=[torchvision_dataset]', 'config.DATA.TEST.LABEL_SOURCES=[torchvision_dataset]', 'config.DATA.TEST.DATASET_NAMES=[MNIST]', 'config.DATA.TEST.DATA_PATHS=[/content/data/]', 'config.TEST_MODEL=True', 'config.DATA.TEST.BATCHSIZE_PER_REPLICA=64', 'config.DATA.TRAIN.BATCHSIZE_PER_REPLICA=64', 'config.DISTRIBUTED.NUM_NODES=1', 'config.DISTRIBUTED.NUM_PROC_PER_NODE=1', 'config.OPTIMIZER.num_epochs=1', 'config.OPTIMIZER.param_schedulers.lr.values=[0.01]', 'config.OPTIMIZER.param_schedulers.lr.milestones=[]', 'config.CHECKPOINT.DIR=/content/my_trash_2/', 'config.CHECKPOINT.OVERWRITE_EXISTING=False', 'config.MODEL.WEIGHTS_INIT.PARAMS_FILE=/content/resnet50-19c8e357.pth', 'config.MODEL.WEIGHTS_INIT.STATE_DICT_KEY_NAME=', 'config.MODEL.WEIGHTS_INIT.APPEND_PREFIX=trunk._feature_blocks.', 'config.MODEL.FEATURE_EVAL_SETTINGS.EVAL_MODE_ON=True', 'config.MODEL.FEATURE_EVAL_SETTINGS.FREEZE_TRUNK_ONLY=False', 'config.MODEL.FEATURE_EVAL_SETTINGS.FREEZE_TRUNK_AND_HEAD=False', 'config.MODEL.FEATURE_EVAL_SETTINGS.EXTRACT_TRUNK_FEATURES_ONLY=False', 'config.MODEL.FEATURE_EVAL_SETTINGS.EVAL_TRUNK_AND_HEAD=False', 'config.MODEL.HEAD.PARAMS=[[eval_mlp, {in_channels: 2048, dims: [2048, 10]}]]', 'config.HOOKS.TENSORBOARD_SETUP.USE_TENSORBOARD=true']\n",
            "INFO 2023-02-14 14:16:13,776 distributed_launcher.py: 183: Spawning process for node_id: 0, local_rank: 0, dist_rank: 0, dist_run_id: localhost:56453\n",
            "INFO 2023-02-14 14:16:13,777 train.py:  94: Env set for rank: 0, dist_rank: 0\n",
            "INFO 2023-02-14 14:16:13,777 env.py:  50: CGROUP_MEMORY_EVENTS:\t/sys/fs/cgroup/memory.events /var/colab/cgroup/jupyter-children/memory.events\n",
            "INFO 2023-02-14 14:16:13,777 env.py:  50: CLICOLOR:\t1\n",
            "INFO 2023-02-14 14:16:13,777 env.py:  50: CLOUDSDK_CONFIG:\t/content/.config\n",
            "INFO 2023-02-14 14:16:13,777 env.py:  50: CLOUDSDK_PYTHON:\tpython3\n",
            "INFO 2023-02-14 14:16:13,777 env.py:  50: COLAB_BACKEND_VERSION:\tnext\n",
            "INFO 2023-02-14 14:16:13,777 env.py:  50: COLAB_RELEASE_TAG:\trelease-colab-20230210-060047-RC00\n",
            "INFO 2023-02-14 14:16:13,777 env.py:  50: CUDA_VERSION:\t11.6.2\n",
            "INFO 2023-02-14 14:16:13,777 env.py:  50: DATALAB_SETTINGS_OVERRIDES:\t{\"kernelManagerProxyPort\":6000,\"kernelManagerProxyHost\":\"172.28.0.12\",\"jupyterArgs\":[\"--ip=172.28.0.12\",\"--transport=ipc\"],\"debugAdapterMultiplexerPath\":\"/usr/local/bin/dap_multiplexer\",\"enableLsp\":true}\n",
            "INFO 2023-02-14 14:16:13,777 env.py:  50: DEBIAN_FRONTEND:\tnoninteractive\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: ENABLE_DIRECTORYPREFETCHER:\t1\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: ENV:\t/root/.bashrc\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: GCE_METADATA_TIMEOUT:\t3\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: GCS_READ_CACHE_BLOCK_SIZE_MB:\t16\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: GIT_PAGER:\tcat\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: HOME:\t/root\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: HOSTNAME:\t50e721256dd1\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: JPY_PARENT_PID:\t90\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: KMP_EXTRA_ARGS:\t--listen_host=172.28.0.12 --target_host=172.28.0.12 --tunnel_background_save_url=https://colab.research.google.com/tun/m/cc48301118ce562b961b3c22d803539adc1e0c19/gpu-t4-s-3pstg0xtyz8tz --tunnel_background_save_delay=10s --tunnel_periodic_background_save_frequency=30m0s --enable_output_coalescing=true --output_coalescing_required=true\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: KMP_LISTEN_PORT:\t6000\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: KMP_TARGET_PORT:\t9000\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: LANG:\ten_US.UTF-8\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: LAST_FORCED_REBUILD:\t20230130\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: LD_LIBRARY_PATH:\t/usr/lib64-nvidia\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: LIBRARY_PATH:\t/usr/local/cuda/lib64/stubs\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: LOCAL_RANK:\t0\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: MPLBACKEND:\tmodule://ipykernel.pylab.backend_inline\n",
            "INFO 2023-02-14 14:16:13,778 env.py:  50: NCCL_VERSION:\t2.12.10-1\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NO_GCE_CHECK:\tFalse\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NVARCH:\tx86_64\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NVIDIA_DRIVER_CAPABILITIES:\tcompute,utility\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NVIDIA_PRODUCT_NAME:\tCUDA\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NVIDIA_REQUIRE_CUDA:\tcuda>=11.6 brand=tesla,driver>=418,driver<419 brand=tesla,driver>=450,driver<451 brand=tesla,driver>=470,driver<471 brand=unknown,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=geforce,driver>=470,driver<471 brand=geforcertx,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=titan,driver>=470,driver<471 brand=titanrtx,driver>=470,driver<471\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NVIDIA_VISIBLE_DEVICES:\tall\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NV_CUDA_COMPAT_PACKAGE:\tcuda-compat-11-6\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NV_CUDA_CUDART_DEV_VERSION:\t11.6.55-1\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NV_CUDA_CUDART_VERSION:\t11.6.55-1\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NV_CUDA_LIB_VERSION:\t11.6.2-1\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NV_CUDNN_PACKAGE:\tlibcudnn8=8.4.0.27-1+cuda11.6\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NV_CUDNN_PACKAGE_DEV:\tlibcudnn8-dev=8.4.0.27-1+cuda11.6\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NV_CUDNN_PACKAGE_NAME:\tlibcudnn8\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NV_CUDNN_VERSION:\t8.4.0.27\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NV_LIBCUBLAS_DEV_PACKAGE:\tlibcublas-dev-11-6=11.9.2.110-1\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NV_LIBCUBLAS_DEV_PACKAGE_NAME:\tlibcublas-dev-11-6\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NV_LIBCUBLAS_DEV_VERSION:\t11.9.2.110-1\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NV_LIBCUBLAS_PACKAGE:\tlibcublas-11-6=11.9.2.110-1\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NV_LIBCUBLAS_PACKAGE_NAME:\tlibcublas-11-6\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NV_LIBCUBLAS_VERSION:\t11.9.2.110-1\n",
            "INFO 2023-02-14 14:16:13,779 env.py:  50: NV_LIBCUSPARSE_DEV_VERSION:\t11.7.2.124-1\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: NV_LIBCUSPARSE_VERSION:\t11.7.2.124-1\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: NV_LIBNCCL_DEV_PACKAGE:\tlibnccl-dev=2.12.10-1+cuda11.6\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: NV_LIBNCCL_DEV_PACKAGE_NAME:\tlibnccl-dev\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: NV_LIBNCCL_DEV_PACKAGE_VERSION:\t2.12.10-1\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: NV_LIBNCCL_PACKAGE:\tlibnccl2=2.12.10-1+cuda11.6\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: NV_LIBNCCL_PACKAGE_NAME:\tlibnccl2\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: NV_LIBNCCL_PACKAGE_VERSION:\t2.12.10-1\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: NV_LIBNPP_DEV_PACKAGE:\tlibnpp-dev-11-6=11.6.3.124-1\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: NV_LIBNPP_DEV_VERSION:\t11.6.3.124-1\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: NV_LIBNPP_PACKAGE:\tlibnpp-11-6=11.6.3.124-1\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: NV_LIBNPP_VERSION:\t11.6.3.124-1\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: NV_NVML_DEV_VERSION:\t11.6.55-1\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: NV_NVPROF_DEV_PACKAGE:\tcuda-nvprof-11-6=11.6.124-1\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: NV_NVPROF_VERSION:\t11.6.124-1\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: NV_NVTX_VERSION:\t11.6.124-1\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: OLDPWD:\t/\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: PAGER:\tcat\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: PATH:\t/opt/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/tools/node/bin:/tools/google-cloud-sdk/bin\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: PWD:\t/content/vissl\n",
            "INFO 2023-02-14 14:16:13,780 env.py:  50: PYDEVD_USE_FRAME_EVAL:\tNO\n",
            "INFO 2023-02-14 14:16:13,781 env.py:  50: PYTHONPATH:\t/env/python\n",
            "INFO 2023-02-14 14:16:13,781 env.py:  50: PYTHONWARNINGS:\tignore:::pip._internal.cli.base_command\n",
            "INFO 2023-02-14 14:16:13,781 env.py:  50: RANK:\t0\n",
            "INFO 2023-02-14 14:16:13,781 env.py:  50: SHELL:\t/bin/bash\n",
            "INFO 2023-02-14 14:16:13,781 env.py:  50: SHLVL:\t0\n",
            "INFO 2023-02-14 14:16:13,781 env.py:  50: TBE_CREDS_ADDR:\t172.28.0.1:8008\n",
            "INFO 2023-02-14 14:16:13,781 env.py:  50: TBE_EPHEM_CREDS_ADDR:\t172.28.0.1:8009\n",
            "INFO 2023-02-14 14:16:13,781 env.py:  50: TBE_RUNTIME_ADDR:\t172.28.0.1:8011\n",
            "INFO 2023-02-14 14:16:13,781 env.py:  50: TCLLIBPATH:\t/usr/share/tcltk/tcllib1.20\n",
            "INFO 2023-02-14 14:16:13,781 env.py:  50: TERM:\txterm-color\n",
            "INFO 2023-02-14 14:16:13,781 env.py:  50: TF_FORCE_GPU_ALLOW_GROWTH:\ttrue\n",
            "INFO 2023-02-14 14:16:13,781 env.py:  50: USE_AUTH_EPHEM:\t1\n",
            "INFO 2023-02-14 14:16:13,781 env.py:  50: VM_GCE_METADATA_HOST:\t169.254.169.253\n",
            "INFO 2023-02-14 14:16:13,781 env.py:  50: WORLD_SIZE:\t1\n",
            "INFO 2023-02-14 14:16:13,781 env.py:  50: _:\t/usr/bin/python3\n",
            "INFO 2023-02-14 14:16:13,781 env.py:  50: __EGL_VENDOR_LIBRARY_DIRS:\t/usr/lib64-nvidia:/usr/share/glvnd/egl_vendor.d/\n",
            "INFO 2023-02-14 14:16:13,781 misc.py: 161: Set start method of multiprocessing to forkserver\n",
            "INFO 2023-02-14 14:16:13,781 train.py: 105: Setting seed....\n",
            "INFO 2023-02-14 14:16:13,781 misc.py: 173: MACHINE SEED: 1\n",
            "INFO 2023-02-14 14:16:13,783 hydra_config.py: 132: Training with config:\n",
            "INFO 2023-02-14 14:16:13,788 hydra_config.py: 141: {'CHECKPOINT': {'APPEND_DISTR_RUN_ID': False,\n",
            "                'AUTO_RESUME': True,\n",
            "                'BACKEND': 'disk',\n",
            "                'CHECKPOINT_FREQUENCY': 1,\n",
            "                'CHECKPOINT_ITER_FREQUENCY': -1,\n",
            "                'DIR': '/content/my_trash_2/',\n",
            "                'LATEST_CHECKPOINT_RESUME_FILE_NUM': 1,\n",
            "                'OVERWRITE_EXISTING': False,\n",
            "                'USE_SYMLINK_CHECKPOINT_FOR_RESUME': False},\n",
            " 'CLUSTERFIT': {'CLUSTER_BACKEND': 'faiss',\n",
            "                'DATA_LIMIT': -1,\n",
            "                'DATA_LIMIT_SAMPLING': {'SEED': 0},\n",
            "                'FEATURES': {'DATASET_NAME': '',\n",
            "                             'DATA_PARTITION': 'TRAIN',\n",
            "                             'DIMENSIONALITY_REDUCTION': 0,\n",
            "                             'EXTRACT': False,\n",
            "                             'LAYER_NAME': '',\n",
            "                             'PATH': '.',\n",
            "                             'TEST_PARTITION': 'TEST'},\n",
            "                'NUM_CLUSTERS': 16000,\n",
            "                'NUM_ITER': 50,\n",
            "                'OUTPUT_DIR': '.'},\n",
            " 'DATA': {'DDP_BUCKET_CAP_MB': 25,\n",
            "          'ENABLE_ASYNC_GPU_COPY': True,\n",
            "          'NUM_DATALOADER_WORKERS': 5,\n",
            "          'PIN_MEMORY': True,\n",
            "          'TEST': {'BASE_DATASET': 'generic_ssl',\n",
            "                   'BATCHSIZE_PER_REPLICA': 64,\n",
            "                   'COLLATE_FUNCTION': 'default_collate',\n",
            "                   'COLLATE_FUNCTION_PARAMS': {},\n",
            "                   'COPY_DESTINATION_DIR': '/tmp/mnist/',\n",
            "                   'COPY_TO_LOCAL_DISK': False,\n",
            "                   'DATASET_NAMES': ['MNIST'],\n",
            "                   'DATA_LIMIT': -1,\n",
            "                   'DATA_LIMIT_SAMPLING': {'IS_BALANCED': False,\n",
            "                                           'SEED': 0,\n",
            "                                           'SKIP_NUM_SAMPLES': 0},\n",
            "                   'DATA_PATHS': ['/content/data/'],\n",
            "                   'DATA_SOURCES': ['torchvision_dataset'],\n",
            "                   'DEFAULT_GRAY_IMG_SIZE': 224,\n",
            "                   'DROP_LAST': False,\n",
            "                   'ENABLE_QUEUE_DATASET': False,\n",
            "                   'INPUT_KEY_NAMES': ['data'],\n",
            "                   'LABEL_PATHS': [],\n",
            "                   'LABEL_SOURCES': ['torchvision_dataset'],\n",
            "                   'LABEL_TYPE': 'standard',\n",
            "                   'MMAP_MODE': True,\n",
            "                   'NEW_IMG_PATH_PREFIX': '',\n",
            "                   'RANDOM_SYNTHETIC_IMAGES': False,\n",
            "                   'REMOVE_IMG_PATH_PREFIX': '',\n",
            "                   'TARGET_KEY_NAMES': ['label'],\n",
            "                   'TRANSFORMS': [{'box': [2, 2],\n",
            "                                   'name': 'MNISTImgPil2RGB',\n",
            "                                   'size': 32},\n",
            "                                  {'name': 'Resize', 'size': 224},\n",
            "                                  {'name': 'ToTensor'},\n",
            "                                  {'mean': [0.485, 0.456, 0.406],\n",
            "                                   'name': 'Normalize',\n",
            "                                   'std': [0.229, 0.224, 0.225]}],\n",
            "                   'USE_DEBUGGING_SAMPLER': False,\n",
            "                   'USE_STATEFUL_DISTRIBUTED_SAMPLER': False},\n",
            "          'TRAIN': {'BASE_DATASET': 'generic_ssl',\n",
            "                    'BATCHSIZE_PER_REPLICA': 64,\n",
            "                    'COLLATE_FUNCTION': 'default_collate',\n",
            "                    'COLLATE_FUNCTION_PARAMS': {},\n",
            "                    'COPY_DESTINATION_DIR': '/tmp/mnist/',\n",
            "                    'COPY_TO_LOCAL_DISK': False,\n",
            "                    'DATASET_NAMES': ['MNIST'],\n",
            "                    'DATA_LIMIT': -1,\n",
            "                    'DATA_LIMIT_SAMPLING': {'IS_BALANCED': False,\n",
            "                                            'SEED': 0,\n",
            "                                            'SKIP_NUM_SAMPLES': 0},\n",
            "                    'DATA_PATHS': ['/content/data/'],\n",
            "                    'DATA_SOURCES': ['torchvision_dataset'],\n",
            "                    'DEFAULT_GRAY_IMG_SIZE': 224,\n",
            "                    'DROP_LAST': False,\n",
            "                    'ENABLE_QUEUE_DATASET': False,\n",
            "                    'INPUT_KEY_NAMES': ['data'],\n",
            "                    'LABEL_PATHS': [],\n",
            "                    'LABEL_SOURCES': ['torchvision_dataset'],\n",
            "                    'LABEL_TYPE': 'standard',\n",
            "                    'MMAP_MODE': True,\n",
            "                    'NEW_IMG_PATH_PREFIX': '',\n",
            "                    'RANDOM_SYNTHETIC_IMAGES': False,\n",
            "                    'REMOVE_IMG_PATH_PREFIX': '',\n",
            "                    'TARGET_KEY_NAMES': ['label'],\n",
            "                    'TRANSFORMS': [{'box': [2, 2],\n",
            "                                    'name': 'MNISTImgPil2RGB',\n",
            "                                    'size': 32},\n",
            "                                   {'name': 'Resize', 'size': 224},\n",
            "                                   {'name': 'ToTensor'},\n",
            "                                   {'mean': [0.485, 0.456, 0.406],\n",
            "                                    'name': 'Normalize',\n",
            "                                    'std': [0.229, 0.224, 0.225]}],\n",
            "                    'USE_DEBUGGING_SAMPLER': False,\n",
            "                    'USE_STATEFUL_DISTRIBUTED_SAMPLER': False}},\n",
            " 'DISTRIBUTED': {'BACKEND': 'nccl',\n",
            "                 'BROADCAST_BUFFERS': True,\n",
            "                 'INIT_METHOD': 'tcp',\n",
            "                 'MANUAL_GRADIENT_REDUCTION': False,\n",
            "                 'NCCL_DEBUG': False,\n",
            "                 'NCCL_SOCKET_NTHREADS': '',\n",
            "                 'NUM_NODES': 1,\n",
            "                 'NUM_PROC_PER_NODE': 1,\n",
            "                 'RUN_ID': 'auto'},\n",
            " 'EXTRACT_FEATURES': {'CHUNK_THRESHOLD': 0, 'OUTPUT_DIR': ''},\n",
            " 'HOOKS': {'CHECK_NAN': True,\n",
            "           'LOG_GPU_STATS': True,\n",
            "           'MEMORY_SUMMARY': {'DUMP_MEMORY_ON_EXCEPTION': False,\n",
            "                              'LOG_ITERATION_NUM': 0,\n",
            "                              'PRINT_MEMORY_SUMMARY': True},\n",
            "           'MODEL_COMPLEXITY': {'COMPUTE_COMPLEXITY': False,\n",
            "                                'INPUT_SHAPE': [3, 224, 224]},\n",
            "           'PERF_STATS': {'MONITOR_PERF_STATS': True,\n",
            "                          'PERF_STAT_FREQUENCY': -1,\n",
            "                          'ROLLING_BTIME_FREQ': -1},\n",
            "           'TENSORBOARD_SETUP': {'EXPERIMENT_LOG_DIR': 'tensorboard',\n",
            "                                 'FLUSH_EVERY_N_MIN': 5,\n",
            "                                 'LOG_DIR': '.',\n",
            "                                 'LOG_PARAMS': True,\n",
            "                                 'LOG_PARAMS_EVERY_N_ITERS': 310,\n",
            "                                 'LOG_PARAMS_GRADIENTS': True,\n",
            "                                 'USE_TENSORBOARD': True}},\n",
            " 'IMG_RETRIEVAL': {'CROP_QUERY_ROI': False,\n",
            "                   'DATASET_PATH': '',\n",
            "                   'DEBUG_MODE': False,\n",
            "                   'EVAL_BINARY_PATH': '',\n",
            "                   'EVAL_DATASET_NAME': 'Paris',\n",
            "                   'FEATS_PROCESSING_TYPE': '',\n",
            "                   'GEM_POOL_POWER': 4.0,\n",
            "                   'IMG_SCALINGS': [1],\n",
            "                   'NORMALIZE_FEATURES': True,\n",
            "                   'NUM_DATABASE_SAMPLES': -1,\n",
            "                   'NUM_QUERY_SAMPLES': -1,\n",
            "                   'NUM_TRAINING_SAMPLES': -1,\n",
            "                   'N_PCA': 512,\n",
            "                   'RESIZE_IMG': 1024,\n",
            "                   'SAVE_FEATURES': False,\n",
            "                   'SAVE_RETRIEVAL_RANKINGS_SCORES': True,\n",
            "                   'SIMILARITY_MEASURE': 'cosine_similarity',\n",
            "                   'SPATIAL_LEVELS': 3,\n",
            "                   'TRAIN_DATASET_NAME': 'Oxford',\n",
            "                   'TRAIN_PCA_WHITENING': True,\n",
            "                   'USE_DISTRACTORS': False,\n",
            "                   'WHITEN_IMG_LIST': ''},\n",
            " 'LOG_FREQUENCY': 200,\n",
            " 'LOSS': {'CrossEntropyLoss': {'ignore_index': -1},\n",
            "          'barlow_twins_loss': {'embedding_dim': 8192,\n",
            "                                'lambda_': 0.0051,\n",
            "                                'scale_loss': 0.024},\n",
            "          'bce_logits_multiple_output_single_target': {'normalize_output': False,\n",
            "                                                       'reduction': 'none',\n",
            "                                                       'world_size': 1},\n",
            "          'cross_entropy_multiple_output_single_target': {'ignore_index': -1,\n",
            "                                                          'normalize_output': False,\n",
            "                                                          'reduction': 'mean',\n",
            "                                                          'temperature': 1.0,\n",
            "                                                          'weight': None},\n",
            "          'deepclusterv2_loss': {'BATCHSIZE_PER_REPLICA': 256,\n",
            "                                 'DROP_LAST': True,\n",
            "                                 'kmeans_iters': 10,\n",
            "                                 'memory_params': {'crops_for_mb': [0],\n",
            "                                                   'embedding_dim': 128},\n",
            "                                 'num_clusters': [3000, 3000, 3000],\n",
            "                                 'num_crops': 2,\n",
            "                                 'num_train_samples': -1,\n",
            "                                 'temperature': 0.1},\n",
            "          'dino_loss': {'crops_for_teacher': [0, 1],\n",
            "                        'ema_center': 0.9,\n",
            "                        'momentum': 0.996,\n",
            "                        'normalize_last_layer': True,\n",
            "                        'output_dim': 65536,\n",
            "                        'student_temp': 0.1,\n",
            "                        'teacher_temp_max': 0.07,\n",
            "                        'teacher_temp_min': 0.04,\n",
            "                        'teacher_temp_warmup_iters': 37500},\n",
            "          'moco_loss': {'embedding_dim': 128,\n",
            "                        'momentum': 0.999,\n",
            "                        'queue_size': 65536,\n",
            "                        'temperature': 0.2},\n",
            "          'multicrop_simclr_info_nce_loss': {'buffer_params': {'effective_batch_size': 4096,\n",
            "                                                               'embedding_dim': 128,\n",
            "                                                               'world_size': 64},\n",
            "                                             'num_crops': 2,\n",
            "                                             'temperature': 0.1},\n",
            "          'name': 'cross_entropy_multiple_output_single_target',\n",
            "          'nce_loss_with_memory': {'loss_type': 'nce',\n",
            "                                   'loss_weights': [1.0],\n",
            "                                   'memory_params': {'embedding_dim': 128,\n",
            "                                                     'memory_size': -1,\n",
            "                                                     'momentum': 0.5,\n",
            "                                                     'norm_init': True,\n",
            "                                                     'update_mem_on_forward': True},\n",
            "                                   'negative_sampling_params': {'num_negatives': 16000,\n",
            "                                                                'type': 'random'},\n",
            "                                   'norm_constant': -1,\n",
            "                                   'norm_embedding': True,\n",
            "                                   'num_train_samples': -1,\n",
            "                                   'temperature': 0.07,\n",
            "                                   'update_mem_with_emb_index': -100},\n",
            "          'simclr_info_nce_loss': {'buffer_params': {'effective_batch_size': 4096,\n",
            "                                                     'embedding_dim': 128,\n",
            "                                                     'world_size': 64},\n",
            "                                   'temperature': 0.1},\n",
            "          'swav_loss': {'crops_for_assign': [0, 1],\n",
            "                        'embedding_dim': 128,\n",
            "                        'epsilon': 0.05,\n",
            "                        'normalize_last_layer': True,\n",
            "                        'num_crops': 2,\n",
            "                        'num_iters': 3,\n",
            "                        'num_prototypes': [3000],\n",
            "                        'output_dir': '.',\n",
            "                        'queue': {'local_queue_length': 0,\n",
            "                                  'queue_length': 0,\n",
            "                                  'start_iter': 0},\n",
            "                        'temp_hard_assignment_iters': 0,\n",
            "                        'temperature': 0.1,\n",
            "                        'use_double_precision': False},\n",
            "          'swav_momentum_loss': {'crops_for_assign': [0, 1],\n",
            "                                 'embedding_dim': 128,\n",
            "                                 'epsilon': 0.05,\n",
            "                                 'momentum': 0.99,\n",
            "                                 'momentum_eval_mode_iter_start': 0,\n",
            "                                 'normalize_last_layer': True,\n",
            "                                 'num_crops': 2,\n",
            "                                 'num_iters': 3,\n",
            "                                 'num_prototypes': [3000],\n",
            "                                 'queue': {'local_queue_length': 0,\n",
            "                                           'queue_length': 0,\n",
            "                                           'start_iter': 0},\n",
            "                                 'temperature': 0.1,\n",
            "                                 'use_double_precision': False}},\n",
            " 'MACHINE': {'DEVICE': 'gpu'},\n",
            " 'METERS': {'accuracy_list_meter': {'meter_names': [],\n",
            "                                    'num_meters': 1,\n",
            "                                    'topk_values': [1]},\n",
            "            'enable_training_meter': True,\n",
            "            'mean_ap_list_meter': {'max_cpu_capacity': -1,\n",
            "                                   'meter_names': [],\n",
            "                                   'num_classes': 9605,\n",
            "                                   'num_meters': 1},\n",
            "            'model_output_mask': False,\n",
            "            'name': 'accuracy_list_meter',\n",
            "            'names': ['accuracy_list_meter'],\n",
            "            'precision_at_k_list_meter': {'meter_names': [],\n",
            "                                          'num_meters': 1,\n",
            "                                          'topk_values': [1]},\n",
            "            'recall_at_k_list_meter': {'meter_names': [],\n",
            "                                       'num_meters': 1,\n",
            "                                       'topk_values': [1]}},\n",
            " 'MODEL': {'ACTIVATION_CHECKPOINTING': {'NUM_ACTIVATION_CHECKPOINTING_SPLITS': 2,\n",
            "                                        'USE_ACTIVATION_CHECKPOINTING': False},\n",
            "           'AMP_PARAMS': {'AMP_ARGS': {'opt_level': 'O1'},\n",
            "                          'AMP_TYPE': 'apex',\n",
            "                          'USE_AMP': False},\n",
            "           'BASE_MODEL_NAME': 'multi_input_output_model',\n",
            "           'CUDA_CACHE': {'CLEAR_CUDA_CACHE': False, 'CLEAR_FREQ': 100},\n",
            "           'FEATURE_EVAL_SETTINGS': {'EVAL_MODE_ON': True,\n",
            "                                     'EVAL_TRUNK_AND_HEAD': False,\n",
            "                                     'EXTRACT_TRUNK_FEATURES_ONLY': False,\n",
            "                                     'FREEZE_TRUNK_AND_HEAD': False,\n",
            "                                     'FREEZE_TRUNK_ONLY': False,\n",
            "                                     'LINEAR_EVAL_FEAT_POOL_OPS_MAP': [['res5',\n",
            "                                                                        ['AdaptiveAvgPool2d',\n",
            "                                                                         [[1,\n",
            "                                                                           1]]]]],\n",
            "                                     'SHOULD_FLATTEN_FEATS': False},\n",
            "           'FSDP_CONFIG': {'AUTO_WRAP_THRESHOLD': 0,\n",
            "                           'bucket_cap_mb': 0,\n",
            "                           'clear_autocast_cache': True,\n",
            "                           'compute_dtype': torch.float32,\n",
            "                           'flatten_parameters': True,\n",
            "                           'fp32_reduce_scatter': False,\n",
            "                           'mixed_precision': True,\n",
            "                           'verbose': True},\n",
            "           'GRAD_CLIP': {'MAX_NORM': 1, 'NORM_TYPE': 2, 'USE_GRAD_CLIP': False},\n",
            "           'HEAD': {'BATCHNORM_EPS': 1e-05,\n",
            "                    'BATCHNORM_MOMENTUM': 0.1,\n",
            "                    'PARAMS': [['eval_mlp',\n",
            "                                {'dims': [2048, 10], 'in_channels': 2048}]],\n",
            "                    'PARAMS_MULTIPLIER': 1.0},\n",
            "           'INPUT_TYPE': 'rgb',\n",
            "           'MULTI_INPUT_HEAD_MAPPING': [],\n",
            "           'NON_TRAINABLE_PARAMS': [],\n",
            "           'SHARDED_DDP_SETUP': {'USE_SDP': False, 'reduce_buffer_size': -1},\n",
            "           'SINGLE_PASS_EVERY_CROP': False,\n",
            "           'SYNC_BN_CONFIG': {'CONVERT_BN_TO_SYNC_BN': True,\n",
            "                              'GROUP_SIZE': 8,\n",
            "                              'SYNC_BN_TYPE': 'apex'},\n",
            "           'TEMP_FROZEN_PARAMS_ITER_MAP': [],\n",
            "           'TRUNK': {'CONVIT': {'CLASS_TOKEN_IN_LOCAL_LAYERS': False,\n",
            "                                'LOCALITY_DIM': 10,\n",
            "                                'LOCALITY_STRENGTH': 1.0,\n",
            "                                'N_GPSA_LAYERS': 10,\n",
            "                                'USE_LOCAL_INIT': True},\n",
            "                     'EFFICIENT_NETS': {},\n",
            "                     'NAME': 'resnet',\n",
            "                     'REGNET': {},\n",
            "                     'RESNETS': {'DEPTH': 50,\n",
            "                                 'GROUPNORM_GROUPS': 32,\n",
            "                                 'GROUPS': 1,\n",
            "                                 'LAYER4_STRIDE': 2,\n",
            "                                 'NORM': 'BatchNorm',\n",
            "                                 'STANDARDIZE_CONVOLUTIONS': False,\n",
            "                                 'WIDTH_MULTIPLIER': 1,\n",
            "                                 'WIDTH_PER_GROUP': 64,\n",
            "                                 'ZERO_INIT_RESIDUAL': False},\n",
            "                     'VISION_TRANSFORMERS': {'ATTENTION_DROPOUT_RATE': 0,\n",
            "                                             'CLASSIFIER': 'token',\n",
            "                                             'DROPOUT_RATE': 0,\n",
            "                                             'DROP_PATH_RATE': 0,\n",
            "                                             'HIDDEN_DIM': 768,\n",
            "                                             'IMAGE_SIZE': 224,\n",
            "                                             'MLP_DIM': 3072,\n",
            "                                             'NUM_HEADS': 12,\n",
            "                                             'NUM_LAYERS': 12,\n",
            "                                             'PATCH_SIZE': 16,\n",
            "                                             'QKV_BIAS': False,\n",
            "                                             'QK_SCALE': False,\n",
            "                                             'name': None},\n",
            "                     'XCIT': {'ATTENTION_DROPOUT_RATE': 0,\n",
            "                              'DROPOUT_RATE': 0,\n",
            "                              'DROP_PATH_RATE': 0.05,\n",
            "                              'ETA': 1,\n",
            "                              'HIDDEN_DIM': 384,\n",
            "                              'IMAGE_SIZE': 224,\n",
            "                              'NUM_HEADS': 8,\n",
            "                              'NUM_LAYERS': 12,\n",
            "                              'PATCH_SIZE': 16,\n",
            "                              'QKV_BIAS': True,\n",
            "                              'QK_SCALE': False,\n",
            "                              'TOKENS_NORM': True,\n",
            "                              'name': None}},\n",
            "           'WEIGHTS_INIT': {'APPEND_PREFIX': 'trunk._feature_blocks.',\n",
            "                            'PARAMS_FILE': '/content/resnet50-19c8e357.pth',\n",
            "                            'REMOVE_PREFIX': '',\n",
            "                            'SKIP_LAYERS': ['num_batches_tracked'],\n",
            "                            'STATE_DICT_KEY_NAME': ''},\n",
            "           '_MODEL_INIT_SEED': 1},\n",
            " 'MONITORING': {'MONITOR_ACTIVATION_STATISTICS': 0},\n",
            " 'MULTI_PROCESSING_METHOD': 'forkserver',\n",
            " 'NEAREST_NEIGHBOR': {'L2_NORM_FEATS': False, 'SIGMA': 0.1, 'TOPK': 200},\n",
            " 'OPTIMIZER': {'betas': [0.9, 0.999],\n",
            "               'construct_single_param_group_only': False,\n",
            "               'head_optimizer_params': {'use_different_lr': False,\n",
            "                                         'use_different_wd': False,\n",
            "                                         'weight_decay': 0.0005},\n",
            "               'larc_config': {'clip': False,\n",
            "                               'eps': 1e-08,\n",
            "                               'trust_coefficient': 0.001},\n",
            "               'momentum': 0.9,\n",
            "               'name': 'sgd',\n",
            "               'nesterov': True,\n",
            "               'non_regularized_parameters': [],\n",
            "               'num_epochs': 1,\n",
            "               'param_schedulers': {'lr': {'auto_lr_scaling': {'auto_scale': True,\n",
            "                                                               'base_lr_batch_size': 256,\n",
            "                                                               'base_value': 0.01,\n",
            "                                                               'scaling_type': 'linear'},\n",
            "                                           'end_value': 0.0,\n",
            "                                           'interval_scaling': [],\n",
            "                                           'lengths': [],\n",
            "                                           'milestones': [],\n",
            "                                           'name': 'multistep',\n",
            "                                           'schedulers': [],\n",
            "                                           'start_value': 0.1,\n",
            "                                           'update_interval': 'epoch',\n",
            "                                           'value': 0.1,\n",
            "                                           'values': [0.0025]},\n",
            "                                    'lr_head': {'auto_lr_scaling': {'auto_scale': True,\n",
            "                                                                    'base_lr_batch_size': 256,\n",
            "                                                                    'base_value': 0.01,\n",
            "                                                                    'scaling_type': 'linear'},\n",
            "                                                'end_value': 0.0,\n",
            "                                                'interval_scaling': [],\n",
            "                                                'lengths': [],\n",
            "                                                'milestones': [],\n",
            "                                                'name': 'multistep',\n",
            "                                                'schedulers': [],\n",
            "                                                'start_value': 0.1,\n",
            "                                                'update_interval': 'epoch',\n",
            "                                                'value': 0.1,\n",
            "                                                'values': [0.0025]}},\n",
            "               'regularize_bias': True,\n",
            "               'regularize_bn': False,\n",
            "               'use_larc': False,\n",
            "               'use_zero': False,\n",
            "               'weight_decay': 0.0005},\n",
            " 'PROFILING': {'MEMORY_PROFILING': {'TRACK_BY_LAYER_MEMORY': False},\n",
            "               'NUM_ITERATIONS': 10,\n",
            "               'OUTPUT_FOLDER': '.',\n",
            "               'PROFILED_RANKS': [0, 1],\n",
            "               'RUNTIME_PROFILING': {'LEGACY_PROFILER': False,\n",
            "                                     'PROFILE_CPU': True,\n",
            "                                     'PROFILE_GPU': True,\n",
            "                                     'USE_PROFILER': False},\n",
            "               'START_ITERATION': 0,\n",
            "               'STOP_TRAINING_AFTER_PROFILING': False,\n",
            "               'WARMUP_ITERATIONS': 0},\n",
            " 'REPRODUCIBILITY': {'CUDDN_DETERMINISTIC': False},\n",
            " 'SEED_VALUE': 1,\n",
            " 'SLURM': {'ADDITIONAL_PARAMETERS': {},\n",
            "           'COMMENT': 'vissl job',\n",
            "           'CONSTRAINT': '',\n",
            "           'LOG_FOLDER': '.',\n",
            "           'MEM_GB': 250,\n",
            "           'NAME': 'vissl',\n",
            "           'NUM_CPU_PER_PROC': 8,\n",
            "           'PARTITION': '',\n",
            "           'PORT_ID': 40050,\n",
            "           'TIME_HOURS': 72,\n",
            "           'TIME_MINUTES': 0,\n",
            "           'USE_SLURM': False},\n",
            " 'SVM': {'cls_list': [],\n",
            "         'costs': {'base': -1.0,\n",
            "                   'costs_list': [0.1, 0.01],\n",
            "                   'power_range': [4, 20]},\n",
            "         'cross_val_folds': 3,\n",
            "         'dual': True,\n",
            "         'force_retrain': False,\n",
            "         'loss': 'squared_hinge',\n",
            "         'low_shot': {'dataset_name': 'voc',\n",
            "                      'k_values': [1, 2, 4, 8, 16, 32, 64, 96],\n",
            "                      'sample_inds': [1, 2, 3, 4, 5]},\n",
            "         'max_iter': 2000,\n",
            "         'normalize': True,\n",
            "         'penalty': 'l2'},\n",
            " 'TEST_EVERY_NUM_EPOCH': 1,\n",
            " 'TEST_MODEL': True,\n",
            " 'TEST_ONLY': False,\n",
            " 'TRAINER': {'TASK_NAME': 'self_supervision_task',\n",
            "             'TRAIN_STEP_NAME': 'standard_train_step'},\n",
            " 'VERBOSE': True}\n",
            "INFO 2023-02-14 14:16:14,356 train.py: 117: System config:\n",
            "-------------------  ---------------------------------------------------------------\n",
            "sys.platform         linux\n",
            "Python               3.8.10 (default, Nov 14 2022, 12:59:47) [GCC 9.4.0]\n",
            "numpy                1.19.5\n",
            "Pillow               7.1.2\n",
            "vissl                0.1.6 @/content/vissl/vissl\n",
            "GPU available        True\n",
            "GPU 0                Tesla T4\n",
            "CUDA_HOME            /usr/local/cuda\n",
            "torchvision          0.9.0+cu101 @/usr/local/lib/python3.8/dist-packages/torchvision\n",
            "hydra                1.0.7 @/usr/local/lib/python3.8/dist-packages/hydra\n",
            "classy_vision        0.7.0.dev @/usr/local/lib/python3.8/dist-packages/classy_vision\n",
            "tensorboard          2.11.2\n",
            "apex                 0.1 @/usr/local/lib/python3.8/dist-packages/apex\n",
            "cv2                  4.6.0\n",
            "PyTorch              1.8.0+cu101 @/usr/local/lib/python3.8/dist-packages/torch\n",
            "PyTorch debug build  False\n",
            "-------------------  ---------------------------------------------------------------\n",
            "PyTorch built with:\n",
            "  - GCC 7.3\n",
            "  - C++ Version: 201402\n",
            "  - Intel(R) Math Kernel Library Version 2020.0.0 Product Build 20191122 for Intel(R) 64 architecture applications\n",
            "  - Intel(R) MKL-DNN v1.7.0 (Git Hash 7aed236906b1f7a05c0917e5257a1af05e9ff683)\n",
            "  - OpenMP 201511 (a.k.a. OpenMP 4.5)\n",
            "  - NNPACK is enabled\n",
            "  - CPU capability usage: AVX2\n",
            "  - CUDA Runtime 10.1\n",
            "  - NVCC architecture flags: -gencode;arch=compute_37,code=sm_37;-gencode;arch=compute_50,code=sm_50;-gencode;arch=compute_60,code=sm_60;-gencode;arch=compute_70,code=sm_70\n",
            "  - CuDNN 7.6.3\n",
            "  - Magma 2.5.2\n",
            "  - Build settings: BLAS_INFO=mkl, BUILD_TYPE=Release, CUDA_VERSION=10.1, CUDNN_VERSION=7.6.3, CXX_COMPILER=/opt/rh/devtoolset-7/root/usr/bin/c++, CXX_FLAGS= -Wno-deprecated -fvisibility-inlines-hidden -DUSE_PTHREADPOOL -fopenmp -DNDEBUG -DUSE_KINETO -DUSE_FBGEMM -DUSE_QNNPACK -DUSE_PYTORCH_QNNPACK -DUSE_XNNPACK -O2 -fPIC -Wno-narrowing -Wall -Wextra -Werror=return-type -Wno-missing-field-initializers -Wno-type-limits -Wno-array-bounds -Wno-unknown-pragmas -Wno-sign-compare -Wno-unused-parameter -Wno-unused-variable -Wno-unused-function -Wno-unused-result -Wno-unused-local-typedefs -Wno-strict-overflow -Wno-strict-aliasing -Wno-error=deprecated-declarations -Wno-stringop-overflow -Wno-psabi -Wno-error=pedantic -Wno-error=redundant-decls -Wno-error=old-style-cast -fdiagnostics-color=always -faligned-new -Wno-unused-but-set-variable -Wno-maybe-uninitialized -fno-math-errno -fno-trapping-math -Werror=format -Wno-stringop-overflow, LAPACK_INFO=mkl, PERF_WITH_AVX=1, PERF_WITH_AVX2=1, PERF_WITH_AVX512=1, TORCH_VERSION=1.8.0, USE_CUDA=ON, USE_CUDNN=ON, USE_EXCEPTION_PTR=1, USE_GFLAGS=OFF, USE_GLOG=OFF, USE_MKL=ON, USE_MKLDNN=ON, USE_MPI=OFF, USE_NCCL=ON, USE_NNPACK=ON, USE_OPENMP=ON, \n",
            "\n",
            "CPU info:\n",
            "-------------------------------  ----------------------------------\n",
            "Architecture                     x86_64\n",
            "CPU op-mode(s)                   32-bit, 64-bit\n",
            "Byte Order                       Little Endian\n",
            "Address sizes                    46 bits physical, 48 bits virtual\n",
            "CPU(s)                           2\n",
            "On-line CPU(s) list              0,1\n",
            "Thread(s) per core               2\n",
            "Core(s) per socket               1\n",
            "Socket(s)                        1\n",
            "NUMA node(s)                     1\n",
            "Vendor ID                        GenuineIntel\n",
            "CPU family                       6\n",
            "Model                            85\n",
            "Model name                       Intel(R) Xeon(R) CPU @ 2.00GHz\n",
            "Stepping                         3\n",
            "CPU MHz                          2000.144\n",
            "BogoMIPS                         4000.28\n",
            "Hypervisor vendor                KVM\n",
            "Virtualization type              full\n",
            "L1d cache                        32 KiB\n",
            "L1i cache                        32 KiB\n",
            "L2 cache                         1 MiB\n",
            "L3 cache                         38.5 MiB\n",
            "NUMA node0 CPU(s)                0,1\n",
            "Vulnerability Itlb multihit      Not affected\n",
            "Vulnerability L1tf               Mitigation; PTE Inversion\n",
            "Vulnerability Mds                Vulnerable; SMT Host state unknown\n",
            "Vulnerability Meltdown           Vulnerable\n",
            "Vulnerability Mmio stale data    Vulnerable\n",
            "Vulnerability Retbleed           Vulnerable\n",
            "Vulnerability Spec store bypass  Vulnerable\n",
            "Vulnerability Spectre v1         Vulnerable\n",
            "Vulnerability Spectre v2         Vulnerable, IBPB\n",
            "Vulnerability Srbds              Not affected\n",
            "Vulnerability Tsx async abort    Vulnerable\n",
            "-------------------------------  ----------------------------------\n",
            "INFO 2023-02-14 14:16:14,357 tensorboard.py:  49: Tensorboard dir: /content/my_trash_2//tb_logs\n",
            "2023-02-14 14:16:14.360792: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations:  AVX2 AVX512F FMA\n",
            "To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
            "Traceback (most recent call last):\n",
            "  File \"/usr/local/lib/python3.8/dist-packages/tensorboard/compat/__init__.py\", line 42, in tf\n",
            "    from tensorboard.compat import notf  # noqa: F401\n",
            "ImportError: cannot import name 'notf' from 'tensorboard.compat' (/usr/local/lib/python3.8/dist-packages/tensorboard/compat/__init__.py)\n",
            "\n",
            "During handling of the above exception, another exception occurred:\n",
            "\n",
            "RuntimeError: module compiled against API version 0xe but this version of numpy is 0xd\n",
            "INFO 2023-02-14 14:16:14,676 tensorboard_hook.py:  90: Setting up SSL Tensorboard Hook...\n",
            "INFO 2023-02-14 14:16:14,676 tensorboard_hook.py: 102: Tensorboard config: log_params: True, log_params_freq: 310, log_params_gradients: True, log_activation_statistics: 0\n",
            "INFO 2023-02-14 14:16:14,677 trainer_main.py: 112: Using Distributed init method: tcp://localhost:56453, world_size: 1, rank: 0\n",
            "INFO 2023-02-14 14:16:14,678 distributed_c10d.py: 187: Added key: store_based_barrier_key:1 to store for rank: 0\n",
            "INFO 2023-02-14 14:16:14,678 trainer_main.py: 130: | initialized host 50e721256dd1 as rank 0 (0)\n",
            "INFO 2023-02-14 14:16:19,136 train_task.py: 181: Not using Automatic Mixed Precision\n",
            "INFO 2023-02-14 14:16:19,137 train_task.py: 455: Building model....\n",
            "INFO 2023-02-14 14:16:19,137 resnext.py:  64: ResNeXT trunk, supports activation checkpointing. Deactivated\n",
            "INFO 2023-02-14 14:16:19,137 resnext.py:  87: Building model: ResNeXt50-1x64d-w1-BatchNorm2d\n",
            "INFO 2023-02-14 14:16:19,771 model_helpers.py: 177: Using SyncBN group size: 1\n",
            "INFO 2023-02-14 14:16:19,771 model_helpers.py: 181: Converting BN layers to Apex SyncBN\n",
            "INFO 2023-02-14 14:16:19,771 distributed_c10d.py: 187: Added key: store_based_barrier_key:2 to store for rank: 0\n",
            "INFO 2023-02-14 14:16:19,778 train_task.py: 429: Initializing model from: /content/resnet50-19c8e357.pth\n",
            "INFO 2023-02-14 14:16:19,778 util.py: 276: Attempting to load checkpoint from /content/resnet50-19c8e357.pth\n",
            "INFO 2023-02-14 14:16:19,990 util.py: 281: Loaded checkpoint from /content/resnet50-19c8e357.pth\n",
            "INFO 2023-02-14 14:16:19,990 util.py: 240: Broadcasting checkpoint loaded from /content/resnet50-19c8e357.pth\n",
            "INFO 2023-02-14 14:16:23,059 train_task.py: 435: Checkpoint loaded: /content/resnet50-19c8e357.pth...\n",
            "INFO 2023-02-14 14:16:23,061 checkpoint.py: 885: Loaded: trunk._feature_blocks.conv1.weight                              of shape: torch.Size([64, 3, 7, 7]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,061 checkpoint.py: 885: Loaded: trunk._feature_blocks.bn1.weight                                of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,061 checkpoint.py: 885: Loaded: trunk._feature_blocks.bn1.bias                                  of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,061 checkpoint.py: 885: Loaded: trunk._feature_blocks.bn1.running_mean                          of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,061 checkpoint.py: 885: Loaded: trunk._feature_blocks.bn1.running_var                           of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,061 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,062 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.conv1.weight                     of shape: torch.Size([64, 64, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,062 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.bn1.weight                       of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,062 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.bn1.bias                         of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,062 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.bn1.running_mean                 of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,062 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.bn1.running_var                  of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,062 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer1.0.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,062 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.conv2.weight                     of shape: torch.Size([64, 64, 3, 3]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,062 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.bn2.weight                       of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,062 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.bn2.bias                         of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,062 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.bn2.running_mean                 of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,062 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.bn2.running_var                  of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,063 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer1.0.bn2.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,063 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.conv3.weight                     of shape: torch.Size([256, 64, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,063 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.bn3.weight                       of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,063 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.bn3.bias                         of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,063 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.bn3.running_mean                 of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,063 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.bn3.running_var                  of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,063 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer1.0.bn3.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,063 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.downsample.0.weight              of shape: torch.Size([256, 64, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,063 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.downsample.1.weight              of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,063 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.downsample.1.bias                of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,063 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.downsample.1.running_mean        of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,063 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.0.downsample.1.running_var         of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,064 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer1.0.downsample.1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,064 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.1.conv1.weight                     of shape: torch.Size([64, 256, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,064 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.1.bn1.weight                       of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,064 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.1.bn1.bias                         of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,064 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.1.bn1.running_mean                 of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,064 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.1.bn1.running_var                  of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,064 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer1.1.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,064 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.1.conv2.weight                     of shape: torch.Size([64, 64, 3, 3]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,064 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.1.bn2.weight                       of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,064 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.1.bn2.bias                         of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,064 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.1.bn2.running_mean                 of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,064 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.1.bn2.running_var                  of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,064 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer1.1.bn2.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,065 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.1.conv3.weight                     of shape: torch.Size([256, 64, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,065 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.1.bn3.weight                       of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,065 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.1.bn3.bias                         of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,065 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.1.bn3.running_mean                 of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,065 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.1.bn3.running_var                  of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,065 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer1.1.bn3.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,065 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.2.conv1.weight                     of shape: torch.Size([64, 256, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,065 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.2.bn1.weight                       of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,065 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.2.bn1.bias                         of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,065 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.2.bn1.running_mean                 of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,065 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.2.bn1.running_var                  of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,065 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer1.2.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,066 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.2.conv2.weight                     of shape: torch.Size([64, 64, 3, 3]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,066 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.2.bn2.weight                       of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,066 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.2.bn2.bias                         of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,066 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.2.bn2.running_mean                 of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,066 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.2.bn2.running_var                  of shape: torch.Size([64]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,066 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer1.2.bn2.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,066 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.2.conv3.weight                     of shape: torch.Size([256, 64, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,066 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.2.bn3.weight                       of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,066 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.2.bn3.bias                         of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,066 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.2.bn3.running_mean                 of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,066 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer1.2.bn3.running_var                  of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,066 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer1.2.bn3.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,067 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.conv1.weight                     of shape: torch.Size([128, 256, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,067 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.bn1.weight                       of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,067 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.bn1.bias                         of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,067 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.bn1.running_mean                 of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,067 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.bn1.running_var                  of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,067 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer2.0.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,067 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.conv2.weight                     of shape: torch.Size([128, 128, 3, 3]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,067 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.bn2.weight                       of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,067 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.bn2.bias                         of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,067 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.bn2.running_mean                 of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,068 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.bn2.running_var                  of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,068 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer2.0.bn2.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,068 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.conv3.weight                     of shape: torch.Size([512, 128, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,068 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.bn3.weight                       of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,068 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.bn3.bias                         of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,068 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.bn3.running_mean                 of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,068 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.bn3.running_var                  of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,068 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer2.0.bn3.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,068 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.downsample.0.weight              of shape: torch.Size([512, 256, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,068 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.downsample.1.weight              of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,069 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.downsample.1.bias                of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,069 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.downsample.1.running_mean        of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,069 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.0.downsample.1.running_var         of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,069 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer2.0.downsample.1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,069 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.1.conv1.weight                     of shape: torch.Size([128, 512, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,069 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.1.bn1.weight                       of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,069 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.1.bn1.bias                         of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,069 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.1.bn1.running_mean                 of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,069 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.1.bn1.running_var                  of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,069 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer2.1.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,070 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.1.conv2.weight                     of shape: torch.Size([128, 128, 3, 3]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,070 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.1.bn2.weight                       of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,070 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.1.bn2.bias                         of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,070 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.1.bn2.running_mean                 of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,070 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.1.bn2.running_var                  of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,070 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer2.1.bn2.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,070 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.1.conv3.weight                     of shape: torch.Size([512, 128, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,070 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.1.bn3.weight                       of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,070 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.1.bn3.bias                         of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,070 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.1.bn3.running_mean                 of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,070 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.1.bn3.running_var                  of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,071 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer2.1.bn3.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,071 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.2.conv1.weight                     of shape: torch.Size([128, 512, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,071 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.2.bn1.weight                       of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,071 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.2.bn1.bias                         of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,071 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.2.bn1.running_mean                 of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,071 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.2.bn1.running_var                  of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,071 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer2.2.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,071 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.2.conv2.weight                     of shape: torch.Size([128, 128, 3, 3]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,071 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.2.bn2.weight                       of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,072 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.2.bn2.bias                         of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,072 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.2.bn2.running_mean                 of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,075 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.2.bn2.running_var                  of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,075 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer2.2.bn2.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,075 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.2.conv3.weight                     of shape: torch.Size([512, 128, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,075 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.2.bn3.weight                       of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,075 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.2.bn3.bias                         of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,076 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.2.bn3.running_mean                 of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,076 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.2.bn3.running_var                  of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,076 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer2.2.bn3.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,076 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.3.conv1.weight                     of shape: torch.Size([128, 512, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,077 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.3.bn1.weight                       of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,077 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.3.bn1.bias                         of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,077 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.3.bn1.running_mean                 of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,077 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.3.bn1.running_var                  of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,077 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer2.3.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,077 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.3.conv2.weight                     of shape: torch.Size([128, 128, 3, 3]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,077 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.3.bn2.weight                       of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,077 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.3.bn2.bias                         of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,078 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.3.bn2.running_mean                 of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,078 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.3.bn2.running_var                  of shape: torch.Size([128]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,078 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer2.3.bn2.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,078 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.3.conv3.weight                     of shape: torch.Size([512, 128, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,078 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.3.bn3.weight                       of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,078 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.3.bn3.bias                         of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,078 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.3.bn3.running_mean                 of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,078 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer2.3.bn3.running_var                  of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,078 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer2.3.bn3.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,079 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.conv1.weight                     of shape: torch.Size([256, 512, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,079 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.bn1.weight                       of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,079 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.bn1.bias                         of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,079 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.bn1.running_mean                 of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,079 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.bn1.running_var                  of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,079 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.0.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,080 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.conv2.weight                     of shape: torch.Size([256, 256, 3, 3]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,080 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.bn2.weight                       of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,080 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.bn2.bias                         of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,080 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.bn2.running_mean                 of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,080 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.bn2.running_var                  of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,080 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.0.bn2.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,081 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.conv3.weight                     of shape: torch.Size([1024, 256, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,081 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.bn3.weight                       of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,081 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.bn3.bias                         of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,081 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.bn3.running_mean                 of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,081 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.bn3.running_var                  of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,081 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.0.bn3.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,082 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.downsample.0.weight              of shape: torch.Size([1024, 512, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,082 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.downsample.1.weight              of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,082 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.downsample.1.bias                of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,082 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.downsample.1.running_mean        of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,082 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.0.downsample.1.running_var         of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,082 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.0.downsample.1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,083 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.1.conv1.weight                     of shape: torch.Size([256, 1024, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,083 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.1.bn1.weight                       of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,083 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.1.bn1.bias                         of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,083 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.1.bn1.running_mean                 of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,083 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.1.bn1.running_var                  of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,083 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.1.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,084 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.1.conv2.weight                     of shape: torch.Size([256, 256, 3, 3]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,084 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.1.bn2.weight                       of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,084 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.1.bn2.bias                         of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,084 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.1.bn2.running_mean                 of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,084 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.1.bn2.running_var                  of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,084 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.1.bn2.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,084 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.1.conv3.weight                     of shape: torch.Size([1024, 256, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,085 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.1.bn3.weight                       of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,085 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.1.bn3.bias                         of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,085 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.1.bn3.running_mean                 of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,085 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.1.bn3.running_var                  of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,085 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.1.bn3.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,085 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.2.conv1.weight                     of shape: torch.Size([256, 1024, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,085 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.2.bn1.weight                       of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,085 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.2.bn1.bias                         of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,086 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.2.bn1.running_mean                 of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,086 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.2.bn1.running_var                  of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,086 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.2.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,086 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.2.conv2.weight                     of shape: torch.Size([256, 256, 3, 3]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,086 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.2.bn2.weight                       of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,086 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.2.bn2.bias                         of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,086 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.2.bn2.running_mean                 of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,087 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.2.bn2.running_var                  of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,087 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.2.bn2.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,087 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.2.conv3.weight                     of shape: torch.Size([1024, 256, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,087 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.2.bn3.weight                       of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,087 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.2.bn3.bias                         of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,087 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.2.bn3.running_mean                 of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,087 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.2.bn3.running_var                  of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,087 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.2.bn3.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,088 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.3.conv1.weight                     of shape: torch.Size([256, 1024, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,088 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.3.bn1.weight                       of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,088 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.3.bn1.bias                         of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,088 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.3.bn1.running_mean                 of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,088 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.3.bn1.running_var                  of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,088 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.3.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,089 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.3.conv2.weight                     of shape: torch.Size([256, 256, 3, 3]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,089 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.3.bn2.weight                       of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,089 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.3.bn2.bias                         of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,089 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.3.bn2.running_mean                 of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,089 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.3.bn2.running_var                  of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,089 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.3.bn2.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,089 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.3.conv3.weight                     of shape: torch.Size([1024, 256, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,089 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.3.bn3.weight                       of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,089 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.3.bn3.bias                         of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,090 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.3.bn3.running_mean                 of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,090 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.3.bn3.running_var                  of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,090 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.3.bn3.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,090 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.4.conv1.weight                     of shape: torch.Size([256, 1024, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,090 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.4.bn1.weight                       of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,090 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.4.bn1.bias                         of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,090 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.4.bn1.running_mean                 of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,090 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.4.bn1.running_var                  of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,090 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.4.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,091 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.4.conv2.weight                     of shape: torch.Size([256, 256, 3, 3]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,091 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.4.bn2.weight                       of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,091 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.4.bn2.bias                         of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,091 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.4.bn2.running_mean                 of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,091 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.4.bn2.running_var                  of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,091 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.4.bn2.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,092 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.4.conv3.weight                     of shape: torch.Size([1024, 256, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,092 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.4.bn3.weight                       of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,092 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.4.bn3.bias                         of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,092 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.4.bn3.running_mean                 of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,092 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.4.bn3.running_var                  of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,092 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.4.bn3.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,092 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.5.conv1.weight                     of shape: torch.Size([256, 1024, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,092 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.5.bn1.weight                       of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,092 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.5.bn1.bias                         of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,092 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.5.bn1.running_mean                 of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,177 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.5.bn1.running_var                  of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,177 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.5.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,178 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.5.conv2.weight                     of shape: torch.Size([256, 256, 3, 3]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,178 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.5.bn2.weight                       of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,178 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.5.bn2.bias                         of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,178 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.5.bn2.running_mean                 of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,179 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.5.bn2.running_var                  of shape: torch.Size([256]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,179 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.5.bn2.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,179 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.5.conv3.weight                     of shape: torch.Size([1024, 256, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,179 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.5.bn3.weight                       of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,179 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.5.bn3.bias                         of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,180 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.5.bn3.running_mean                 of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,180 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer3.5.bn3.running_var                  of shape: torch.Size([1024]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,180 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer3.5.bn3.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,180 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.conv1.weight                     of shape: torch.Size([512, 1024, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,181 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.bn1.weight                       of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,181 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.bn1.bias                         of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,181 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.bn1.running_mean                 of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,181 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.bn1.running_var                  of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,181 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer4.0.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,183 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.conv2.weight                     of shape: torch.Size([512, 512, 3, 3]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,183 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.bn2.weight                       of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,184 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.bn2.bias                         of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,184 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.bn2.running_mean                 of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,184 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.bn2.running_var                  of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,184 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer4.0.bn2.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,185 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.conv3.weight                     of shape: torch.Size([2048, 512, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,185 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.bn3.weight                       of shape: torch.Size([2048]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,185 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.bn3.bias                         of shape: torch.Size([2048]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,185 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.bn3.running_mean                 of shape: torch.Size([2048]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,185 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.bn3.running_var                  of shape: torch.Size([2048]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,185 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer4.0.bn3.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,187 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.downsample.0.weight              of shape: torch.Size([2048, 1024, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,187 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.downsample.1.weight              of shape: torch.Size([2048]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,187 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.downsample.1.bias                of shape: torch.Size([2048]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,187 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.downsample.1.running_mean        of shape: torch.Size([2048]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,187 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.0.downsample.1.running_var         of shape: torch.Size([2048]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,187 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer4.0.downsample.1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,188 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.1.conv1.weight                     of shape: torch.Size([512, 2048, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,188 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.1.bn1.weight                       of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,188 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.1.bn1.bias                         of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,188 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.1.bn1.running_mean                 of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,188 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.1.bn1.running_var                  of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,189 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer4.1.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,190 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.1.conv2.weight                     of shape: torch.Size([512, 512, 3, 3]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,191 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.1.bn2.weight                       of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,191 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.1.bn2.bias                         of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,191 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.1.bn2.running_mean                 of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,191 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.1.bn2.running_var                  of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,191 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer4.1.bn2.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,192 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.1.conv3.weight                     of shape: torch.Size([2048, 512, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,192 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.1.bn3.weight                       of shape: torch.Size([2048]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,192 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.1.bn3.bias                         of shape: torch.Size([2048]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,192 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.1.bn3.running_mean                 of shape: torch.Size([2048]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,192 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.1.bn3.running_var                  of shape: torch.Size([2048]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,192 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer4.1.bn3.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,193 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.2.conv1.weight                     of shape: torch.Size([512, 2048, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,193 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.2.bn1.weight                       of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,193 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.2.bn1.bias                         of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,193 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.2.bn1.running_mean                 of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,193 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.2.bn1.running_var                  of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,193 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer4.2.bn1.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,195 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.2.conv2.weight                     of shape: torch.Size([512, 512, 3, 3]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,195 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.2.bn2.weight                       of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,195 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.2.bn2.bias                         of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,195 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.2.bn2.running_mean                 of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,195 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.2.bn2.running_var                  of shape: torch.Size([512]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,196 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer4.2.bn2.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,196 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.2.conv3.weight                     of shape: torch.Size([2048, 512, 1, 1]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,197 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.2.bn3.weight                       of shape: torch.Size([2048]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,197 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.2.bn3.bias                         of shape: torch.Size([2048]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,197 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.2.bn3.running_mean                 of shape: torch.Size([2048]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,197 checkpoint.py: 885: Loaded: trunk._feature_blocks.layer4.2.bn3.running_var                  of shape: torch.Size([2048]) from checkpoint\n",
            "INFO 2023-02-14 14:16:23,197 checkpoint.py: 851: Ignored layer:\ttrunk._feature_blocks.layer4.2.bn3.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,197 checkpoint.py: 894: Not found:\t\theads.0.channel_bn.weight, not initialized\n",
            "INFO 2023-02-14 14:16:23,197 checkpoint.py: 894: Not found:\t\theads.0.channel_bn.bias, not initialized\n",
            "INFO 2023-02-14 14:16:23,197 checkpoint.py: 894: Not found:\t\theads.0.channel_bn.running_mean, not initialized\n",
            "INFO 2023-02-14 14:16:23,197 checkpoint.py: 894: Not found:\t\theads.0.channel_bn.running_var, not initialized\n",
            "INFO 2023-02-14 14:16:23,197 checkpoint.py: 851: Ignored layer:\theads.0.channel_bn.num_batches_tracked\n",
            "INFO 2023-02-14 14:16:23,197 checkpoint.py: 894: Not found:\t\theads.0.clf.clf.0.weight, not initialized\n",
            "INFO 2023-02-14 14:16:23,197 checkpoint.py: 894: Not found:\t\theads.0.clf.clf.0.bias, not initialized\n",
            "INFO 2023-02-14 14:16:23,197 checkpoint.py: 901: Extra layers not loaded from checkpoint: ['trunk._feature_blocks.fc.weight', 'trunk._feature_blocks.fc.bias', 'trunk._feature_blocks.type']\n",
            "INFO 2023-02-14 14:16:23,198 train_task.py: 656: Broadcast model BN buffers from primary on every forward pass\n",
            "INFO 2023-02-14 14:16:23,198 classification_task.py: 387: Synchronized Batch Normalization is disabled\n",
            "INFO 2023-02-14 14:16:23,235 optimizer_helper.py: 293: \n",
            "Trainable params: 163, \n",
            "Non-Trainable params: 0, \n",
            "Trunk Regularized Parameters: 53, \n",
            "Trunk Unregularized Parameters 106, \n",
            "Head Regularized Parameters: 2, \n",
            "Head Unregularized Parameters: 2 \n",
            "Remaining Regularized Parameters: 0 \n",
            "Remaining Unregularized Parameters: 0\n",
            "INFO 2023-02-14 14:16:23,236 ssl_dataset.py: 156: Rank: 0 split: TEST Data files:\n",
            "['/content/data/']\n",
            "INFO 2023-02-14 14:16:23,236 ssl_dataset.py: 159: Rank: 0 split: TEST Label files:\n",
            "[]\n",
            "INFO 2023-02-14 14:16:23,240 ssl_dataset.py: 156: Rank: 0 split: TRAIN Data files:\n",
            "['/content/data/']\n",
            "INFO 2023-02-14 14:16:23,240 ssl_dataset.py: 159: Rank: 0 split: TRAIN Label files:\n",
            "[]\n",
            "INFO 2023-02-14 14:16:23,256 misc.py: 161: Set start method of multiprocessing to forkserver\n",
            "INFO 2023-02-14 14:16:23,256 __init__.py: 126: Created the Distributed Sampler....\n",
            "INFO 2023-02-14 14:16:23,256 __init__.py: 101: Distributed Sampler config:\n",
            "{'num_replicas': 1, 'rank': 0, 'epoch': 0, 'num_samples': 10000, 'total_size': 10000, 'shuffle': True, 'seed': 0}\n",
            "/usr/local/lib/python3.8/dist-packages/torch/utils/data/dataloader.py:474: UserWarning: This DataLoader will create 5 worker processes in total. Our suggested max number of worker in current system is 2, which is smaller than what this DataLoader is going to create. Please be aware that excessive worker creation might get DataLoader running slow or even freeze, lower the worker number to avoid potential slowness/freeze if necessary.\n",
            "  warnings.warn(_create_warning_msg(\n",
            "INFO 2023-02-14 14:16:23,256 __init__.py: 215: Wrapping the dataloader to async device copies\n",
            "INFO 2023-02-14 14:16:23,257 misc.py: 161: Set start method of multiprocessing to forkserver\n",
            "INFO 2023-02-14 14:16:23,257 __init__.py: 126: Created the Distributed Sampler....\n",
            "INFO 2023-02-14 14:16:23,257 __init__.py: 101: Distributed Sampler config:\n",
            "{'num_replicas': 1, 'rank': 0, 'epoch': 0, 'num_samples': 60000, 'total_size': 60000, 'shuffle': True, 'seed': 0}\n",
            "INFO 2023-02-14 14:16:23,257 __init__.py: 215: Wrapping the dataloader to async device copies\n",
            "INFO 2023-02-14 14:16:23,257 train_task.py: 384: Building loss...\n",
            "INFO 2023-02-14 14:16:23,257 trainer_main.py: 268: Training 1 epochs\n",
            "INFO 2023-02-14 14:16:23,258 trainer_main.py: 269: One epoch = 938 iterations.\n",
            "INFO 2023-02-14 14:16:23,258 trainer_main.py: 270: Total 60000 samples in one epoch\n",
            "INFO 2023-02-14 14:16:23,258 trainer_main.py: 276: Total 938 iterations for training\n",
            "INFO 2023-02-14 14:16:23,419 logger.py:  84: Tue Feb 14 14:16:23 2023       \n",
            "+-----------------------------------------------------------------------------+\n",
            "| NVIDIA-SMI 510.47.03    Driver Version: 510.47.03    CUDA Version: 11.6     |\n",
            "|-------------------------------+----------------------+----------------------+\n",
            "| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |\n",
            "| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |\n",
            "|                               |                      |               MIG M. |\n",
            "|===============================+======================+======================|\n",
            "|   0  Tesla T4            Off  | 00000000:00:04.0 Off |                    0 |\n",
            "| N/A   70C    P0    31W /  70W |   3813MiB / 15360MiB |      4%      Default |\n",
            "|                               |                      |                  N/A |\n",
            "+-------------------------------+----------------------+----------------------+\n",
            "                                                                               \n",
            "+-----------------------------------------------------------------------------+\n",
            "| Processes:                                                                  |\n",
            "|  GPU   GI   CI        PID   Type   Process name                  GPU Memory |\n",
            "|        ID   ID                                                   Usage      |\n",
            "|=============================================================================|\n",
            "|    0   N/A  N/A      2206      C                                    2635MiB |\n",
            "|    0   N/A  N/A   1706789      C                                    1175MiB |\n",
            "+-----------------------------------------------------------------------------+\n",
            "\n",
            "INFO 2023-02-14 14:16:23,420 trainer_main.py: 173: Model is:\n",
            " Classy <class 'vissl.models.base_ssl_model.BaseSSLMultiInputOutputModel'>:\n",
            "BaseSSLMultiInputOutputModel(\n",
            "  (_heads): ModuleDict()\n",
            "  (trunk): ResNeXt(\n",
            "    (_feature_blocks): ModuleDict(\n",
            "      (conv1): Conv2d(3, 64, kernel_size=(7, 7), stride=(2, 2), padding=(3, 3), bias=False)\n",
            "      (bn1): SyncBatchNorm(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "      (conv1_relu): ReLU(inplace=True)\n",
            "      (maxpool): MaxPool2d(kernel_size=3, stride=2, padding=1, dilation=1, ceil_mode=False)\n",
            "      (layer1): Sequential(\n",
            "        (0): Bottleneck(\n",
            "          (conv1): Conv2d(64, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn1): SyncBatchNorm(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
            "          (bn2): SyncBatchNorm(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv3): Conv2d(64, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn3): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (relu): ReLU(inplace=True)\n",
            "          (downsample): Sequential(\n",
            "            (0): Conv2d(64, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "            (1): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          )\n",
            "        )\n",
            "        (1): Bottleneck(\n",
            "          (conv1): Conv2d(256, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn1): SyncBatchNorm(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
            "          (bn2): SyncBatchNorm(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv3): Conv2d(64, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn3): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (relu): ReLU(inplace=True)\n",
            "        )\n",
            "        (2): Bottleneck(\n",
            "          (conv1): Conv2d(256, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn1): SyncBatchNorm(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
            "          (bn2): SyncBatchNorm(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv3): Conv2d(64, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn3): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (relu): ReLU(inplace=True)\n",
            "        )\n",
            "      )\n",
            "      (layer2): Sequential(\n",
            "        (0): Bottleneck(\n",
            "          (conv1): Conv2d(256, 128, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn1): SyncBatchNorm(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv2): Conv2d(128, 128, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
            "          (bn2): SyncBatchNorm(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv3): Conv2d(128, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn3): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (relu): ReLU(inplace=True)\n",
            "          (downsample): Sequential(\n",
            "            (0): Conv2d(256, 512, kernel_size=(1, 1), stride=(2, 2), bias=False)\n",
            "            (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          )\n",
            "        )\n",
            "        (1): Bottleneck(\n",
            "          (conv1): Conv2d(512, 128, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn1): SyncBatchNorm(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv2): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
            "          (bn2): SyncBatchNorm(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv3): Conv2d(128, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn3): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (relu): ReLU(inplace=True)\n",
            "        )\n",
            "        (2): Bottleneck(\n",
            "          (conv1): Conv2d(512, 128, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn1): SyncBatchNorm(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv2): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
            "          (bn2): SyncBatchNorm(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv3): Conv2d(128, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn3): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (relu): ReLU(inplace=True)\n",
            "        )\n",
            "        (3): Bottleneck(\n",
            "          (conv1): Conv2d(512, 128, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn1): SyncBatchNorm(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv2): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
            "          (bn2): SyncBatchNorm(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv3): Conv2d(128, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn3): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (relu): ReLU(inplace=True)\n",
            "        )\n",
            "      )\n",
            "      (layer3): Sequential(\n",
            "        (0): Bottleneck(\n",
            "          (conv1): Conv2d(512, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn1): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv2): Conv2d(256, 256, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
            "          (bn2): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv3): Conv2d(256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn3): SyncBatchNorm(1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (relu): ReLU(inplace=True)\n",
            "          (downsample): Sequential(\n",
            "            (0): Conv2d(512, 1024, kernel_size=(1, 1), stride=(2, 2), bias=False)\n",
            "            (1): SyncBatchNorm(1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          )\n",
            "        )\n",
            "        (1): Bottleneck(\n",
            "          (conv1): Conv2d(1024, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn1): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv2): Conv2d(256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
            "          (bn2): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv3): Conv2d(256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn3): SyncBatchNorm(1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (relu): ReLU(inplace=True)\n",
            "        )\n",
            "        (2): Bottleneck(\n",
            "          (conv1): Conv2d(1024, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn1): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv2): Conv2d(256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
            "          (bn2): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv3): Conv2d(256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn3): SyncBatchNorm(1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (relu): ReLU(inplace=True)\n",
            "        )\n",
            "        (3): Bottleneck(\n",
            "          (conv1): Conv2d(1024, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn1): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv2): Conv2d(256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
            "          (bn2): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv3): Conv2d(256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn3): SyncBatchNorm(1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (relu): ReLU(inplace=True)\n",
            "        )\n",
            "        (4): Bottleneck(\n",
            "          (conv1): Conv2d(1024, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn1): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv2): Conv2d(256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
            "          (bn2): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv3): Conv2d(256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn3): SyncBatchNorm(1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (relu): ReLU(inplace=True)\n",
            "        )\n",
            "        (5): Bottleneck(\n",
            "          (conv1): Conv2d(1024, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn1): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv2): Conv2d(256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
            "          (bn2): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv3): Conv2d(256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn3): SyncBatchNorm(1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (relu): ReLU(inplace=True)\n",
            "        )\n",
            "      )\n",
            "      (layer4): Sequential(\n",
            "        (0): Bottleneck(\n",
            "          (conv1): Conv2d(1024, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv2): Conv2d(512, 512, kernel_size=(3, 3), stride=(<SUPPORTED_L4_STRIDE.two: 2>, <SUPPORTED_L4_STRIDE.two: 2>), padding=(1, 1), bias=False)\n",
            "          (bn2): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv3): Conv2d(512, 2048, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn3): SyncBatchNorm(2048, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (relu): ReLU(inplace=True)\n",
            "          (downsample): Sequential(\n",
            "            (0): Conv2d(1024, 2048, kernel_size=(1, 1), stride=(<SUPPORTED_L4_STRIDE.two: 2>, <SUPPORTED_L4_STRIDE.two: 2>), bias=False)\n",
            "            (1): SyncBatchNorm(2048, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          )\n",
            "        )\n",
            "        (1): Bottleneck(\n",
            "          (conv1): Conv2d(2048, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv2): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
            "          (bn2): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv3): Conv2d(512, 2048, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn3): SyncBatchNorm(2048, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (relu): ReLU(inplace=True)\n",
            "        )\n",
            "        (2): Bottleneck(\n",
            "          (conv1): Conv2d(2048, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv2): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
            "          (bn2): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (conv3): Conv2d(512, 2048, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
            "          (bn3): SyncBatchNorm(2048, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "          (relu): ReLU(inplace=True)\n",
            "        )\n",
            "      )\n",
            "      (avgpool): AdaptiveAvgPool2d(output_size=(1, 1))\n",
            "      (flatten): Flatten()\n",
            "    )\n",
            "  )\n",
            "  (heads): ModuleList(\n",
            "    (0): LinearEvalMLP(\n",
            "      (channel_bn): SyncBatchNorm(2048, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
            "      (clf): MLP(\n",
            "        (clf): Sequential(\n",
            "          (0): Linear(in_features=2048, out_features=10, bias=True)\n",
            "        )\n",
            "      )\n",
            "    )\n",
            "  )\n",
            ")\n",
            "INFO 2023-02-14 14:16:23,488 trainer_main.py: 174: Loss is: CrossEntropyMultipleOutputSingleTargetLoss(\n",
            "  (criterion): CrossEntropyMultipleOutputSingleTargetCriterion(\n",
            "    (_losses): ModuleList()\n",
            "  )\n",
            ")\n",
            "INFO 2023-02-14 14:16:23,489 trainer_main.py: 175: Starting training....\n",
            "INFO 2023-02-14 14:16:23,489 __init__.py: 101: Distributed Sampler config:\n",
            "{'num_replicas': 1, 'rank': 0, 'epoch': 0, 'num_samples': 60000, 'total_size': 60000, 'shuffle': True, 'seed': 0}\n",
            "/usr/local/lib/python3.8/dist-packages/torch/utils/data/dataloader.py:474: UserWarning: This DataLoader will create 5 worker processes in total. Our suggested max number of worker in current system is 2, which is smaller than what this DataLoader is going to create. Please be aware that excessive worker creation might get DataLoader running slow or even freeze, lower the worker number to avoid potential slowness/freeze if necessary.\n",
            "  warnings.warn(_create_warning_msg(\n",
            "** fvcore version of PathManager will be deprecated soon. **\n",
            "** Please migrate to the version in iopath repo. **\n",
            "https://github.com/facebookresearch/iopath \n",
            "\n",
            "** fvcore version of PathManager will be deprecated soon. **\n",
            "** Please migrate to the version in iopath repo. **\n",
            "https://github.com/facebookresearch/iopath \n",
            "\n",
            "** fvcore version of PathManager will be deprecated soon. **\n",
            "** Please migrate to the version in iopath repo. **\n",
            "https://github.com/facebookresearch/iopath \n",
            "\n",
            "** fvcore version of PathManager will be deprecated soon. **\n",
            "** Please migrate to the version in iopath repo. **\n",
            "https://github.com/facebookresearch/iopath \n",
            "\n",
            "** fvcore version of PathManager will be deprecated soon. **\n",
            "** Please migrate to the version in iopath repo. **\n",
            "https://github.com/facebookresearch/iopath \n",
            "\n",
            "INFO 2023-02-14 14:16:34,597 trainer_main.py: 333: Phase advanced. Rank: 0\n",
            "INFO 2023-02-14 14:16:34,598 log_hooks.py:  76: ========= Memory Summary at on_phase_start =======\n",
            "|===========================================================================|\n",
            "|                  PyTorch CUDA memory summary, device ID 0                 |\n",
            "|---------------------------------------------------------------------------|\n",
            "|            CUDA OOMs: 0            |        cudaMalloc retries: 0         |\n",
            "|===========================================================================|\n",
            "|        Metric         | Cur Usage  | Peak Usage | Tot Alloc  | Tot Freed  |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Allocated memory      |  129816 KB |  129816 KB |  129816 KB |     512 B  |\n",
            "|       from large pool |  111872 KB |  111872 KB |  111872 KB |       0 B  |\n",
            "|       from small pool |   17944 KB |   17944 KB |   17944 KB |     512 B  |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Active memory         |  129816 KB |  129816 KB |  129816 KB |     512 B  |\n",
            "|       from large pool |  111872 KB |  111872 KB |  111872 KB |       0 B  |\n",
            "|       from small pool |   17944 KB |   17944 KB |   17944 KB |     512 B  |\n",
            "|---------------------------------------------------------------------------|\n",
            "| GPU reserved memory   |  161792 KB |  161792 KB |  161792 KB |       0 B  |\n",
            "|       from large pool |  141312 KB |  141312 KB |  141312 KB |       0 B  |\n",
            "|       from small pool |   20480 KB |   20480 KB |   20480 KB |       0 B  |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Non-releasable memory |   31976 KB |   31977 KB |   91546 KB |   59570 KB |\n",
            "|       from large pool |   29440 KB |   29440 KB |   75776 KB |   46336 KB |\n",
            "|       from small pool |    2536 KB |    2537 KB |   15770 KB |   13234 KB |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Allocations           |     329    |     329    |     330    |       1    |\n",
            "|       from large pool |      18    |      18    |      18    |       0    |\n",
            "|       from small pool |     311    |     311    |     312    |       1    |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Active allocs         |     329    |     329    |     330    |       1    |\n",
            "|       from large pool |      18    |      18    |      18    |       0    |\n",
            "|       from small pool |     311    |     311    |     312    |       1    |\n",
            "|---------------------------------------------------------------------------|\n",
            "| GPU reserved segments |      16    |      16    |      16    |       0    |\n",
            "|       from large pool |       6    |       6    |       6    |       0    |\n",
            "|       from small pool |      10    |      10    |      10    |       0    |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Non-releasable allocs |       9    |       9    |      17    |       8    |\n",
            "|       from large pool |       6    |       6    |       6    |       0    |\n",
            "|       from small pool |       3    |       5    |      11    |       8    |\n",
            "|===========================================================================|\n",
            "\n",
            "\n",
            "INFO 2023-02-14 14:16:38,426 state_update_hooks.py: 115: Starting phase 0 [train]\n",
            "INFO 2023-02-14 14:16:39,691 log_hooks.py:  76: ========= Memory Summary at on_forward =======\n",
            "|===========================================================================|\n",
            "|                  PyTorch CUDA memory summary, device ID 0                 |\n",
            "|---------------------------------------------------------------------------|\n",
            "|            CUDA OOMs: 0            |        cudaMalloc retries: 0         |\n",
            "|===========================================================================|\n",
            "|        Metric         | Cur Usage  | Peak Usage | Tot Alloc  | Tot Freed  |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Allocated memory      |    5372 MB |    7826 MB |   26208 MB |   20835 MB |\n",
            "|       from large pool |    5353 MB |    7808 MB |   26187 MB |   20833 MB |\n",
            "|       from small pool |      18 MB |      18 MB |      21 MB |       2 MB |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Active memory         |    5372 MB |    7826 MB |   26208 MB |   20835 MB |\n",
            "|       from large pool |    5353 MB |    7808 MB |   26187 MB |   20833 MB |\n",
            "|       from small pool |      18 MB |      18 MB |      21 MB |       2 MB |\n",
            "|---------------------------------------------------------------------------|\n",
            "| GPU reserved memory   |    8208 MB |    9352 MB |   15652 MB |    7444 MB |\n",
            "|       from large pool |    8186 MB |    9332 MB |   15630 MB |    7444 MB |\n",
            "|       from small pool |      22 MB |      22 MB |      22 MB |       0 MB |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Non-releasable memory |  245096 KB |    1603 MB |   10952 MB |   10713 MB |\n",
            "|       from large pool |  241920 KB |    1600 MB |   10933 MB |   10697 MB |\n",
            "|       from small pool |    3176 KB |       3 MB |      19 MB |      15 MB |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Allocations           |     602    |     607    |    1493    |     891    |\n",
            "|       from large pool |     123    |     123    |     163    |      40    |\n",
            "|       from small pool |     479    |     484    |    1330    |     851    |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Active allocs         |     614    |     618    |    1493    |     879    |\n",
            "|       from large pool |     123    |     123    |     163    |      40    |\n",
            "|       from small pool |     491    |     495    |    1330    |     839    |\n",
            "|---------------------------------------------------------------------------|\n",
            "| GPU reserved segments |      32    |      32    |      37    |       5    |\n",
            "|       from large pool |      21    |      22    |      26    |       5    |\n",
            "|       from small pool |      11    |      11    |      11    |       0    |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Non-releasable allocs |      45    |      57    |     679    |     634    |\n",
            "|       from large pool |      15    |      16    |      31    |      16    |\n",
            "|       from small pool |      30    |      42    |     648    |     618    |\n",
            "|===========================================================================|\n",
            "\n",
            "\n",
            "INFO 2023-02-14 14:16:44,482 log_hooks.py:  76: ========= Memory Summary at on_backward =======\n",
            "|===========================================================================|\n",
            "|                  PyTorch CUDA memory summary, device ID 0                 |\n",
            "|---------------------------------------------------------------------------|\n",
            "|            CUDA OOMs: 0            |        cudaMalloc retries: 0         |\n",
            "|===========================================================================|\n",
            "|        Metric         | Cur Usage  | Peak Usage | Tot Alloc  | Tot Freed  |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Allocated memory      |  263605 KB |    7973 MB |   70144 MB |   69887 MB |\n",
            "|       from large pool |  227968 KB |    7955 MB |   70104 MB |   69881 MB |\n",
            "|       from small pool |   35637 KB |      34 MB |      40 MB |       5 MB |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Active memory         |  263605 KB |    7973 MB |   70144 MB |   69887 MB |\n",
            "|       from large pool |  227968 KB |    7955 MB |   70104 MB |   69881 MB |\n",
            "|       from small pool |   35637 KB |      34 MB |      40 MB |       5 MB |\n",
            "|---------------------------------------------------------------------------|\n",
            "| GPU reserved memory   |    3200 MB |    9352 MB |   21418 MB |   18218 MB |\n",
            "|       from large pool |    3162 MB |    9332 MB |   21380 MB |   18218 MB |\n",
            "|       from small pool |      38 MB |      38 MB |      38 MB |       0 MB |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Non-releasable memory |    2942 MB |    3332 MB |   40942 MB |   37999 MB |\n",
            "|       from large pool |    2939 MB |    3329 MB |   40910 MB |   37971 MB |\n",
            "|       from small pool |       3 MB |       4 MB |      31 MB |      28 MB |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Allocations           |     499    |     612    |    2131    |    1632    |\n",
            "|       from large pool |      36    |     126    |     414    |     378    |\n",
            "|       from small pool |     463    |     489    |    1717    |    1254    |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Active allocs         |     499    |     618    |    2131    |    1632    |\n",
            "|       from large pool |      36    |     126    |     414    |     378    |\n",
            "|       from small pool |     463    |     495    |    1717    |    1254    |\n",
            "|---------------------------------------------------------------------------|\n",
            "| GPU reserved segments |      30    |      37    |      50    |      20    |\n",
            "|       from large pool |      11    |      22    |      31    |      20    |\n",
            "|       from small pool |      19    |      19    |      19    |       0    |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Non-releasable allocs |      52    |      69    |    1065    |    1013    |\n",
            "|       from large pool |      14    |      19    |     151    |     137    |\n",
            "|       from small pool |      38    |      52    |     914    |     876    |\n",
            "|===========================================================================|\n",
            "\n",
            "\n",
            "INFO 2023-02-14 14:16:44,491 log_hooks.py:  76: ========= Memory Summary at on_update =======\n",
            "|===========================================================================|\n",
            "|                  PyTorch CUDA memory summary, device ID 0                 |\n",
            "|---------------------------------------------------------------------------|\n",
            "|            CUDA OOMs: 0            |        cudaMalloc retries: 0         |\n",
            "|===========================================================================|\n",
            "|        Metric         | Cur Usage  | Peak Usage | Tot Alloc  | Tot Freed  |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Allocated memory      |  356686 KB |    7973 MB |   70420 MB |   70072 MB |\n",
            "|       from large pool |  303360 KB |    7955 MB |   70329 MB |   70032 MB |\n",
            "|       from small pool |   53326 KB |      53 MB |      91 MB |      39 MB |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Active memory         |  356686 KB |    7973 MB |   70420 MB |   70072 MB |\n",
            "|       from large pool |  303360 KB |    7955 MB |   70329 MB |   70032 MB |\n",
            "|       from small pool |   53326 KB |      53 MB |      91 MB |      39 MB |\n",
            "|---------------------------------------------------------------------------|\n",
            "| GPU reserved memory   |    3220 MB |    9352 MB |   21438 MB |   18218 MB |\n",
            "|       from large pool |    3162 MB |    9332 MB |   21380 MB |   18218 MB |\n",
            "|       from small pool |      58 MB |      58 MB |      58 MB |       0 MB |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Non-releasable memory |    2871 MB |    3332 MB |   41143 MB |   38271 MB |\n",
            "|       from large pool |    2865 MB |    3329 MB |   41061 MB |   38195 MB |\n",
            "|       from small pool |       5 MB |       6 MB |      82 MB |      76 MB |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Allocations           |     662    |     663    |    2512    |    1850    |\n",
            "|       from large pool |      53    |     126    |     465    |     412    |\n",
            "|       from small pool |     609    |     610    |    2047    |    1438    |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Active allocs         |     662    |     663    |    2512    |    1850    |\n",
            "|       from large pool |      53    |     126    |     465    |     412    |\n",
            "|       from small pool |     609    |     610    |    2047    |    1438    |\n",
            "|---------------------------------------------------------------------------|\n",
            "| GPU reserved segments |      40    |      40    |      60    |      20    |\n",
            "|       from large pool |      11    |      22    |      31    |      20    |\n",
            "|       from small pool |      29    |      29    |      29    |       0    |\n",
            "|---------------------------------------------------------------------------|\n",
            "| Non-releasable allocs |      37    |      71    |    1174    |    1137    |\n",
            "|       from large pool |      16    |      19    |     172    |     156    |\n",
            "|       from small pool |      21    |      54    |    1002    |     981    |\n",
            "|===========================================================================|\n",
            "\n",
            "\n",
            "INFO 2023-02-14 14:16:44,491 tensorboard_hook.py: 236: Logging Parameter gradients. Iteration 0\n",
            "INFO 2023-02-14 14:16:47,593 tensorboard_hook.py: 255: Logging metrics. Iteration 0\n",
            "INFO 2023-02-14 14:16:47,595 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 0; lr: 0.0025; loss: 2.36162; btime(ms): 0; eta: 0:00:00; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:16:48,301 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 1; lr: 0.0025; loss: 2.11086; btime(ms): 24337; eta: 6:20:04; peak_mem(M): 7973; max_iterations: 938;\n",
            "INFO 2023-02-14 14:16:50,609 tensorboard_hook.py: 255: Logging metrics. Iteration 5\n",
            "INFO 2023-02-14 14:16:50,839 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 5; lr: 0.0025; loss: 1.22663; btime(ms): 5345; eta: 1:23:07; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:16:53,807 tensorboard_hook.py: 255: Logging metrics. Iteration 10\n",
            "INFO 2023-02-14 14:16:54,036 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 10; lr: 0.0025; loss: 0.45048; btime(ms): 2991; eta: 0:46:15; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:16:57,008 tensorboard_hook.py: 255: Logging metrics. Iteration 15\n",
            "INFO 2023-02-14 14:16:57,243 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 15; lr: 0.0025; loss: 0.21688; btime(ms): 2207; eta: 0:33:57; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:00,234 tensorboard_hook.py: 255: Logging metrics. Iteration 20\n",
            "INFO 2023-02-14 14:17:00,470 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 20; lr: 0.0025; loss: 0.07088; btime(ms): 1816; eta: 0:27:47; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:03,496 tensorboard_hook.py: 255: Logging metrics. Iteration 25\n",
            "INFO 2023-02-14 14:17:03,735 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 25; lr: 0.0025; loss: 0.167; btime(ms): 1583; eta: 0:24:05; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:06,819 tensorboard_hook.py: 255: Logging metrics. Iteration 30\n",
            "INFO 2023-02-14 14:17:07,064 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 30; lr: 0.0025; loss: 0.08164; btime(ms): 1429; eta: 0:21:38; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:10,165 tensorboard_hook.py: 255: Logging metrics. Iteration 35\n",
            "INFO 2023-02-14 14:17:10,406 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 35; lr: 0.0025; loss: 0.05063; btime(ms): 1321; eta: 0:19:52; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:13,508 tensorboard_hook.py: 255: Logging metrics. Iteration 40\n",
            "INFO 2023-02-14 14:17:13,749 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 40; lr: 0.0025; loss: 0.04043; btime(ms): 1239; eta: 0:18:33; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:16,849 tensorboard_hook.py: 255: Logging metrics. Iteration 45\n",
            "INFO 2023-02-14 14:17:17,092 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 45; lr: 0.0025; loss: 0.05849; btime(ms): 1176; eta: 0:17:30; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:20,013 logger.py:  84: Tue Feb 14 14:17:19 2023       \n",
            "+-----------------------------------------------------------------------------+\n",
            "| NVIDIA-SMI 510.47.03    Driver Version: 510.47.03    CUDA Version: 11.6     |\n",
            "|-------------------------------+----------------------+----------------------+\n",
            "| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |\n",
            "| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |\n",
            "|                               |                      |               MIG M. |\n",
            "|===============================+======================+======================|\n",
            "|   0  Tesla T4            Off  | 00000000:00:04.0 Off |                    0 |\n",
            "| N/A   79C    P0    46W /  70W |  10169MiB / 15360MiB |     20%      Default |\n",
            "|                               |                      |                  N/A |\n",
            "+-------------------------------+----------------------+----------------------+\n",
            "                                                                               \n",
            "+-----------------------------------------------------------------------------+\n",
            "| Processes:                                                                  |\n",
            "|  GPU   GI   CI        PID   Type   Process name                  GPU Memory |\n",
            "|        ID   ID                                                   Usage      |\n",
            "|=============================================================================|\n",
            "|    0   N/A  N/A      2206      C                                    2635MiB |\n",
            "|    0   N/A  N/A   1706789      C                                    7531MiB |\n",
            "+-----------------------------------------------------------------------------+\n",
            "\n",
            "INFO 2023-02-14 14:17:20,450 tensorboard_hook.py: 255: Logging metrics. Iteration 50\n",
            "INFO 2023-02-14 14:17:20,681 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 50; lr: 0.0025; loss: 0.02569; btime(ms): 1124; eta: 0:16:38; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:23,710 tensorboard_hook.py: 255: Logging metrics. Iteration 55\n",
            "INFO 2023-02-14 14:17:23,943 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 55; lr: 0.0025; loss: 0.0887; btime(ms): 1087; eta: 0:16:00; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:26,918 tensorboard_hook.py: 255: Logging metrics. Iteration 60\n",
            "INFO 2023-02-14 14:17:27,149 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 60; lr: 0.0025; loss: 0.07003; btime(ms): 1050; eta: 0:15:22; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:30,101 tensorboard_hook.py: 255: Logging metrics. Iteration 65\n",
            "INFO 2023-02-14 14:17:30,331 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 65; lr: 0.0025; loss: 0.14523; btime(ms): 1018; eta: 0:14:49; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:33,269 tensorboard_hook.py: 255: Logging metrics. Iteration 70\n",
            "INFO 2023-02-14 14:17:33,494 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 70; lr: 0.0025; loss: 0.04909; btime(ms): 991; eta: 0:14:20; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:36,429 tensorboard_hook.py: 255: Logging metrics. Iteration 75\n",
            "INFO 2023-02-14 14:17:36,654 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 75; lr: 0.0025; loss: 0.01396; btime(ms): 967; eta: 0:13:54; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:39,598 tensorboard_hook.py: 255: Logging metrics. Iteration 80\n",
            "INFO 2023-02-14 14:17:39,830 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 80; lr: 0.0025; loss: 0.03805; btime(ms): 946; eta: 0:13:31; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:42,771 tensorboard_hook.py: 255: Logging metrics. Iteration 85\n",
            "INFO 2023-02-14 14:17:42,994 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 85; lr: 0.0025; loss: 0.01166; btime(ms): 928; eta: 0:13:11; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:45,913 tensorboard_hook.py: 255: Logging metrics. Iteration 90\n",
            "INFO 2023-02-14 14:17:46,136 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 90; lr: 0.0025; loss: 0.02166; btime(ms): 911; eta: 0:12:52; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:49,053 tensorboard_hook.py: 255: Logging metrics. Iteration 95\n",
            "INFO 2023-02-14 14:17:49,278 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 95; lr: 0.0025; loss: 0.21921; btime(ms): 896; eta: 0:12:35; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:17:52,211 tensorboard_hook.py: 255: Logging metrics. Iteration 100\n",
            "INFO 2023-02-14 14:17:52,437 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 100; lr: 0.0025; loss: 0.05573; btime(ms): 883; eta: 0:12:20; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:18:56,469 tensorboard_hook.py: 255: Logging metrics. Iteration 200\n",
            "INFO 2023-02-14 14:18:56,699 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 200; lr: 0.0025; loss: 0.03004; btime(ms): 762; eta: 0:09:22; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:20:09,497 tensorboard_hook.py: 236: Logging Parameter gradients. Iteration 310\n",
            "INFO 2023-02-14 14:21:10,402 tensorboard_hook.py: 255: Logging metrics. Iteration 400\n",
            "INFO 2023-02-14 14:21:10,627 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 400; lr: 0.0025; loss: 0.09139; btime(ms): 716; eta: 0:06:25; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:23:18,405 tensorboard_hook.py: 255: Logging metrics. Iteration 600\n",
            "INFO 2023-02-14 14:23:18,633 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 600; lr: 0.0025; loss: 0.00084; btime(ms): 690; eta: 0:03:53; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:23:34,090 tensorboard_hook.py: 236: Logging Parameter gradients. Iteration 620\n",
            "INFO 2023-02-14 14:25:32,211 tensorboard_hook.py: 255: Logging metrics. Iteration 800\n",
            "INFO 2023-02-14 14:25:32,440 log_hooks.py: 277: Rank: 0; [ep: 0] iter: 800; lr: 0.0025; loss: 0.08653; btime(ms): 685; eta: 0:01:34; peak_mem(M): 7973;\n",
            "INFO 2023-02-14 14:26:58,181 tensorboard_hook.py: 236: Logging Parameter gradients. Iteration 930\n",
            "INFO 2023-02-14 14:27:06,856 trainer_main.py: 214: Meters synced\n",
            "INFO 2023-02-14 14:27:06,856 log_hooks.py: 566: Average train batch time (ms) for 938 batches: 674\n",
            "INFO 2023-02-14 14:27:06,857 log_hooks.py: 575: Train step time breakdown (rank 0):\n",
            "               Timer     Host    CudaEvent\n",
            "         read_sample:    2.68 ms    0.08 ms\n",
            "             forward:  247.33 ms  200.77 ms\n",
            "        loss_compute:    0.68 ms    0.65 ms\n",
            "     loss_all_reduce:    0.14 ms    0.14 ms\n",
            "       meters_update:    0.60 ms    0.63 ms\n",
            "            backward:   28.13 ms  433.16 ms\n",
            "      optimizer_step:  183.03 ms    7.15 ms\n",
            "    train_step_total:  668.75 ms  669.65 ms\n",
            "/usr/local/lib/python3.8/dist-packages/torch/cuda/memory.py:260: FutureWarning: torch.cuda.reset_max_memory_allocated now calls torch.cuda.reset_peak_memory_stats, which resets /all/ peak memory stats.\n",
            "  warnings.warn(\n",
            "/usr/local/lib/python3.8/dist-packages/torch/cuda/memory.py:286: FutureWarning: torch.cuda.reset_max_memory_cached now calls torch.cuda.reset_peak_memory_stats, which resets /all/ peak memory stats.\n",
            "  warnings.warn(\n",
            "INFO 2023-02-14 14:27:13,602 log_hooks.py: 498: Rank: 0, name: train_accuracy_list_meter, value: {'top_1': {0: 98.25}}\n",
            "INFO 2023-02-14 14:27:13,603 io.py:  63: Saving data to file: /content/my_trash_2//metrics.json\n",
            "INFO 2023-02-14 14:27:13,603 io.py:  89: Saved data to file: /content/my_trash_2//metrics.json\n",
            "INFO 2023-02-14 14:27:13,603 log_hooks.py: 425: [phase: 0] Saving checkpoint to /content/my_trash_2/\n",
            "INFO 2023-02-14 14:27:14,096 checkpoint.py: 131: Saved checkpoint: /content/my_trash_2//model_final_checkpoint_phase0.torch\n",
            "INFO 2023-02-14 14:27:14,096 checkpoint.py: 140: Creating symlink...\n",
            "INFO 2023-02-14 14:27:14,096 checkpoint.py: 144: Created symlink: /content/my_trash_2//checkpoint.torch\n",
            "INFO 2023-02-14 14:27:14,097 __init__.py: 101: Distributed Sampler config:\n",
            "{'num_replicas': 1, 'rank': 0, 'epoch': 1, 'num_samples': 10000, 'total_size': 10000, 'shuffle': True, 'seed': 0}\n",
            "/usr/local/lib/python3.8/dist-packages/torch/utils/data/dataloader.py:474: UserWarning: This DataLoader will create 5 worker processes in total. Our suggested max number of worker in current system is 2, which is smaller than what this DataLoader is going to create. Please be aware that excessive worker creation might get DataLoader running slow or even freeze, lower the worker number to avoid potential slowness/freeze if necessary.\n",
            "  warnings.warn(_create_warning_msg(\n",
            "** fvcore version of PathManager will be deprecated soon. **\n",
            "** Please migrate to the version in iopath repo. **\n",
            "https://github.com/facebookresearch/iopath \n",
            "\n",
            "** fvcore version of PathManager will be deprecated soon. **\n",
            "** Please migrate to the version in iopath repo. **\n",
            "https://github.com/facebookresearch/iopath \n",
            "\n",
            "** fvcore version of PathManager will be deprecated soon. **\n",
            "** Please migrate to the version in iopath repo. **\n",
            "https://github.com/facebookresearch/iopath \n",
            "\n",
            "** fvcore version of PathManager will be deprecated soon. **\n",
            "** Please migrate to the version in iopath repo. **\n",
            "https://github.com/facebookresearch/iopath \n",
            "\n",
            "** fvcore version of PathManager will be deprecated soon. **\n",
            "** Please migrate to the version in iopath repo. **\n",
            "https://github.com/facebookresearch/iopath \n",
            "\n",
            "INFO 2023-02-14 14:27:19,431 trainer_main.py: 333: Phase advanced. Rank: 0\n",
            "INFO 2023-02-14 14:27:19,431 state_update_hooks.py: 115: Starting phase 1 [test]\n",
            "INFO 2023-02-14 14:27:50,958 trainer_main.py: 214: Meters synced\n",
            "INFO 2023-02-14 14:27:50,958 log_hooks.py: 566: Average test batch time (ms) for 157 batches: 200\n",
            "INFO 2023-02-14 14:27:50,959 log_hooks.py: 498: Rank: 0, name: test_accuracy_list_meter, value: {'top_1': {0: 99.19}}\n",
            "INFO 2023-02-14 14:27:50,959 io.py:  63: Saving data to file: /content/my_trash_2//metrics.json\n",
            "INFO 2023-02-14 14:27:50,959 io.py:  89: Saved data to file: /content/my_trash_2//metrics.json\n",
            "INFO 2023-02-14 14:27:51,049 train.py: 131: All Done!\n",
            "INFO 2023-02-14 14:27:51,049 logger.py:  73: Shutting down loggers...\n",
            "INFO 2023-02-14 14:27:51,049 distributed_launcher.py: 168: All Done!\n",
            "INFO 2023-02-14 14:27:51,049 logger.py:  73: Shutting down loggers...\n"
          ]
        }
      ],
      "source": [
        "# Full-tuning ResNet50 on MNIST by attaching a classifiation head 2048->10.\n",
        "# Note that this takes ~12 minutes to run. \n",
        "\n",
        "# !python3 tools/run_distributed_engines.py \\\n",
        "#         hydra.verbose=true \\\n",
        "#         config=benchmark/linear_image_classification/mnist/eval_resnet_8gpu_transfer_mnist_linear.yaml \\\n",
        "#         config.DATA.TRAIN.DATA_SOURCES=\"[torchvision_dataset]\" \\\n",
        "#         config.DATA.TRAIN.LABEL_SOURCES=\"[torchvision_dataset]\" \\\n",
        "#         config.DATA.TRAIN.DATASET_NAMES=\"[MNIST]\" \\\n",
        "#         config.DATA.TRAIN.DATA_PATHS=\"[/content/data/]\" \\\n",
        "#         config.DATA.TEST.DATA_SOURCES=\"[torchvision_dataset]\" \\\n",
        "#         config.DATA.TEST.LABEL_SOURCES=\"[torchvision_dataset]\" \\\n",
        "#         config.DATA.TEST.DATASET_NAMES=\"[MNIST]\" \\\n",
        "#         config.DATA.TEST.DATA_PATHS=\"[/content/data/]\" \\\n",
        "#         config.TEST_MODEL=True \\\n",
        "#         config.DATA.TEST.BATCHSIZE_PER_REPLICA=64 \\\n",
        "#         config.DATA.TRAIN.BATCHSIZE_PER_REPLICA=64 \\\n",
        "#         config.DISTRIBUTED.NUM_NODES=1 \\\n",
        "#         config.DISTRIBUTED.NUM_PROC_PER_NODE=1 \\\n",
        "#         config.OPTIMIZER.num_epochs=1 \\\n",
        "#         config.OPTIMIZER.param_schedulers.lr.values=\"[0.01]\" \\\n",
        "#         config.OPTIMIZER.param_schedulers.lr.milestones=\"[]\" \\\n",
        "#         config.CHECKPOINT.DIR=\"/content/checkpoints\" \\\n",
        "#         config.MODEL.WEIGHTS_INIT.PARAMS_FILE=\"/content/resnet50-19c8e357.pth\" \\\n",
        "#         config.MODEL.WEIGHTS_INIT.STATE_DICT_KEY_NAME=\"\" \\\n",
        "#         config.MODEL.WEIGHTS_INIT.APPEND_PREFIX=\"trunk._feature_blocks.\" \\\n",
        "#         config.MODEL.FEATURE_EVAL_SETTINGS.EVAL_MODE_ON=True \\\n",
        "#         config.MODEL.FEATURE_EVAL_SETTINGS.FREEZE_TRUNK_ONLY=False \\\n",
        "#         config.MODEL.FEATURE_EVAL_SETTINGS.FREEZE_TRUNK_AND_HEAD=False \\\n",
        "#         config.MODEL.FEATURE_EVAL_SETTINGS.EXTRACT_TRUNK_FEATURES_ONLY=False \\\n",
        "#         config.MODEL.FEATURE_EVAL_SETTINGS.EVAL_TRUNK_AND_HEAD=False \\\n",
        "#         config.MODEL.HEAD.PARAMS=\"\"\"[[\"eval_mlp\", {\"in_channels\": 2048, \"dims\": [2048, 10]}]]\"\"\" \\\n",
        "#         config.HOOKS.TENSORBOARD_SETUP.USE_TENSORBOARD=true\n",
        "\n",
        "\n",
        "\n",
        "\n",
        "!python3 vissl_tools/run_distributed_engines.py \\\n",
        "        hydra.verbose=true \\\n",
        "        config=benchmark/linear_image_classification/mnist/eval_resnet_8gpu_transfer_mnist_linear.yaml \\\n",
        "        config.DATA.TRAIN.DATA_SOURCES=\"[torchvision_dataset]\" \\\n",
        "        config.DATA.TRAIN.LABEL_SOURCES=\"[torchvision_dataset]\" \\\n",
        "        config.DATA.TRAIN.DATASET_NAMES=\"[MNIST]\" \\\n",
        "        config.DATA.TRAIN.DATA_PATHS=\"[ats/data/]\" \\\n",
        "        config.DATA.TEST.DATA_SOURCES=\"[torchvision_dataset]\" \\\n",
        "        config.DATA.TEST.LABEL_SOURCES=\"[torchvision_dataset]\" \\\n",
        "        config.DATA.TEST.DATASET_NAMES=\"[MNIST]\" \\\n",
        "        config.DATA.TEST.DATA_PATHS=\"[ats/data/]\" \\\n",
        "        config.TEST_MODEL=True \\\n",
        "        config.DATA.TEST.BATCHSIZE_PER_REPLICA=64 \\\n",
        "        config.DATA.TRAIN.BATCHSIZE_PER_REPLICA=64 \\\n",
        "        config.DISTRIBUTED.NUM_NODES=1 \\\n",
        "        config.DISTRIBUTED.NUM_PROC_PER_NODE=1 \\\n",
        "        config.OPTIMIZER.num_epochs=1 \\\n",
        "        config.OPTIMIZER.param_schedulers.lr.values=\"[0.01]\" \\\n",
        "        config.OPTIMIZER.param_schedulers.lr.milestones=\"[]\" \\\n",
        "        config.CHECKPOINT.DIR=\"ats/tuned_models/\" \\\n",
        "        config.CHECKPOINT.OVERWRITE_EXISTING=False \\\n",
        "        config.MODEL.WEIGHTS_INIT.PARAMS_FILE=\"ats/models/resnet50-19c8e357.pth\" \\\n",
        "        config.MODEL.WEIGHTS_INIT.STATE_DICT_KEY_NAME=\"\" \\\n",
        "        config.MODEL.WEIGHTS_INIT.APPEND_PREFIX=\"trunk._feature_blocks.\" \\\n",
        "        config.MODEL.FEATURE_EVAL_SETTINGS.EVAL_MODE_ON=True \\\n",
        "        config.MODEL.FEATURE_EVAL_SETTINGS.FREEZE_TRUNK_ONLY=False \\\n",
        "        config.MODEL.FEATURE_EVAL_SETTINGS.FREEZE_TRUNK_AND_HEAD=False \\\n",
        "        config.MODEL.FEATURE_EVAL_SETTINGS.EXTRACT_TRUNK_FEATURES_ONLY=False \\\n",
        "        config.MODEL.FEATURE_EVAL_SETTINGS.EVAL_TRUNK_AND_HEAD=False \\\n",
        "        config.MODEL.HEAD.PARAMS=\"\"\"[[\"eval_mlp\", {\"in_channels\": 2048, \"dims\": [2048, 10]}]]\"\"\" \\\n",
        "        config.HOOKS.TENSORBOARD_SETUP.USE_TENSORBOARD=true\n",
        "\n",
        "\n",
        "\n",
        "\n",
        "# Setting for fulltuning -> config.MODEL.WEIGHTS_INIT.APPEND_PREFIX=\"trunk._feature_blocks.\"\n",
        "        # config.MODEL.FEATURE_EVAL_SETTINGS.EVAL_MODE_ON=True \\\n",
        "        # config.MODEL.FEATURE_EVAL_SETTINGS.FREEZE_TRUNK_ONLY=False \\\n",
        "        # config.MODEL.FEATURE_EVAL_SETTINGS.FREEZE_TRUNK_AND_HEAD=False \\\n",
        "        # config.MODEL.FEATURE_EVAL_SETTINGS.EXTRACT_TRUNK_FEATURES_ONLY=False \\\n",
        "        # config.MODEL.FEATURE_EVAL_SETTINGS.EVAL_TRUNK_AND_HEAD=False \\\n",
        "\n",
        "# Setting for classification head-only tuning -> config.MODEL.WEIGHTS_INIT.APPEND_PREFIX=\"trunk.base_model._feature_blocks.\"\n",
        "        # config.MODEL.FEATURE_EVAL_SETTINGS.EVAL_MODE_ON=True \\\n",
        "        # config.MODEL.FEATURE_EVAL_SETTINGS.FREEZE_TRUNK_ONLY=True \\\n",
        "        # config.MODEL.FEATURE_EVAL_SETTINGS.FREEZE_TRUNK_AND_HEAD=False \\\n",
        "        # config.MODEL.FEATURE_EVAL_SETTINGS.EXTRACT_TRUNK_FEATURES_ONLY=False \\\n",
        "        # config.MODEL.FEATURE_EVAL_SETTINGS.EVAL_TRUNK_AND_HEAD=False \\"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "F4BTSLqOL4yv",
        "outputId": "14e5bebb-f929-437a-fc0b-5bd9621e2fe1"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "checkpoint.torch  model_final_checkpoint_phase0.torch  train_config.yaml\n",
            "log.txt\t\t  stdout.json\n",
            "metrics.json\t  tb_logs\n",
            "{\"iteration\": 938, \"phase_idx\": 0, \"train_accuracy_list_meter\": {\"top_1\": {\"0\": 98.25}}, \"train_phase_idx\": 0}\n",
            "{\"iteration\": 938, \"phase_idx\": 1, \"test_accuracy_list_meter\": {\"top_1\": {\"0\": 99.19}}, \"train_phase_idx\": 0}\n"
          ]
        }
      ],
      "source": [
        "!ls /content/my_trash_2/\n",
        "!cat /content/my_trash_2/metrics.json\n",
        "\n",
        "# 0.9656000137329102\n",
        "\n",
        "\n",
        "# 0.9951833486557007"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "hPgTZPh2OU6x",
        "outputId": "41f88111-ed9c-489a-c7e3-dc29d7719b09"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "checkpoint.torch  model_final_checkpoint_phase0.torch  train_config.yaml\n",
            "log.txt\t\t  stdout.json\n",
            "metrics.json\t  tb_logs\n"
          ]
        }
      ],
      "source": [
        "!ls /content/checkpoints/"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "bW6qgGJGObIq",
        "outputId": "2643900e-4822-4ee1-b920-8d6995b9d80d"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "{\"iteration\": 938, \"phase_idx\": 0, \"train_accuracy_list_meter\": {\"top_1\": {\"res5\": 94.2417}}, \"train_phase_idx\": 0}\n",
            "{\"iteration\": 938, \"phase_idx\": 1, \"test_accuracy_list_meter\": {\"top_1\": {\"res5\": 96.83}}, \"train_phase_idx\": 0}\n"
          ]
        }
      ],
      "source": [
        "# Performance metrics.\n",
        "# !cat /content/checkpoints/metrics.json"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "4TSt892RGSNy"
      },
      "outputs": [],
      "source": [
        "# Prepare the dataloader.\n",
        "# Pick the same transformations as used for training procedure, i.e. from config.DATA.TRANSFORMS.\n",
        "mean, std = torch.tensor([0.485, 0.456, 0.406]), torch.tensor([0.485, 0.456, 0.406])\n",
        "transform = vision_transforms.Compose([MNISTImgPil2RGB(size=32, box=[2, 2]), \n",
        "                                       vision_transforms.Resize(224),\n",
        "                                        vision_transforms.ToTensor(),\n",
        "                                        vision_transforms.Normalize(mean=mean, std=std)])\n",
        "# inverse_transform = vision_transforms.Compose([vision_transforms.Normalize(mean=[0., 0., 0.], std=1/std),\n",
        "#                                                 vision_transforms.Normalize(mean=-mean, std=[1., 1., 1.])])\n",
        "\n",
        "# Define the dataset and dataloader.\n",
        "trainset = MNIST(root=ROOT, train=True, download=True, transform=transform)\n",
        "train_loader = DataLoader(trainset, batch_size=64, shuffle=False, num_workers=0, pin_memory=False)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "9j1LzSISOTGB"
      },
      "outputs": [],
      "source": [
        "class ProxyModel(nn.Module):\n",
        "    \"\"\"All models should return ONLY ONE vector of (N, C) where C = number of classes.\n",
        "    Considering most models in torchvision.models return one vector of (N,C), where\n",
        "    N is the number of inputs and C is the number of classes, torchattacks also only\n",
        "    supports limited forms of output. Please check the shape of the model’s output carefully.\"\"\"\n",
        "\n",
        "    def __init__(self, model, device, mode=\"train\"):\n",
        "        super(ProxyModel, self).__init__()\n",
        "        self.model = model\n",
        "        self.model.to(device)\n",
        "\n",
        "        # if mode == \"train\":\n",
        "        #     self.train()\n",
        "        # elif mode == \"eval\":\n",
        "        #     # TODO: Setting the model to train mode increases the accuracy.\n",
        "        #     self.eval()\n",
        "        #     # self.train()\n",
        "        # else:\n",
        "        #     raise ValueError(\"Invalid mode value, choose one of ('train', 'eval').\")\n",
        "\n",
        "        for param in self.model.parameters():\n",
        "            param.requires_grad = False\n",
        "\n",
        "    def forward(self, x):\n",
        "        return self.model(x)[0]\n",
        "\n",
        "\n",
        "# Loades full-tuned weights.\n",
        "def init_model(config: list, mode):\n",
        "    \"\"\"Initializes model from configs.\n",
        "    Args:\n",
        "        config: Configuration arguments.\n",
        "        mode: One of (\"train\", \"eval\").\n",
        "    Returns:\n",
        "        Initialized model.\n",
        "    \"\"\"\n",
        "    config = compose_hydra_configuration(config)\n",
        "    _, config = convert_to_attrdict(config)\n",
        "\n",
        "    # model = build_model(config.MODEL, config.OPTIMIZER)\n",
        "    # weights = load_checkpoint(checkpoint_path=config.MODEL.WEIGHTS_INIT.PARAMS_FILE)\n",
        "    # init_model_from_consolidated_weights(config=config,\n",
        "    #                                     model=model, state_dict=weights,\n",
        "    #                                     state_dict_key_name=\"classy_state_dict\",\n",
        "    #                                     skip_layers=[])\n",
        "\n",
        "\n",
        "    model = BaseSSLMultiInputOutputModel(config.MODEL, config.OPTIMIZER)\n",
        "    weights = load_checkpoint(checkpoint_path=config.MODEL.WEIGHTS_INIT.PARAMS_FILE)\n",
        "\n",
        "    # import torch.distributed as dist\n",
        "    # from vissl.models import convert_sync_bn\n",
        "\n",
        "    # dist.init_process_group(\"gloo\")\n",
        "    # if config[\"MODEL\"][\"SYNC_BN_CONFIG\"][\"CONVERT_BN_TO_SYNC_BN\"]:\n",
        "    #     print(\"Appling SyncBN..\")\n",
        "    #     model = convert_sync_bn(config, model)\n",
        "\n",
        "\n",
        "    print(weights[\"classy_state_dict\"][\"base_model\"][\"model\"][\"trunk\"].keys())\n",
        "    print('-'*20)\n",
        "    print(model.get_classy_state()[\"model\"][\"trunk\"].keys())\n",
        "\n",
        "    # print(list(weights[\"classy_state_dict\"][\"base_model\"][\"model\"][\"trunk\"].keys()) == list(model.get_classy_state()[\"model\"][\"trunk\"].keys()))\n",
        "\n",
        "    # backbone_weights = load_checkpoint(checkpoint_path=\"/content/resnet50-19c8e357.pth\")\n",
        "    # try:\n",
        "    #     for key in backbone_weights.keys():\n",
        "    #         adjusted_key = f\"base_model._feature_blocks.{key}\"\n",
        "    #         print(list((weights[\"classy_state_dict\"][\"base_model\"][\"model\"][\"trunk\"][adjusted_key][i] == \n",
        "    #                     backbone_weights[key][i]).all() for i in range(63)))\n",
        "    # except:\n",
        "    #     adjusted_key = f\"base_model._feature_blocks.{key}\"\n",
        "    #     print(list((weights[\"classy_state_dict\"][\"base_model\"][\"model\"][\"heads\"][adjusted_key][i] == \n",
        "    #                 backbone_weights[key][i]).all() for i in range(63)))\n",
        "\n",
        "    # backbone_weights = load_checkpoint(checkpoint_path=\"/content/resnet50-19c8e357.pth\")    \n",
        "    # for key in backbone_weights.keys():\n",
        "    #     adjusted_key = f\"_feature_blocks.{key}\"\n",
        "    #     print(list((weights[\"classy_state_dict\"][\"base_model\"][\"model\"][\"trunk\"][adjusted_key][i] == \n",
        "    #             backbone_weights[key][i]).all() for i in range(63)))\n",
        "\n",
        "\n",
        "    backbone_weights = load_checkpoint(checkpoint_path=\"/content/resnet50-19c8e357.pth\")   \n",
        "    key = '0.clf.clf.0.weight' # \n",
        "    adjusted_key = f\"_feature_blocks.fc.weight\"\n",
        "    print(weights[\"classy_state_dict\"][\"base_model\"][\"model\"][\"heads\"].keys())\n",
        "\n",
        "    prev = weights[\"classy_state_dict\"][\"base_model\"][\"model\"][\"heads\"][key]\n",
        "    print(backbone_weights.keys())\n",
        "\n",
        "\n",
        "    vissl_state_dict = weights.get(\"classy_state_dict\")\n",
        "    # model.set_classy_state(vissl_state_dict[\"base_model\"])\n",
        "\n",
        "    init_model_from_consolidated_weights(config=config, model=model, state_dict=weights,\n",
        "                                             state_dict_key_name=\"classy_state_dict\", skip_layers=[])\n",
        "    \n",
        "    new = dict(model.named_parameters())[f\"heads.{key}\"]\n",
        "\n",
        "    print(new==prev)\n",
        "\n",
        "\n",
        "\n",
        "\n",
        "    return ProxyModel(model, device, mode)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "wVvw9D9FwAZL"
      },
      "outputs": [],
      "source": [
        "import torch.distributed as dist\n",
        "\n",
        "\n",
        "\n",
        "# ``group_size`` must divide the total number of GPUs (world_size).\n",
        "\n",
        "# ``group_size`` of 0 would be considered as =world_size. In this case ``None`` will be returned.\n",
        "\n",
        "# ``group_size`` of 1 would be equivalent to using non-sync bn, but will still carry the overhead.\n",
        "\n",
        "\n",
        "\n",
        "def setup(rank, world_size):\n",
        "    os.environ['MASTER_ADDR'] = 'localhost'\n",
        "    os.environ['MASTER_PORT'] = '12356'\n",
        "\n",
        "    # initialize the process group\n",
        "    # dist.init_process_group(\"gloo\", rank=rank, world_size=world_size)\n",
        "    dist.init_process_group(\"gloo\", rank=0, world_size=2)\n",
        "\n",
        "def cleanup():\n",
        "    dist.destroy_process_group()\n",
        "\n",
        "\n",
        "# cleanup()\n",
        "# setup(0, 2)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "teeiAXPjOTDV",
        "outputId": "11509936-6165-4bef-d1b1-21fe3e15bfcf"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "odict_keys(['_feature_blocks.conv1.weight', '_feature_blocks.bn1.weight', '_feature_blocks.bn1.bias', '_feature_blocks.bn1.running_mean', '_feature_blocks.bn1.running_var', '_feature_blocks.bn1.num_batches_tracked', '_feature_blocks.layer1.0.conv1.weight', '_feature_blocks.layer1.0.bn1.weight', '_feature_blocks.layer1.0.bn1.bias', '_feature_blocks.layer1.0.bn1.running_mean', '_feature_blocks.layer1.0.bn1.running_var', '_feature_blocks.layer1.0.bn1.num_batches_tracked', '_feature_blocks.layer1.0.conv2.weight', '_feature_blocks.layer1.0.bn2.weight', '_feature_blocks.layer1.0.bn2.bias', '_feature_blocks.layer1.0.bn2.running_mean', '_feature_blocks.layer1.0.bn2.running_var', '_feature_blocks.layer1.0.bn2.num_batches_tracked', '_feature_blocks.layer1.0.conv3.weight', '_feature_blocks.layer1.0.bn3.weight', '_feature_blocks.layer1.0.bn3.bias', '_feature_blocks.layer1.0.bn3.running_mean', '_feature_blocks.layer1.0.bn3.running_var', '_feature_blocks.layer1.0.bn3.num_batches_tracked', '_feature_blocks.layer1.0.downsample.0.weight', '_feature_blocks.layer1.0.downsample.1.weight', '_feature_blocks.layer1.0.downsample.1.bias', '_feature_blocks.layer1.0.downsample.1.running_mean', '_feature_blocks.layer1.0.downsample.1.running_var', '_feature_blocks.layer1.0.downsample.1.num_batches_tracked', '_feature_blocks.layer1.1.conv1.weight', '_feature_blocks.layer1.1.bn1.weight', '_feature_blocks.layer1.1.bn1.bias', '_feature_blocks.layer1.1.bn1.running_mean', '_feature_blocks.layer1.1.bn1.running_var', '_feature_blocks.layer1.1.bn1.num_batches_tracked', '_feature_blocks.layer1.1.conv2.weight', '_feature_blocks.layer1.1.bn2.weight', '_feature_blocks.layer1.1.bn2.bias', '_feature_blocks.layer1.1.bn2.running_mean', '_feature_blocks.layer1.1.bn2.running_var', '_feature_blocks.layer1.1.bn2.num_batches_tracked', '_feature_blocks.layer1.1.conv3.weight', '_feature_blocks.layer1.1.bn3.weight', '_feature_blocks.layer1.1.bn3.bias', '_feature_blocks.layer1.1.bn3.running_mean', '_feature_blocks.layer1.1.bn3.running_var', '_feature_blocks.layer1.1.bn3.num_batches_tracked', '_feature_blocks.layer1.2.conv1.weight', '_feature_blocks.layer1.2.bn1.weight', '_feature_blocks.layer1.2.bn1.bias', '_feature_blocks.layer1.2.bn1.running_mean', '_feature_blocks.layer1.2.bn1.running_var', '_feature_blocks.layer1.2.bn1.num_batches_tracked', '_feature_blocks.layer1.2.conv2.weight', '_feature_blocks.layer1.2.bn2.weight', '_feature_blocks.layer1.2.bn2.bias', '_feature_blocks.layer1.2.bn2.running_mean', '_feature_blocks.layer1.2.bn2.running_var', '_feature_blocks.layer1.2.bn2.num_batches_tracked', '_feature_blocks.layer1.2.conv3.weight', '_feature_blocks.layer1.2.bn3.weight', '_feature_blocks.layer1.2.bn3.bias', '_feature_blocks.layer1.2.bn3.running_mean', '_feature_blocks.layer1.2.bn3.running_var', '_feature_blocks.layer1.2.bn3.num_batches_tracked', '_feature_blocks.layer2.0.conv1.weight', '_feature_blocks.layer2.0.bn1.weight', '_feature_blocks.layer2.0.bn1.bias', '_feature_blocks.layer2.0.bn1.running_mean', '_feature_blocks.layer2.0.bn1.running_var', '_feature_blocks.layer2.0.bn1.num_batches_tracked', '_feature_blocks.layer2.0.conv2.weight', '_feature_blocks.layer2.0.bn2.weight', '_feature_blocks.layer2.0.bn2.bias', '_feature_blocks.layer2.0.bn2.running_mean', '_feature_blocks.layer2.0.bn2.running_var', '_feature_blocks.layer2.0.bn2.num_batches_tracked', '_feature_blocks.layer2.0.conv3.weight', '_feature_blocks.layer2.0.bn3.weight', '_feature_blocks.layer2.0.bn3.bias', '_feature_blocks.layer2.0.bn3.running_mean', '_feature_blocks.layer2.0.bn3.running_var', '_feature_blocks.layer2.0.bn3.num_batches_tracked', '_feature_blocks.layer2.0.downsample.0.weight', '_feature_blocks.layer2.0.downsample.1.weight', '_feature_blocks.layer2.0.downsample.1.bias', '_feature_blocks.layer2.0.downsample.1.running_mean', '_feature_blocks.layer2.0.downsample.1.running_var', '_feature_blocks.layer2.0.downsample.1.num_batches_tracked', '_feature_blocks.layer2.1.conv1.weight', '_feature_blocks.layer2.1.bn1.weight', '_feature_blocks.layer2.1.bn1.bias', '_feature_blocks.layer2.1.bn1.running_mean', '_feature_blocks.layer2.1.bn1.running_var', '_feature_blocks.layer2.1.bn1.num_batches_tracked', '_feature_blocks.layer2.1.conv2.weight', '_feature_blocks.layer2.1.bn2.weight', '_feature_blocks.layer2.1.bn2.bias', '_feature_blocks.layer2.1.bn2.running_mean', '_feature_blocks.layer2.1.bn2.running_var', '_feature_blocks.layer2.1.bn2.num_batches_tracked', '_feature_blocks.layer2.1.conv3.weight', '_feature_blocks.layer2.1.bn3.weight', '_feature_blocks.layer2.1.bn3.bias', '_feature_blocks.layer2.1.bn3.running_mean', '_feature_blocks.layer2.1.bn3.running_var', '_feature_blocks.layer2.1.bn3.num_batches_tracked', '_feature_blocks.layer2.2.conv1.weight', '_feature_blocks.layer2.2.bn1.weight', '_feature_blocks.layer2.2.bn1.bias', '_feature_blocks.layer2.2.bn1.running_mean', '_feature_blocks.layer2.2.bn1.running_var', '_feature_blocks.layer2.2.bn1.num_batches_tracked', '_feature_blocks.layer2.2.conv2.weight', '_feature_blocks.layer2.2.bn2.weight', '_feature_blocks.layer2.2.bn2.bias', '_feature_blocks.layer2.2.bn2.running_mean', '_feature_blocks.layer2.2.bn2.running_var', '_feature_blocks.layer2.2.bn2.num_batches_tracked', '_feature_blocks.layer2.2.conv3.weight', '_feature_blocks.layer2.2.bn3.weight', '_feature_blocks.layer2.2.bn3.bias', '_feature_blocks.layer2.2.bn3.running_mean', '_feature_blocks.layer2.2.bn3.running_var', '_feature_blocks.layer2.2.bn3.num_batches_tracked', '_feature_blocks.layer2.3.conv1.weight', '_feature_blocks.layer2.3.bn1.weight', '_feature_blocks.layer2.3.bn1.bias', '_feature_blocks.layer2.3.bn1.running_mean', '_feature_blocks.layer2.3.bn1.running_var', '_feature_blocks.layer2.3.bn1.num_batches_tracked', '_feature_blocks.layer2.3.conv2.weight', '_feature_blocks.layer2.3.bn2.weight', '_feature_blocks.layer2.3.bn2.bias', '_feature_blocks.layer2.3.bn2.running_mean', '_feature_blocks.layer2.3.bn2.running_var', '_feature_blocks.layer2.3.bn2.num_batches_tracked', '_feature_blocks.layer2.3.conv3.weight', '_feature_blocks.layer2.3.bn3.weight', '_feature_blocks.layer2.3.bn3.bias', '_feature_blocks.layer2.3.bn3.running_mean', '_feature_blocks.layer2.3.bn3.running_var', '_feature_blocks.layer2.3.bn3.num_batches_tracked', '_feature_blocks.layer3.0.conv1.weight', '_feature_blocks.layer3.0.bn1.weight', '_feature_blocks.layer3.0.bn1.bias', '_feature_blocks.layer3.0.bn1.running_mean', '_feature_blocks.layer3.0.bn1.running_var', '_feature_blocks.layer3.0.bn1.num_batches_tracked', '_feature_blocks.layer3.0.conv2.weight', '_feature_blocks.layer3.0.bn2.weight', '_feature_blocks.layer3.0.bn2.bias', '_feature_blocks.layer3.0.bn2.running_mean', '_feature_blocks.layer3.0.bn2.running_var', '_feature_blocks.layer3.0.bn2.num_batches_tracked', '_feature_blocks.layer3.0.conv3.weight', '_feature_blocks.layer3.0.bn3.weight', '_feature_blocks.layer3.0.bn3.bias', '_feature_blocks.layer3.0.bn3.running_mean', '_feature_blocks.layer3.0.bn3.running_var', '_feature_blocks.layer3.0.bn3.num_batches_tracked', '_feature_blocks.layer3.0.downsample.0.weight', '_feature_blocks.layer3.0.downsample.1.weight', '_feature_blocks.layer3.0.downsample.1.bias', '_feature_blocks.layer3.0.downsample.1.running_mean', '_feature_blocks.layer3.0.downsample.1.running_var', '_feature_blocks.layer3.0.downsample.1.num_batches_tracked', '_feature_blocks.layer3.1.conv1.weight', '_feature_blocks.layer3.1.bn1.weight', '_feature_blocks.layer3.1.bn1.bias', '_feature_blocks.layer3.1.bn1.running_mean', '_feature_blocks.layer3.1.bn1.running_var', '_feature_blocks.layer3.1.bn1.num_batches_tracked', '_feature_blocks.layer3.1.conv2.weight', '_feature_blocks.layer3.1.bn2.weight', '_feature_blocks.layer3.1.bn2.bias', '_feature_blocks.layer3.1.bn2.running_mean', '_feature_blocks.layer3.1.bn2.running_var', '_feature_blocks.layer3.1.bn2.num_batches_tracked', '_feature_blocks.layer3.1.conv3.weight', '_feature_blocks.layer3.1.bn3.weight', '_feature_blocks.layer3.1.bn3.bias', '_feature_blocks.layer3.1.bn3.running_mean', '_feature_blocks.layer3.1.bn3.running_var', '_feature_blocks.layer3.1.bn3.num_batches_tracked', '_feature_blocks.layer3.2.conv1.weight', '_feature_blocks.layer3.2.bn1.weight', '_feature_blocks.layer3.2.bn1.bias', '_feature_blocks.layer3.2.bn1.running_mean', '_feature_blocks.layer3.2.bn1.running_var', '_feature_blocks.layer3.2.bn1.num_batches_tracked', '_feature_blocks.layer3.2.conv2.weight', '_feature_blocks.layer3.2.bn2.weight', '_feature_blocks.layer3.2.bn2.bias', '_feature_blocks.layer3.2.bn2.running_mean', '_feature_blocks.layer3.2.bn2.running_var', '_feature_blocks.layer3.2.bn2.num_batches_tracked', '_feature_blocks.layer3.2.conv3.weight', '_feature_blocks.layer3.2.bn3.weight', '_feature_blocks.layer3.2.bn3.bias', '_feature_blocks.layer3.2.bn3.running_mean', '_feature_blocks.layer3.2.bn3.running_var', '_feature_blocks.layer3.2.bn3.num_batches_tracked', '_feature_blocks.layer3.3.conv1.weight', '_feature_blocks.layer3.3.bn1.weight', '_feature_blocks.layer3.3.bn1.bias', '_feature_blocks.layer3.3.bn1.running_mean', '_feature_blocks.layer3.3.bn1.running_var', '_feature_blocks.layer3.3.bn1.num_batches_tracked', '_feature_blocks.layer3.3.conv2.weight', '_feature_blocks.layer3.3.bn2.weight', '_feature_blocks.layer3.3.bn2.bias', '_feature_blocks.layer3.3.bn2.running_mean', '_feature_blocks.layer3.3.bn2.running_var', '_feature_blocks.layer3.3.bn2.num_batches_tracked', '_feature_blocks.layer3.3.conv3.weight', '_feature_blocks.layer3.3.bn3.weight', '_feature_blocks.layer3.3.bn3.bias', '_feature_blocks.layer3.3.bn3.running_mean', '_feature_blocks.layer3.3.bn3.running_var', '_feature_blocks.layer3.3.bn3.num_batches_tracked', '_feature_blocks.layer3.4.conv1.weight', '_feature_blocks.layer3.4.bn1.weight', '_feature_blocks.layer3.4.bn1.bias', '_feature_blocks.layer3.4.bn1.running_mean', '_feature_blocks.layer3.4.bn1.running_var', '_feature_blocks.layer3.4.bn1.num_batches_tracked', '_feature_blocks.layer3.4.conv2.weight', '_feature_blocks.layer3.4.bn2.weight', '_feature_blocks.layer3.4.bn2.bias', '_feature_blocks.layer3.4.bn2.running_mean', '_feature_blocks.layer3.4.bn2.running_var', '_feature_blocks.layer3.4.bn2.num_batches_tracked', '_feature_blocks.layer3.4.conv3.weight', '_feature_blocks.layer3.4.bn3.weight', '_feature_blocks.layer3.4.bn3.bias', '_feature_blocks.layer3.4.bn3.running_mean', '_feature_blocks.layer3.4.bn3.running_var', '_feature_blocks.layer3.4.bn3.num_batches_tracked', '_feature_blocks.layer3.5.conv1.weight', '_feature_blocks.layer3.5.bn1.weight', '_feature_blocks.layer3.5.bn1.bias', '_feature_blocks.layer3.5.bn1.running_mean', '_feature_blocks.layer3.5.bn1.running_var', '_feature_blocks.layer3.5.bn1.num_batches_tracked', '_feature_blocks.layer3.5.conv2.weight', '_feature_blocks.layer3.5.bn2.weight', '_feature_blocks.layer3.5.bn2.bias', '_feature_blocks.layer3.5.bn2.running_mean', '_feature_blocks.layer3.5.bn2.running_var', '_feature_blocks.layer3.5.bn2.num_batches_tracked', '_feature_blocks.layer3.5.conv3.weight', '_feature_blocks.layer3.5.bn3.weight', '_feature_blocks.layer3.5.bn3.bias', '_feature_blocks.layer3.5.bn3.running_mean', '_feature_blocks.layer3.5.bn3.running_var', '_feature_blocks.layer3.5.bn3.num_batches_tracked', '_feature_blocks.layer4.0.conv1.weight', '_feature_blocks.layer4.0.bn1.weight', '_feature_blocks.layer4.0.bn1.bias', '_feature_blocks.layer4.0.bn1.running_mean', '_feature_blocks.layer4.0.bn1.running_var', '_feature_blocks.layer4.0.bn1.num_batches_tracked', '_feature_blocks.layer4.0.conv2.weight', '_feature_blocks.layer4.0.bn2.weight', '_feature_blocks.layer4.0.bn2.bias', '_feature_blocks.layer4.0.bn2.running_mean', '_feature_blocks.layer4.0.bn2.running_var', '_feature_blocks.layer4.0.bn2.num_batches_tracked', '_feature_blocks.layer4.0.conv3.weight', '_feature_blocks.layer4.0.bn3.weight', '_feature_blocks.layer4.0.bn3.bias', '_feature_blocks.layer4.0.bn3.running_mean', '_feature_blocks.layer4.0.bn3.running_var', '_feature_blocks.layer4.0.bn3.num_batches_tracked', '_feature_blocks.layer4.0.downsample.0.weight', '_feature_blocks.layer4.0.downsample.1.weight', '_feature_blocks.layer4.0.downsample.1.bias', '_feature_blocks.layer4.0.downsample.1.running_mean', '_feature_blocks.layer4.0.downsample.1.running_var', '_feature_blocks.layer4.0.downsample.1.num_batches_tracked', '_feature_blocks.layer4.1.conv1.weight', '_feature_blocks.layer4.1.bn1.weight', '_feature_blocks.layer4.1.bn1.bias', '_feature_blocks.layer4.1.bn1.running_mean', '_feature_blocks.layer4.1.bn1.running_var', '_feature_blocks.layer4.1.bn1.num_batches_tracked', '_feature_blocks.layer4.1.conv2.weight', '_feature_blocks.layer4.1.bn2.weight', '_feature_blocks.layer4.1.bn2.bias', '_feature_blocks.layer4.1.bn2.running_mean', '_feature_blocks.layer4.1.bn2.running_var', '_feature_blocks.layer4.1.bn2.num_batches_tracked', '_feature_blocks.layer4.1.conv3.weight', '_feature_blocks.layer4.1.bn3.weight', '_feature_blocks.layer4.1.bn3.bias', '_feature_blocks.layer4.1.bn3.running_mean', '_feature_blocks.layer4.1.bn3.running_var', '_feature_blocks.layer4.1.bn3.num_batches_tracked', '_feature_blocks.layer4.2.conv1.weight', '_feature_blocks.layer4.2.bn1.weight', '_feature_blocks.layer4.2.bn1.bias', '_feature_blocks.layer4.2.bn1.running_mean', '_feature_blocks.layer4.2.bn1.running_var', '_feature_blocks.layer4.2.bn1.num_batches_tracked', '_feature_blocks.layer4.2.conv2.weight', '_feature_blocks.layer4.2.bn2.weight', '_feature_blocks.layer4.2.bn2.bias', '_feature_blocks.layer4.2.bn2.running_mean', '_feature_blocks.layer4.2.bn2.running_var', '_feature_blocks.layer4.2.bn2.num_batches_tracked', '_feature_blocks.layer4.2.conv3.weight', '_feature_blocks.layer4.2.bn3.weight', '_feature_blocks.layer4.2.bn3.bias', '_feature_blocks.layer4.2.bn3.running_mean', '_feature_blocks.layer4.2.bn3.running_var', '_feature_blocks.layer4.2.bn3.num_batches_tracked'])\n",
            "--------------------\n",
            "odict_keys(['base_model._feature_blocks.conv1.weight', 'base_model._feature_blocks.bn1.weight', 'base_model._feature_blocks.bn1.bias', 'base_model._feature_blocks.bn1.running_mean', 'base_model._feature_blocks.bn1.running_var', 'base_model._feature_blocks.bn1.num_batches_tracked', 'base_model._feature_blocks.layer1.0.conv1.weight', 'base_model._feature_blocks.layer1.0.bn1.weight', 'base_model._feature_blocks.layer1.0.bn1.bias', 'base_model._feature_blocks.layer1.0.bn1.running_mean', 'base_model._feature_blocks.layer1.0.bn1.running_var', 'base_model._feature_blocks.layer1.0.bn1.num_batches_tracked', 'base_model._feature_blocks.layer1.0.conv2.weight', 'base_model._feature_blocks.layer1.0.bn2.weight', 'base_model._feature_blocks.layer1.0.bn2.bias', 'base_model._feature_blocks.layer1.0.bn2.running_mean', 'base_model._feature_blocks.layer1.0.bn2.running_var', 'base_model._feature_blocks.layer1.0.bn2.num_batches_tracked', 'base_model._feature_blocks.layer1.0.conv3.weight', 'base_model._feature_blocks.layer1.0.bn3.weight', 'base_model._feature_blocks.layer1.0.bn3.bias', 'base_model._feature_blocks.layer1.0.bn3.running_mean', 'base_model._feature_blocks.layer1.0.bn3.running_var', 'base_model._feature_blocks.layer1.0.bn3.num_batches_tracked', 'base_model._feature_blocks.layer1.0.downsample.0.weight', 'base_model._feature_blocks.layer1.0.downsample.1.weight', 'base_model._feature_blocks.layer1.0.downsample.1.bias', 'base_model._feature_blocks.layer1.0.downsample.1.running_mean', 'base_model._feature_blocks.layer1.0.downsample.1.running_var', 'base_model._feature_blocks.layer1.0.downsample.1.num_batches_tracked', 'base_model._feature_blocks.layer1.1.conv1.weight', 'base_model._feature_blocks.layer1.1.bn1.weight', 'base_model._feature_blocks.layer1.1.bn1.bias', 'base_model._feature_blocks.layer1.1.bn1.running_mean', 'base_model._feature_blocks.layer1.1.bn1.running_var', 'base_model._feature_blocks.layer1.1.bn1.num_batches_tracked', 'base_model._feature_blocks.layer1.1.conv2.weight', 'base_model._feature_blocks.layer1.1.bn2.weight', 'base_model._feature_blocks.layer1.1.bn2.bias', 'base_model._feature_blocks.layer1.1.bn2.running_mean', 'base_model._feature_blocks.layer1.1.bn2.running_var', 'base_model._feature_blocks.layer1.1.bn2.num_batches_tracked', 'base_model._feature_blocks.layer1.1.conv3.weight', 'base_model._feature_blocks.layer1.1.bn3.weight', 'base_model._feature_blocks.layer1.1.bn3.bias', 'base_model._feature_blocks.layer1.1.bn3.running_mean', 'base_model._feature_blocks.layer1.1.bn3.running_var', 'base_model._feature_blocks.layer1.1.bn3.num_batches_tracked', 'base_model._feature_blocks.layer1.2.conv1.weight', 'base_model._feature_blocks.layer1.2.bn1.weight', 'base_model._feature_blocks.layer1.2.bn1.bias', 'base_model._feature_blocks.layer1.2.bn1.running_mean', 'base_model._feature_blocks.layer1.2.bn1.running_var', 'base_model._feature_blocks.layer1.2.bn1.num_batches_tracked', 'base_model._feature_blocks.layer1.2.conv2.weight', 'base_model._feature_blocks.layer1.2.bn2.weight', 'base_model._feature_blocks.layer1.2.bn2.bias', 'base_model._feature_blocks.layer1.2.bn2.running_mean', 'base_model._feature_blocks.layer1.2.bn2.running_var', 'base_model._feature_blocks.layer1.2.bn2.num_batches_tracked', 'base_model._feature_blocks.layer1.2.conv3.weight', 'base_model._feature_blocks.layer1.2.bn3.weight', 'base_model._feature_blocks.layer1.2.bn3.bias', 'base_model._feature_blocks.layer1.2.bn3.running_mean', 'base_model._feature_blocks.layer1.2.bn3.running_var', 'base_model._feature_blocks.layer1.2.bn3.num_batches_tracked', 'base_model._feature_blocks.layer2.0.conv1.weight', 'base_model._feature_blocks.layer2.0.bn1.weight', 'base_model._feature_blocks.layer2.0.bn1.bias', 'base_model._feature_blocks.layer2.0.bn1.running_mean', 'base_model._feature_blocks.layer2.0.bn1.running_var', 'base_model._feature_blocks.layer2.0.bn1.num_batches_tracked', 'base_model._feature_blocks.layer2.0.conv2.weight', 'base_model._feature_blocks.layer2.0.bn2.weight', 'base_model._feature_blocks.layer2.0.bn2.bias', 'base_model._feature_blocks.layer2.0.bn2.running_mean', 'base_model._feature_blocks.layer2.0.bn2.running_var', 'base_model._feature_blocks.layer2.0.bn2.num_batches_tracked', 'base_model._feature_blocks.layer2.0.conv3.weight', 'base_model._feature_blocks.layer2.0.bn3.weight', 'base_model._feature_blocks.layer2.0.bn3.bias', 'base_model._feature_blocks.layer2.0.bn3.running_mean', 'base_model._feature_blocks.layer2.0.bn3.running_var', 'base_model._feature_blocks.layer2.0.bn3.num_batches_tracked', 'base_model._feature_blocks.layer2.0.downsample.0.weight', 'base_model._feature_blocks.layer2.0.downsample.1.weight', 'base_model._feature_blocks.layer2.0.downsample.1.bias', 'base_model._feature_blocks.layer2.0.downsample.1.running_mean', 'base_model._feature_blocks.layer2.0.downsample.1.running_var', 'base_model._feature_blocks.layer2.0.downsample.1.num_batches_tracked', 'base_model._feature_blocks.layer2.1.conv1.weight', 'base_model._feature_blocks.layer2.1.bn1.weight', 'base_model._feature_blocks.layer2.1.bn1.bias', 'base_model._feature_blocks.layer2.1.bn1.running_mean', 'base_model._feature_blocks.layer2.1.bn1.running_var', 'base_model._feature_blocks.layer2.1.bn1.num_batches_tracked', 'base_model._feature_blocks.layer2.1.conv2.weight', 'base_model._feature_blocks.layer2.1.bn2.weight', 'base_model._feature_blocks.layer2.1.bn2.bias', 'base_model._feature_blocks.layer2.1.bn2.running_mean', 'base_model._feature_blocks.layer2.1.bn2.running_var', 'base_model._feature_blocks.layer2.1.bn2.num_batches_tracked', 'base_model._feature_blocks.layer2.1.conv3.weight', 'base_model._feature_blocks.layer2.1.bn3.weight', 'base_model._feature_blocks.layer2.1.bn3.bias', 'base_model._feature_blocks.layer2.1.bn3.running_mean', 'base_model._feature_blocks.layer2.1.bn3.running_var', 'base_model._feature_blocks.layer2.1.bn3.num_batches_tracked', 'base_model._feature_blocks.layer2.2.conv1.weight', 'base_model._feature_blocks.layer2.2.bn1.weight', 'base_model._feature_blocks.layer2.2.bn1.bias', 'base_model._feature_blocks.layer2.2.bn1.running_mean', 'base_model._feature_blocks.layer2.2.bn1.running_var', 'base_model._feature_blocks.layer2.2.bn1.num_batches_tracked', 'base_model._feature_blocks.layer2.2.conv2.weight', 'base_model._feature_blocks.layer2.2.bn2.weight', 'base_model._feature_blocks.layer2.2.bn2.bias', 'base_model._feature_blocks.layer2.2.bn2.running_mean', 'base_model._feature_blocks.layer2.2.bn2.running_var', 'base_model._feature_blocks.layer2.2.bn2.num_batches_tracked', 'base_model._feature_blocks.layer2.2.conv3.weight', 'base_model._feature_blocks.layer2.2.bn3.weight', 'base_model._feature_blocks.layer2.2.bn3.bias', 'base_model._feature_blocks.layer2.2.bn3.running_mean', 'base_model._feature_blocks.layer2.2.bn3.running_var', 'base_model._feature_blocks.layer2.2.bn3.num_batches_tracked', 'base_model._feature_blocks.layer2.3.conv1.weight', 'base_model._feature_blocks.layer2.3.bn1.weight', 'base_model._feature_blocks.layer2.3.bn1.bias', 'base_model._feature_blocks.layer2.3.bn1.running_mean', 'base_model._feature_blocks.layer2.3.bn1.running_var', 'base_model._feature_blocks.layer2.3.bn1.num_batches_tracked', 'base_model._feature_blocks.layer2.3.conv2.weight', 'base_model._feature_blocks.layer2.3.bn2.weight', 'base_model._feature_blocks.layer2.3.bn2.bias', 'base_model._feature_blocks.layer2.3.bn2.running_mean', 'base_model._feature_blocks.layer2.3.bn2.running_var', 'base_model._feature_blocks.layer2.3.bn2.num_batches_tracked', 'base_model._feature_blocks.layer2.3.conv3.weight', 'base_model._feature_blocks.layer2.3.bn3.weight', 'base_model._feature_blocks.layer2.3.bn3.bias', 'base_model._feature_blocks.layer2.3.bn3.running_mean', 'base_model._feature_blocks.layer2.3.bn3.running_var', 'base_model._feature_blocks.layer2.3.bn3.num_batches_tracked', 'base_model._feature_blocks.layer3.0.conv1.weight', 'base_model._feature_blocks.layer3.0.bn1.weight', 'base_model._feature_blocks.layer3.0.bn1.bias', 'base_model._feature_blocks.layer3.0.bn1.running_mean', 'base_model._feature_blocks.layer3.0.bn1.running_var', 'base_model._feature_blocks.layer3.0.bn1.num_batches_tracked', 'base_model._feature_blocks.layer3.0.conv2.weight', 'base_model._feature_blocks.layer3.0.bn2.weight', 'base_model._feature_blocks.layer3.0.bn2.bias', 'base_model._feature_blocks.layer3.0.bn2.running_mean', 'base_model._feature_blocks.layer3.0.bn2.running_var', 'base_model._feature_blocks.layer3.0.bn2.num_batches_tracked', 'base_model._feature_blocks.layer3.0.conv3.weight', 'base_model._feature_blocks.layer3.0.bn3.weight', 'base_model._feature_blocks.layer3.0.bn3.bias', 'base_model._feature_blocks.layer3.0.bn3.running_mean', 'base_model._feature_blocks.layer3.0.bn3.running_var', 'base_model._feature_blocks.layer3.0.bn3.num_batches_tracked', 'base_model._feature_blocks.layer3.0.downsample.0.weight', 'base_model._feature_blocks.layer3.0.downsample.1.weight', 'base_model._feature_blocks.layer3.0.downsample.1.bias', 'base_model._feature_blocks.layer3.0.downsample.1.running_mean', 'base_model._feature_blocks.layer3.0.downsample.1.running_var', 'base_model._feature_blocks.layer3.0.downsample.1.num_batches_tracked', 'base_model._feature_blocks.layer3.1.conv1.weight', 'base_model._feature_blocks.layer3.1.bn1.weight', 'base_model._feature_blocks.layer3.1.bn1.bias', 'base_model._feature_blocks.layer3.1.bn1.running_mean', 'base_model._feature_blocks.layer3.1.bn1.running_var', 'base_model._feature_blocks.layer3.1.bn1.num_batches_tracked', 'base_model._feature_blocks.layer3.1.conv2.weight', 'base_model._feature_blocks.layer3.1.bn2.weight', 'base_model._feature_blocks.layer3.1.bn2.bias', 'base_model._feature_blocks.layer3.1.bn2.running_mean', 'base_model._feature_blocks.layer3.1.bn2.running_var', 'base_model._feature_blocks.layer3.1.bn2.num_batches_tracked', 'base_model._feature_blocks.layer3.1.conv3.weight', 'base_model._feature_blocks.layer3.1.bn3.weight', 'base_model._feature_blocks.layer3.1.bn3.bias', 'base_model._feature_blocks.layer3.1.bn3.running_mean', 'base_model._feature_blocks.layer3.1.bn3.running_var', 'base_model._feature_blocks.layer3.1.bn3.num_batches_tracked', 'base_model._feature_blocks.layer3.2.conv1.weight', 'base_model._feature_blocks.layer3.2.bn1.weight', 'base_model._feature_blocks.layer3.2.bn1.bias', 'base_model._feature_blocks.layer3.2.bn1.running_mean', 'base_model._feature_blocks.layer3.2.bn1.running_var', 'base_model._feature_blocks.layer3.2.bn1.num_batches_tracked', 'base_model._feature_blocks.layer3.2.conv2.weight', 'base_model._feature_blocks.layer3.2.bn2.weight', 'base_model._feature_blocks.layer3.2.bn2.bias', 'base_model._feature_blocks.layer3.2.bn2.running_mean', 'base_model._feature_blocks.layer3.2.bn2.running_var', 'base_model._feature_blocks.layer3.2.bn2.num_batches_tracked', 'base_model._feature_blocks.layer3.2.conv3.weight', 'base_model._feature_blocks.layer3.2.bn3.weight', 'base_model._feature_blocks.layer3.2.bn3.bias', 'base_model._feature_blocks.layer3.2.bn3.running_mean', 'base_model._feature_blocks.layer3.2.bn3.running_var', 'base_model._feature_blocks.layer3.2.bn3.num_batches_tracked', 'base_model._feature_blocks.layer3.3.conv1.weight', 'base_model._feature_blocks.layer3.3.bn1.weight', 'base_model._feature_blocks.layer3.3.bn1.bias', 'base_model._feature_blocks.layer3.3.bn1.running_mean', 'base_model._feature_blocks.layer3.3.bn1.running_var', 'base_model._feature_blocks.layer3.3.bn1.num_batches_tracked', 'base_model._feature_blocks.layer3.3.conv2.weight', 'base_model._feature_blocks.layer3.3.bn2.weight', 'base_model._feature_blocks.layer3.3.bn2.bias', 'base_model._feature_blocks.layer3.3.bn2.running_mean', 'base_model._feature_blocks.layer3.3.bn2.running_var', 'base_model._feature_blocks.layer3.3.bn2.num_batches_tracked', 'base_model._feature_blocks.layer3.3.conv3.weight', 'base_model._feature_blocks.layer3.3.bn3.weight', 'base_model._feature_blocks.layer3.3.bn3.bias', 'base_model._feature_blocks.layer3.3.bn3.running_mean', 'base_model._feature_blocks.layer3.3.bn3.running_var', 'base_model._feature_blocks.layer3.3.bn3.num_batches_tracked', 'base_model._feature_blocks.layer3.4.conv1.weight', 'base_model._feature_blocks.layer3.4.bn1.weight', 'base_model._feature_blocks.layer3.4.bn1.bias', 'base_model._feature_blocks.layer3.4.bn1.running_mean', 'base_model._feature_blocks.layer3.4.bn1.running_var', 'base_model._feature_blocks.layer3.4.bn1.num_batches_tracked', 'base_model._feature_blocks.layer3.4.conv2.weight', 'base_model._feature_blocks.layer3.4.bn2.weight', 'base_model._feature_blocks.layer3.4.bn2.bias', 'base_model._feature_blocks.layer3.4.bn2.running_mean', 'base_model._feature_blocks.layer3.4.bn2.running_var', 'base_model._feature_blocks.layer3.4.bn2.num_batches_tracked', 'base_model._feature_blocks.layer3.4.conv3.weight', 'base_model._feature_blocks.layer3.4.bn3.weight', 'base_model._feature_blocks.layer3.4.bn3.bias', 'base_model._feature_blocks.layer3.4.bn3.running_mean', 'base_model._feature_blocks.layer3.4.bn3.running_var', 'base_model._feature_blocks.layer3.4.bn3.num_batches_tracked', 'base_model._feature_blocks.layer3.5.conv1.weight', 'base_model._feature_blocks.layer3.5.bn1.weight', 'base_model._feature_blocks.layer3.5.bn1.bias', 'base_model._feature_blocks.layer3.5.bn1.running_mean', 'base_model._feature_blocks.layer3.5.bn1.running_var', 'base_model._feature_blocks.layer3.5.bn1.num_batches_tracked', 'base_model._feature_blocks.layer3.5.conv2.weight', 'base_model._feature_blocks.layer3.5.bn2.weight', 'base_model._feature_blocks.layer3.5.bn2.bias', 'base_model._feature_blocks.layer3.5.bn2.running_mean', 'base_model._feature_blocks.layer3.5.bn2.running_var', 'base_model._feature_blocks.layer3.5.bn2.num_batches_tracked', 'base_model._feature_blocks.layer3.5.conv3.weight', 'base_model._feature_blocks.layer3.5.bn3.weight', 'base_model._feature_blocks.layer3.5.bn3.bias', 'base_model._feature_blocks.layer3.5.bn3.running_mean', 'base_model._feature_blocks.layer3.5.bn3.running_var', 'base_model._feature_blocks.layer3.5.bn3.num_batches_tracked', 'base_model._feature_blocks.layer4.0.conv1.weight', 'base_model._feature_blocks.layer4.0.bn1.weight', 'base_model._feature_blocks.layer4.0.bn1.bias', 'base_model._feature_blocks.layer4.0.bn1.running_mean', 'base_model._feature_blocks.layer4.0.bn1.running_var', 'base_model._feature_blocks.layer4.0.bn1.num_batches_tracked', 'base_model._feature_blocks.layer4.0.conv2.weight', 'base_model._feature_blocks.layer4.0.bn2.weight', 'base_model._feature_blocks.layer4.0.bn2.bias', 'base_model._feature_blocks.layer4.0.bn2.running_mean', 'base_model._feature_blocks.layer4.0.bn2.running_var', 'base_model._feature_blocks.layer4.0.bn2.num_batches_tracked', 'base_model._feature_blocks.layer4.0.conv3.weight', 'base_model._feature_blocks.layer4.0.bn3.weight', 'base_model._feature_blocks.layer4.0.bn3.bias', 'base_model._feature_blocks.layer4.0.bn3.running_mean', 'base_model._feature_blocks.layer4.0.bn3.running_var', 'base_model._feature_blocks.layer4.0.bn3.num_batches_tracked', 'base_model._feature_blocks.layer4.0.downsample.0.weight', 'base_model._feature_blocks.layer4.0.downsample.1.weight', 'base_model._feature_blocks.layer4.0.downsample.1.bias', 'base_model._feature_blocks.layer4.0.downsample.1.running_mean', 'base_model._feature_blocks.layer4.0.downsample.1.running_var', 'base_model._feature_blocks.layer4.0.downsample.1.num_batches_tracked', 'base_model._feature_blocks.layer4.1.conv1.weight', 'base_model._feature_blocks.layer4.1.bn1.weight', 'base_model._feature_blocks.layer4.1.bn1.bias', 'base_model._feature_blocks.layer4.1.bn1.running_mean', 'base_model._feature_blocks.layer4.1.bn1.running_var', 'base_model._feature_blocks.layer4.1.bn1.num_batches_tracked', 'base_model._feature_blocks.layer4.1.conv2.weight', 'base_model._feature_blocks.layer4.1.bn2.weight', 'base_model._feature_blocks.layer4.1.bn2.bias', 'base_model._feature_blocks.layer4.1.bn2.running_mean', 'base_model._feature_blocks.layer4.1.bn2.running_var', 'base_model._feature_blocks.layer4.1.bn2.num_batches_tracked', 'base_model._feature_blocks.layer4.1.conv3.weight', 'base_model._feature_blocks.layer4.1.bn3.weight', 'base_model._feature_blocks.layer4.1.bn3.bias', 'base_model._feature_blocks.layer4.1.bn3.running_mean', 'base_model._feature_blocks.layer4.1.bn3.running_var', 'base_model._feature_blocks.layer4.1.bn3.num_batches_tracked', 'base_model._feature_blocks.layer4.2.conv1.weight', 'base_model._feature_blocks.layer4.2.bn1.weight', 'base_model._feature_blocks.layer4.2.bn1.bias', 'base_model._feature_blocks.layer4.2.bn1.running_mean', 'base_model._feature_blocks.layer4.2.bn1.running_var', 'base_model._feature_blocks.layer4.2.bn1.num_batches_tracked', 'base_model._feature_blocks.layer4.2.conv2.weight', 'base_model._feature_blocks.layer4.2.bn2.weight', 'base_model._feature_blocks.layer4.2.bn2.bias', 'base_model._feature_blocks.layer4.2.bn2.running_mean', 'base_model._feature_blocks.layer4.2.bn2.running_var', 'base_model._feature_blocks.layer4.2.bn2.num_batches_tracked', 'base_model._feature_blocks.layer4.2.conv3.weight', 'base_model._feature_blocks.layer4.2.bn3.weight', 'base_model._feature_blocks.layer4.2.bn3.bias', 'base_model._feature_blocks.layer4.2.bn3.running_mean', 'base_model._feature_blocks.layer4.2.bn3.running_var', 'base_model._feature_blocks.layer4.2.bn3.num_batches_tracked'])\n",
            "odict_keys(['0.channel_bn.weight', '0.channel_bn.bias', '0.channel_bn.running_mean', '0.channel_bn.running_var', '0.channel_bn.num_batches_tracked', '0.clf.clf.0.weight', '0.clf.clf.0.bias'])\n",
            "odict_keys(['conv1.weight', 'bn1.running_mean', 'bn1.running_var', 'bn1.weight', 'bn1.bias', 'layer1.0.conv1.weight', 'layer1.0.bn1.running_mean', 'layer1.0.bn1.running_var', 'layer1.0.bn1.weight', 'layer1.0.bn1.bias', 'layer1.0.conv2.weight', 'layer1.0.bn2.running_mean', 'layer1.0.bn2.running_var', 'layer1.0.bn2.weight', 'layer1.0.bn2.bias', 'layer1.0.conv3.weight', 'layer1.0.bn3.running_mean', 'layer1.0.bn3.running_var', 'layer1.0.bn3.weight', 'layer1.0.bn3.bias', 'layer1.0.downsample.0.weight', 'layer1.0.downsample.1.running_mean', 'layer1.0.downsample.1.running_var', 'layer1.0.downsample.1.weight', 'layer1.0.downsample.1.bias', 'layer1.1.conv1.weight', 'layer1.1.bn1.running_mean', 'layer1.1.bn1.running_var', 'layer1.1.bn1.weight', 'layer1.1.bn1.bias', 'layer1.1.conv2.weight', 'layer1.1.bn2.running_mean', 'layer1.1.bn2.running_var', 'layer1.1.bn2.weight', 'layer1.1.bn2.bias', 'layer1.1.conv3.weight', 'layer1.1.bn3.running_mean', 'layer1.1.bn3.running_var', 'layer1.1.bn3.weight', 'layer1.1.bn3.bias', 'layer1.2.conv1.weight', 'layer1.2.bn1.running_mean', 'layer1.2.bn1.running_var', 'layer1.2.bn1.weight', 'layer1.2.bn1.bias', 'layer1.2.conv2.weight', 'layer1.2.bn2.running_mean', 'layer1.2.bn2.running_var', 'layer1.2.bn2.weight', 'layer1.2.bn2.bias', 'layer1.2.conv3.weight', 'layer1.2.bn3.running_mean', 'layer1.2.bn3.running_var', 'layer1.2.bn3.weight', 'layer1.2.bn3.bias', 'layer2.0.conv1.weight', 'layer2.0.bn1.running_mean', 'layer2.0.bn1.running_var', 'layer2.0.bn1.weight', 'layer2.0.bn1.bias', 'layer2.0.conv2.weight', 'layer2.0.bn2.running_mean', 'layer2.0.bn2.running_var', 'layer2.0.bn2.weight', 'layer2.0.bn2.bias', 'layer2.0.conv3.weight', 'layer2.0.bn3.running_mean', 'layer2.0.bn3.running_var', 'layer2.0.bn3.weight', 'layer2.0.bn3.bias', 'layer2.0.downsample.0.weight', 'layer2.0.downsample.1.running_mean', 'layer2.0.downsample.1.running_var', 'layer2.0.downsample.1.weight', 'layer2.0.downsample.1.bias', 'layer2.1.conv1.weight', 'layer2.1.bn1.running_mean', 'layer2.1.bn1.running_var', 'layer2.1.bn1.weight', 'layer2.1.bn1.bias', 'layer2.1.conv2.weight', 'layer2.1.bn2.running_mean', 'layer2.1.bn2.running_var', 'layer2.1.bn2.weight', 'layer2.1.bn2.bias', 'layer2.1.conv3.weight', 'layer2.1.bn3.running_mean', 'layer2.1.bn3.running_var', 'layer2.1.bn3.weight', 'layer2.1.bn3.bias', 'layer2.2.conv1.weight', 'layer2.2.bn1.running_mean', 'layer2.2.bn1.running_var', 'layer2.2.bn1.weight', 'layer2.2.bn1.bias', 'layer2.2.conv2.weight', 'layer2.2.bn2.running_mean', 'layer2.2.bn2.running_var', 'layer2.2.bn2.weight', 'layer2.2.bn2.bias', 'layer2.2.conv3.weight', 'layer2.2.bn3.running_mean', 'layer2.2.bn3.running_var', 'layer2.2.bn3.weight', 'layer2.2.bn3.bias', 'layer2.3.conv1.weight', 'layer2.3.bn1.running_mean', 'layer2.3.bn1.running_var', 'layer2.3.bn1.weight', 'layer2.3.bn1.bias', 'layer2.3.conv2.weight', 'layer2.3.bn2.running_mean', 'layer2.3.bn2.running_var', 'layer2.3.bn2.weight', 'layer2.3.bn2.bias', 'layer2.3.conv3.weight', 'layer2.3.bn3.running_mean', 'layer2.3.bn3.running_var', 'layer2.3.bn3.weight', 'layer2.3.bn3.bias', 'layer3.0.conv1.weight', 'layer3.0.bn1.running_mean', 'layer3.0.bn1.running_var', 'layer3.0.bn1.weight', 'layer3.0.bn1.bias', 'layer3.0.conv2.weight', 'layer3.0.bn2.running_mean', 'layer3.0.bn2.running_var', 'layer3.0.bn2.weight', 'layer3.0.bn2.bias', 'layer3.0.conv3.weight', 'layer3.0.bn3.running_mean', 'layer3.0.bn3.running_var', 'layer3.0.bn3.weight', 'layer3.0.bn3.bias', 'layer3.0.downsample.0.weight', 'layer3.0.downsample.1.running_mean', 'layer3.0.downsample.1.running_var', 'layer3.0.downsample.1.weight', 'layer3.0.downsample.1.bias', 'layer3.1.conv1.weight', 'layer3.1.bn1.running_mean', 'layer3.1.bn1.running_var', 'layer3.1.bn1.weight', 'layer3.1.bn1.bias', 'layer3.1.conv2.weight', 'layer3.1.bn2.running_mean', 'layer3.1.bn2.running_var', 'layer3.1.bn2.weight', 'layer3.1.bn2.bias', 'layer3.1.conv3.weight', 'layer3.1.bn3.running_mean', 'layer3.1.bn3.running_var', 'layer3.1.bn3.weight', 'layer3.1.bn3.bias', 'layer3.2.conv1.weight', 'layer3.2.bn1.running_mean', 'layer3.2.bn1.running_var', 'layer3.2.bn1.weight', 'layer3.2.bn1.bias', 'layer3.2.conv2.weight', 'layer3.2.bn2.running_mean', 'layer3.2.bn2.running_var', 'layer3.2.bn2.weight', 'layer3.2.bn2.bias', 'layer3.2.conv3.weight', 'layer3.2.bn3.running_mean', 'layer3.2.bn3.running_var', 'layer3.2.bn3.weight', 'layer3.2.bn3.bias', 'layer3.3.conv1.weight', 'layer3.3.bn1.running_mean', 'layer3.3.bn1.running_var', 'layer3.3.bn1.weight', 'layer3.3.bn1.bias', 'layer3.3.conv2.weight', 'layer3.3.bn2.running_mean', 'layer3.3.bn2.running_var', 'layer3.3.bn2.weight', 'layer3.3.bn2.bias', 'layer3.3.conv3.weight', 'layer3.3.bn3.running_mean', 'layer3.3.bn3.running_var', 'layer3.3.bn3.weight', 'layer3.3.bn3.bias', 'layer3.4.conv1.weight', 'layer3.4.bn1.running_mean', 'layer3.4.bn1.running_var', 'layer3.4.bn1.weight', 'layer3.4.bn1.bias', 'layer3.4.conv2.weight', 'layer3.4.bn2.running_mean', 'layer3.4.bn2.running_var', 'layer3.4.bn2.weight', 'layer3.4.bn2.bias', 'layer3.4.conv3.weight', 'layer3.4.bn3.running_mean', 'layer3.4.bn3.running_var', 'layer3.4.bn3.weight', 'layer3.4.bn3.bias', 'layer3.5.conv1.weight', 'layer3.5.bn1.running_mean', 'layer3.5.bn1.running_var', 'layer3.5.bn1.weight', 'layer3.5.bn1.bias', 'layer3.5.conv2.weight', 'layer3.5.bn2.running_mean', 'layer3.5.bn2.running_var', 'layer3.5.bn2.weight', 'layer3.5.bn2.bias', 'layer3.5.conv3.weight', 'layer3.5.bn3.running_mean', 'layer3.5.bn3.running_var', 'layer3.5.bn3.weight', 'layer3.5.bn3.bias', 'layer4.0.conv1.weight', 'layer4.0.bn1.running_mean', 'layer4.0.bn1.running_var', 'layer4.0.bn1.weight', 'layer4.0.bn1.bias', 'layer4.0.conv2.weight', 'layer4.0.bn2.running_mean', 'layer4.0.bn2.running_var', 'layer4.0.bn2.weight', 'layer4.0.bn2.bias', 'layer4.0.conv3.weight', 'layer4.0.bn3.running_mean', 'layer4.0.bn3.running_var', 'layer4.0.bn3.weight', 'layer4.0.bn3.bias', 'layer4.0.downsample.0.weight', 'layer4.0.downsample.1.running_mean', 'layer4.0.downsample.1.running_var', 'layer4.0.downsample.1.weight', 'layer4.0.downsample.1.bias', 'layer4.1.conv1.weight', 'layer4.1.bn1.running_mean', 'layer4.1.bn1.running_var', 'layer4.1.bn1.weight', 'layer4.1.bn1.bias', 'layer4.1.conv2.weight', 'layer4.1.bn2.running_mean', 'layer4.1.bn2.running_var', 'layer4.1.bn2.weight', 'layer4.1.bn2.bias', 'layer4.1.conv3.weight', 'layer4.1.bn3.running_mean', 'layer4.1.bn3.running_var', 'layer4.1.bn3.weight', 'layer4.1.bn3.bias', 'layer4.2.conv1.weight', 'layer4.2.bn1.running_mean', 'layer4.2.bn1.running_var', 'layer4.2.bn1.weight', 'layer4.2.bn1.bias', 'layer4.2.conv2.weight', 'layer4.2.bn2.running_mean', 'layer4.2.bn2.running_var', 'layer4.2.bn2.weight', 'layer4.2.bn2.bias', 'layer4.2.conv3.weight', 'layer4.2.bn3.running_mean', 'layer4.2.bn3.running_var', 'layer4.2.bn3.weight', 'layer4.2.bn3.bias', 'fc.weight', 'fc.bias'])\n",
            "tensor([[True, True, True,  ..., True, True, True],\n",
            "        [True, True, True,  ..., True, True, True],\n",
            "        [True, True, True,  ..., True, True, True],\n",
            "        ...,\n",
            "        [True, True, True,  ..., True, True, True],\n",
            "        [True, True, True,  ..., True, True, True],\n",
            "        [True, True, True,  ..., True, True, True]])\n"
          ]
        }
      ],
      "source": [
        "# Calling init_model to load full-tuned weights.\n",
        "device = torch.device(\"cuda:0\" if torch.cuda.is_available() else \"cpu\")\n",
        "# checkpoint_dir = \"/content/checkpoints\"\n",
        "# checkpoint_dir = \"/content/my_trash\"\n",
        "checkpoint_dir = \"/content/my_trash_2\"\n",
        "\n",
        "\n",
        "\n",
        "# cfg = [f\"config.CHECKPOINT.DIR={checkpoint_dir}\",\n",
        "#         \"config=benchmark/linear_image_classification/mnist/eval_resnet_8gpu_transfer_mnist_linear.yaml\",\n",
        "#         \"config.MODEL.FEATURE_EVAL_SETTINGS.EVAL_MODE_ON=True\",\n",
        "#         \"config.MODEL.FEATURE_EVAL_SETTINGS.FREEZE_TRUNK_AND_HEAD=True\",\n",
        "#         \"config.MODEL.FEATURE_EVAL_SETTINGS.EVAL_TRUNK_AND_HEAD=True\",\n",
        "#         \"+config.MODEL.APPEND_PREFIX='trunk._feature_blocks.'\"\n",
        "#         ]\n",
        "\n",
        "cfg = [f\"config.CHECKPOINT.DIR={checkpoint_dir}\",\n",
        "        \"config=benchmark/linear_image_classification/mnist/eval_resnet_8gpu_transfer_mnist_linear.yaml\",\n",
        "        \"config.MODEL.FEATURE_EVAL_SETTINGS.EVAL_MODE_ON=True\",\n",
        "        \"config.MODEL.FEATURE_EVAL_SETTINGS.FREEZE_TRUNK_AND_HEAD=True\",\n",
        "        \"config.MODEL.FEATURE_EVAL_SETTINGS.EVAL_TRUNK_AND_HEAD=True\"]\n",
        "\n",
        "model_final_checkpoint = os.path.join(checkpoint_dir, 'model_final_checkpoint_phase0.torch')\n",
        "cfg1 = cfg + [f\"config.MODEL.WEIGHTS_INIT.PARAMS_FILE={model_final_checkpoint}\"]\n",
        "model = init_model(cfg1, \"eval\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "g2W0UU5IyVkc",
        "outputId": "e6e0fd7b-cc55-43b8-a0f6-a3f76d5f8d13"
      },
      "outputs": [
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "100%|██████████| 938/938 [02:58<00:00,  5.25it/s]\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "Accuracy on 60000 examples:  0.995983362197876\n"
          ]
        }
      ],
      "source": [
        "# Evaluating model's accuracy. Above we saw that it is ~0.98 on train set, \n",
        "# hence we fairly expect the same performance after runing this small loop.\n",
        "n_correctly_classified, total = 0, 0\n",
        "\n",
        "model.eval()\n",
        "\n",
        "with torch.no_grad():\n",
        "    for batch_idx, (images, labels) in enumerate(tqdm(train_loader)):\n",
        "        images, labels = images.to(device), labels.to(device)\n",
        "\n",
        "        pred = model(images).argmax(dim=1)\n",
        "\n",
        "        n_correctly_classified += (pred == labels).sum()\n",
        "        total += labels.shape[0]\n",
        "\n",
        "        # if batch_idx == 4:\n",
        "        #     break\n",
        "\n",
        "\n",
        "print(f\"Accuracy on {total} examples:  {n_correctly_classified / total}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "_vEKEIqTX8v_"
      },
      "outputs": [],
      "source": [
        "0.9656000137329102 -> train\n",
        "0.744949996471405 -> eval\n",
        "0.9951833486557007 -> default\n",
        "0.995983362197876 -> default"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "2Q0guXGHvzCw"
      },
      "outputs": [],
      "source": [
        " # 0.9392833709716797"
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "gNakiXEyFL5s"
      },
      "source": [
        "# Weight comp"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "2aGuT8WdFLv3"
      },
      "outputs": [],
      "source": [
        "weights = load_checkpoint(checkpoint_path=\"/content/resnet50-19c8e357.pth\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "YLGA4XSeFLtz",
        "outputId": "16ef86d6-e226-422a-9f12-22a0da5bae42"
      },
      "outputs": [
        {
          "data": {
            "text/plain": [
              "tensor([[ 0.0151, -0.0021,  0.0132],\n",
              "        [ 0.0100, -0.0132, -0.0144],\n",
              "        [ 0.0021, -0.0128, -0.0029]], grad_fn=<SelectBackward>)"
            ]
          },
          "execution_count": 43,
          "metadata": {},
          "output_type": "execute_result"
        }
      ],
      "source": [
        "weights['layer1.1.conv2.weight'][0][0]"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "LnXdOk1lFLrz"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "8m2_2TePFLpj"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "foXm3S46FLne"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "SzTt6-muFLlb",
        "outputId": "f5c831bc-2be4-41e6-9ce5-03ebe1eb910d"
      },
      "outputs": [
        {
          "data": {
            "text/plain": [
              "True"
            ]
          },
          "execution_count": 64,
          "metadata": {},
          "output_type": "execute_result"
        }
      ],
      "source": [
        "\"model.trunk.base_model._feature_blocks.layer1.1.conv2.weight\" in  dict(model.named_parameters()).keys()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "ry9pd5QjFLi_"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "9yo_jAlo7A0k"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "kOvJKKDn7Ays"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "M5XN4-p6z6nV"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "KsOgxl0evzAU"
      },
      "outputs": [],
      "source": [
        "path = \"/content/my_trash/model_final_checkpoint_phase0.torch\"\n",
        "weights_fine = load_checkpoint(checkpoint_path=path)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "JXg9SYSrFng3",
        "outputId": "b68db883-8aed-4879-9509-64446c3e0506"
      },
      "outputs": [
        {
          "data": {
            "text/plain": [
              "dict_keys(['phase_idx', 'iteration', 'loss', 'iteration_num', 'train_phase_idx', 'classy_state_dict', 'type'])"
            ]
          },
          "execution_count": 89,
          "metadata": {},
          "output_type": "execute_result"
        }
      ],
      "source": [
        "weights_fine.keys()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "eFgJcRkqFtyB",
        "outputId": "c0598e9b-7223-40d6-e7d0-abbbc193253f"
      },
      "outputs": [
        {
          "data": {
            "text/plain": [
              "dict_keys(['train', 'base_model', 'meters', 'optimizer', 'phase_idx', 'train_phase_idx', 'num_updates', 'losses', 'hooks', 'loss', 'train_dataset_iterator'])"
            ]
          },
          "execution_count": 90,
          "metadata": {},
          "output_type": "execute_result"
        }
      ],
      "source": [
        "weights_fine[\"classy_state_dict\"].keys()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "lNkwF1IjFzwS",
        "outputId": "429bd695-22fa-4057-9a1f-ce04c4077985"
      },
      "outputs": [
        {
          "data": {
            "text/plain": [
              "dict_keys(['model', 'meta'])"
            ]
          },
          "execution_count": 91,
          "metadata": {},
          "output_type": "execute_result"
        }
      ],
      "source": [
        "weights_fine[\"classy_state_dict\"][\"base_model\"].keys()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "SdiHaCboF24U",
        "outputId": "0df691ed-fb2c-43c7-c3af-1e42b9e9c469"
      },
      "outputs": [
        {
          "data": {
            "text/plain": [
              "dict_keys(['model', 'meta'])"
            ]
          },
          "execution_count": 92,
          "metadata": {},
          "output_type": "execute_result"
        }
      ],
      "source": [
        "weights_fine[\"classy_state_dict\"][\"base_model\"].keys()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "K9nG5c1rGDS_",
        "outputId": "195649fc-224c-45cf-f4da-d57656c845ab"
      },
      "outputs": [
        {
          "data": {
            "text/plain": [
              "dict_keys(['trunk', 'heads'])"
            ]
          },
          "execution_count": 93,
          "metadata": {},
          "output_type": "execute_result"
        }
      ],
      "source": [
        "weights_fine[\"classy_state_dict\"][\"base_model\"][\"model\"].keys()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "6EXSGFDoGG41",
        "outputId": "85b74ba6-7c3f-44c1-c5c5-8dcfb7152c58"
      },
      "outputs": [
        {
          "data": {
            "text/plain": [
              "odict_keys(['base_model._feature_blocks.conv1.weight', 'base_model._feature_blocks.bn1.weight', 'base_model._feature_blocks.bn1.bias', 'base_model._feature_blocks.bn1.running_mean', 'base_model._feature_blocks.bn1.running_var', 'base_model._feature_blocks.bn1.num_batches_tracked', 'base_model._feature_blocks.layer1.0.conv1.weight', 'base_model._feature_blocks.layer1.0.bn1.weight', 'base_model._feature_blocks.layer1.0.bn1.bias', 'base_model._feature_blocks.layer1.0.bn1.running_mean', 'base_model._feature_blocks.layer1.0.bn1.running_var', 'base_model._feature_blocks.layer1.0.bn1.num_batches_tracked', 'base_model._feature_blocks.layer1.0.conv2.weight', 'base_model._feature_blocks.layer1.0.bn2.weight', 'base_model._feature_blocks.layer1.0.bn2.bias', 'base_model._feature_blocks.layer1.0.bn2.running_mean', 'base_model._feature_blocks.layer1.0.bn2.running_var', 'base_model._feature_blocks.layer1.0.bn2.num_batches_tracked', 'base_model._feature_blocks.layer1.0.conv3.weight', 'base_model._feature_blocks.layer1.0.bn3.weight', 'base_model._feature_blocks.layer1.0.bn3.bias', 'base_model._feature_blocks.layer1.0.bn3.running_mean', 'base_model._feature_blocks.layer1.0.bn3.running_var', 'base_model._feature_blocks.layer1.0.bn3.num_batches_tracked', 'base_model._feature_blocks.layer1.0.downsample.0.weight', 'base_model._feature_blocks.layer1.0.downsample.1.weight', 'base_model._feature_blocks.layer1.0.downsample.1.bias', 'base_model._feature_blocks.layer1.0.downsample.1.running_mean', 'base_model._feature_blocks.layer1.0.downsample.1.running_var', 'base_model._feature_blocks.layer1.0.downsample.1.num_batches_tracked', 'base_model._feature_blocks.layer1.1.conv1.weight', 'base_model._feature_blocks.layer1.1.bn1.weight', 'base_model._feature_blocks.layer1.1.bn1.bias', 'base_model._feature_blocks.layer1.1.bn1.running_mean', 'base_model._feature_blocks.layer1.1.bn1.running_var', 'base_model._feature_blocks.layer1.1.bn1.num_batches_tracked', 'base_model._feature_blocks.layer1.1.conv2.weight', 'base_model._feature_blocks.layer1.1.bn2.weight', 'base_model._feature_blocks.layer1.1.bn2.bias', 'base_model._feature_blocks.layer1.1.bn2.running_mean', 'base_model._feature_blocks.layer1.1.bn2.running_var', 'base_model._feature_blocks.layer1.1.bn2.num_batches_tracked', 'base_model._feature_blocks.layer1.1.conv3.weight', 'base_model._feature_blocks.layer1.1.bn3.weight', 'base_model._feature_blocks.layer1.1.bn3.bias', 'base_model._feature_blocks.layer1.1.bn3.running_mean', 'base_model._feature_blocks.layer1.1.bn3.running_var', 'base_model._feature_blocks.layer1.1.bn3.num_batches_tracked', 'base_model._feature_blocks.layer1.2.conv1.weight', 'base_model._feature_blocks.layer1.2.bn1.weight', 'base_model._feature_blocks.layer1.2.bn1.bias', 'base_model._feature_blocks.layer1.2.bn1.running_mean', 'base_model._feature_blocks.layer1.2.bn1.running_var', 'base_model._feature_blocks.layer1.2.bn1.num_batches_tracked', 'base_model._feature_blocks.layer1.2.conv2.weight', 'base_model._feature_blocks.layer1.2.bn2.weight', 'base_model._feature_blocks.layer1.2.bn2.bias', 'base_model._feature_blocks.layer1.2.bn2.running_mean', 'base_model._feature_blocks.layer1.2.bn2.running_var', 'base_model._feature_blocks.layer1.2.bn2.num_batches_tracked', 'base_model._feature_blocks.layer1.2.conv3.weight', 'base_model._feature_blocks.layer1.2.bn3.weight', 'base_model._feature_blocks.layer1.2.bn3.bias', 'base_model._feature_blocks.layer1.2.bn3.running_mean', 'base_model._feature_blocks.layer1.2.bn3.running_var', 'base_model._feature_blocks.layer1.2.bn3.num_batches_tracked', 'base_model._feature_blocks.layer2.0.conv1.weight', 'base_model._feature_blocks.layer2.0.bn1.weight', 'base_model._feature_blocks.layer2.0.bn1.bias', 'base_model._feature_blocks.layer2.0.bn1.running_mean', 'base_model._feature_blocks.layer2.0.bn1.running_var', 'base_model._feature_blocks.layer2.0.bn1.num_batches_tracked', 'base_model._feature_blocks.layer2.0.conv2.weight', 'base_model._feature_blocks.layer2.0.bn2.weight', 'base_model._feature_blocks.layer2.0.bn2.bias', 'base_model._feature_blocks.layer2.0.bn2.running_mean', 'base_model._feature_blocks.layer2.0.bn2.running_var', 'base_model._feature_blocks.layer2.0.bn2.num_batches_tracked', 'base_model._feature_blocks.layer2.0.conv3.weight', 'base_model._feature_blocks.layer2.0.bn3.weight', 'base_model._feature_blocks.layer2.0.bn3.bias', 'base_model._feature_blocks.layer2.0.bn3.running_mean', 'base_model._feature_blocks.layer2.0.bn3.running_var', 'base_model._feature_blocks.layer2.0.bn3.num_batches_tracked', 'base_model._feature_blocks.layer2.0.downsample.0.weight', 'base_model._feature_blocks.layer2.0.downsample.1.weight', 'base_model._feature_blocks.layer2.0.downsample.1.bias', 'base_model._feature_blocks.layer2.0.downsample.1.running_mean', 'base_model._feature_blocks.layer2.0.downsample.1.running_var', 'base_model._feature_blocks.layer2.0.downsample.1.num_batches_tracked', 'base_model._feature_blocks.layer2.1.conv1.weight', 'base_model._feature_blocks.layer2.1.bn1.weight', 'base_model._feature_blocks.layer2.1.bn1.bias', 'base_model._feature_blocks.layer2.1.bn1.running_mean', 'base_model._feature_blocks.layer2.1.bn1.running_var', 'base_model._feature_blocks.layer2.1.bn1.num_batches_tracked', 'base_model._feature_blocks.layer2.1.conv2.weight', 'base_model._feature_blocks.layer2.1.bn2.weight', 'base_model._feature_blocks.layer2.1.bn2.bias', 'base_model._feature_blocks.layer2.1.bn2.running_mean', 'base_model._feature_blocks.layer2.1.bn2.running_var', 'base_model._feature_blocks.layer2.1.bn2.num_batches_tracked', 'base_model._feature_blocks.layer2.1.conv3.weight', 'base_model._feature_blocks.layer2.1.bn3.weight', 'base_model._feature_blocks.layer2.1.bn3.bias', 'base_model._feature_blocks.layer2.1.bn3.running_mean', 'base_model._feature_blocks.layer2.1.bn3.running_var', 'base_model._feature_blocks.layer2.1.bn3.num_batches_tracked', 'base_model._feature_blocks.layer2.2.conv1.weight', 'base_model._feature_blocks.layer2.2.bn1.weight', 'base_model._feature_blocks.layer2.2.bn1.bias', 'base_model._feature_blocks.layer2.2.bn1.running_mean', 'base_model._feature_blocks.layer2.2.bn1.running_var', 'base_model._feature_blocks.layer2.2.bn1.num_batches_tracked', 'base_model._feature_blocks.layer2.2.conv2.weight', 'base_model._feature_blocks.layer2.2.bn2.weight', 'base_model._feature_blocks.layer2.2.bn2.bias', 'base_model._feature_blocks.layer2.2.bn2.running_mean', 'base_model._feature_blocks.layer2.2.bn2.running_var', 'base_model._feature_blocks.layer2.2.bn2.num_batches_tracked', 'base_model._feature_blocks.layer2.2.conv3.weight', 'base_model._feature_blocks.layer2.2.bn3.weight', 'base_model._feature_blocks.layer2.2.bn3.bias', 'base_model._feature_blocks.layer2.2.bn3.running_mean', 'base_model._feature_blocks.layer2.2.bn3.running_var', 'base_model._feature_blocks.layer2.2.bn3.num_batches_tracked', 'base_model._feature_blocks.layer2.3.conv1.weight', 'base_model._feature_blocks.layer2.3.bn1.weight', 'base_model._feature_blocks.layer2.3.bn1.bias', 'base_model._feature_blocks.layer2.3.bn1.running_mean', 'base_model._feature_blocks.layer2.3.bn1.running_var', 'base_model._feature_blocks.layer2.3.bn1.num_batches_tracked', 'base_model._feature_blocks.layer2.3.conv2.weight', 'base_model._feature_blocks.layer2.3.bn2.weight', 'base_model._feature_blocks.layer2.3.bn2.bias', 'base_model._feature_blocks.layer2.3.bn2.running_mean', 'base_model._feature_blocks.layer2.3.bn2.running_var', 'base_model._feature_blocks.layer2.3.bn2.num_batches_tracked', 'base_model._feature_blocks.layer2.3.conv3.weight', 'base_model._feature_blocks.layer2.3.bn3.weight', 'base_model._feature_blocks.layer2.3.bn3.bias', 'base_model._feature_blocks.layer2.3.bn3.running_mean', 'base_model._feature_blocks.layer2.3.bn3.running_var', 'base_model._feature_blocks.layer2.3.bn3.num_batches_tracked', 'base_model._feature_blocks.layer3.0.conv1.weight', 'base_model._feature_blocks.layer3.0.bn1.weight', 'base_model._feature_blocks.layer3.0.bn1.bias', 'base_model._feature_blocks.layer3.0.bn1.running_mean', 'base_model._feature_blocks.layer3.0.bn1.running_var', 'base_model._feature_blocks.layer3.0.bn1.num_batches_tracked', 'base_model._feature_blocks.layer3.0.conv2.weight', 'base_model._feature_blocks.layer3.0.bn2.weight', 'base_model._feature_blocks.layer3.0.bn2.bias', 'base_model._feature_blocks.layer3.0.bn2.running_mean', 'base_model._feature_blocks.layer3.0.bn2.running_var', 'base_model._feature_blocks.layer3.0.bn2.num_batches_tracked', 'base_model._feature_blocks.layer3.0.conv3.weight', 'base_model._feature_blocks.layer3.0.bn3.weight', 'base_model._feature_blocks.layer3.0.bn3.bias', 'base_model._feature_blocks.layer3.0.bn3.running_mean', 'base_model._feature_blocks.layer3.0.bn3.running_var', 'base_model._feature_blocks.layer3.0.bn3.num_batches_tracked', 'base_model._feature_blocks.layer3.0.downsample.0.weight', 'base_model._feature_blocks.layer3.0.downsample.1.weight', 'base_model._feature_blocks.layer3.0.downsample.1.bias', 'base_model._feature_blocks.layer3.0.downsample.1.running_mean', 'base_model._feature_blocks.layer3.0.downsample.1.running_var', 'base_model._feature_blocks.layer3.0.downsample.1.num_batches_tracked', 'base_model._feature_blocks.layer3.1.conv1.weight', 'base_model._feature_blocks.layer3.1.bn1.weight', 'base_model._feature_blocks.layer3.1.bn1.bias', 'base_model._feature_blocks.layer3.1.bn1.running_mean', 'base_model._feature_blocks.layer3.1.bn1.running_var', 'base_model._feature_blocks.layer3.1.bn1.num_batches_tracked', 'base_model._feature_blocks.layer3.1.conv2.weight', 'base_model._feature_blocks.layer3.1.bn2.weight', 'base_model._feature_blocks.layer3.1.bn2.bias', 'base_model._feature_blocks.layer3.1.bn2.running_mean', 'base_model._feature_blocks.layer3.1.bn2.running_var', 'base_model._feature_blocks.layer3.1.bn2.num_batches_tracked', 'base_model._feature_blocks.layer3.1.conv3.weight', 'base_model._feature_blocks.layer3.1.bn3.weight', 'base_model._feature_blocks.layer3.1.bn3.bias', 'base_model._feature_blocks.layer3.1.bn3.running_mean', 'base_model._feature_blocks.layer3.1.bn3.running_var', 'base_model._feature_blocks.layer3.1.bn3.num_batches_tracked', 'base_model._feature_blocks.layer3.2.conv1.weight', 'base_model._feature_blocks.layer3.2.bn1.weight', 'base_model._feature_blocks.layer3.2.bn1.bias', 'base_model._feature_blocks.layer3.2.bn1.running_mean', 'base_model._feature_blocks.layer3.2.bn1.running_var', 'base_model._feature_blocks.layer3.2.bn1.num_batches_tracked', 'base_model._feature_blocks.layer3.2.conv2.weight', 'base_model._feature_blocks.layer3.2.bn2.weight', 'base_model._feature_blocks.layer3.2.bn2.bias', 'base_model._feature_blocks.layer3.2.bn2.running_mean', 'base_model._feature_blocks.layer3.2.bn2.running_var', 'base_model._feature_blocks.layer3.2.bn2.num_batches_tracked', 'base_model._feature_blocks.layer3.2.conv3.weight', 'base_model._feature_blocks.layer3.2.bn3.weight', 'base_model._feature_blocks.layer3.2.bn3.bias', 'base_model._feature_blocks.layer3.2.bn3.running_mean', 'base_model._feature_blocks.layer3.2.bn3.running_var', 'base_model._feature_blocks.layer3.2.bn3.num_batches_tracked', 'base_model._feature_blocks.layer3.3.conv1.weight', 'base_model._feature_blocks.layer3.3.bn1.weight', 'base_model._feature_blocks.layer3.3.bn1.bias', 'base_model._feature_blocks.layer3.3.bn1.running_mean', 'base_model._feature_blocks.layer3.3.bn1.running_var', 'base_model._feature_blocks.layer3.3.bn1.num_batches_tracked', 'base_model._feature_blocks.layer3.3.conv2.weight', 'base_model._feature_blocks.layer3.3.bn2.weight', 'base_model._feature_blocks.layer3.3.bn2.bias', 'base_model._feature_blocks.layer3.3.bn2.running_mean', 'base_model._feature_blocks.layer3.3.bn2.running_var', 'base_model._feature_blocks.layer3.3.bn2.num_batches_tracked', 'base_model._feature_blocks.layer3.3.conv3.weight', 'base_model._feature_blocks.layer3.3.bn3.weight', 'base_model._feature_blocks.layer3.3.bn3.bias', 'base_model._feature_blocks.layer3.3.bn3.running_mean', 'base_model._feature_blocks.layer3.3.bn3.running_var', 'base_model._feature_blocks.layer3.3.bn3.num_batches_tracked', 'base_model._feature_blocks.layer3.4.conv1.weight', 'base_model._feature_blocks.layer3.4.bn1.weight', 'base_model._feature_blocks.layer3.4.bn1.bias', 'base_model._feature_blocks.layer3.4.bn1.running_mean', 'base_model._feature_blocks.layer3.4.bn1.running_var', 'base_model._feature_blocks.layer3.4.bn1.num_batches_tracked', 'base_model._feature_blocks.layer3.4.conv2.weight', 'base_model._feature_blocks.layer3.4.bn2.weight', 'base_model._feature_blocks.layer3.4.bn2.bias', 'base_model._feature_blocks.layer3.4.bn2.running_mean', 'base_model._feature_blocks.layer3.4.bn2.running_var', 'base_model._feature_blocks.layer3.4.bn2.num_batches_tracked', 'base_model._feature_blocks.layer3.4.conv3.weight', 'base_model._feature_blocks.layer3.4.bn3.weight', 'base_model._feature_blocks.layer3.4.bn3.bias', 'base_model._feature_blocks.layer3.4.bn3.running_mean', 'base_model._feature_blocks.layer3.4.bn3.running_var', 'base_model._feature_blocks.layer3.4.bn3.num_batches_tracked', 'base_model._feature_blocks.layer3.5.conv1.weight', 'base_model._feature_blocks.layer3.5.bn1.weight', 'base_model._feature_blocks.layer3.5.bn1.bias', 'base_model._feature_blocks.layer3.5.bn1.running_mean', 'base_model._feature_blocks.layer3.5.bn1.running_var', 'base_model._feature_blocks.layer3.5.bn1.num_batches_tracked', 'base_model._feature_blocks.layer3.5.conv2.weight', 'base_model._feature_blocks.layer3.5.bn2.weight', 'base_model._feature_blocks.layer3.5.bn2.bias', 'base_model._feature_blocks.layer3.5.bn2.running_mean', 'base_model._feature_blocks.layer3.5.bn2.running_var', 'base_model._feature_blocks.layer3.5.bn2.num_batches_tracked', 'base_model._feature_blocks.layer3.5.conv3.weight', 'base_model._feature_blocks.layer3.5.bn3.weight', 'base_model._feature_blocks.layer3.5.bn3.bias', 'base_model._feature_blocks.layer3.5.bn3.running_mean', 'base_model._feature_blocks.layer3.5.bn3.running_var', 'base_model._feature_blocks.layer3.5.bn3.num_batches_tracked', 'base_model._feature_blocks.layer4.0.conv1.weight', 'base_model._feature_blocks.layer4.0.bn1.weight', 'base_model._feature_blocks.layer4.0.bn1.bias', 'base_model._feature_blocks.layer4.0.bn1.running_mean', 'base_model._feature_blocks.layer4.0.bn1.running_var', 'base_model._feature_blocks.layer4.0.bn1.num_batches_tracked', 'base_model._feature_blocks.layer4.0.conv2.weight', 'base_model._feature_blocks.layer4.0.bn2.weight', 'base_model._feature_blocks.layer4.0.bn2.bias', 'base_model._feature_blocks.layer4.0.bn2.running_mean', 'base_model._feature_blocks.layer4.0.bn2.running_var', 'base_model._feature_blocks.layer4.0.bn2.num_batches_tracked', 'base_model._feature_blocks.layer4.0.conv3.weight', 'base_model._feature_blocks.layer4.0.bn3.weight', 'base_model._feature_blocks.layer4.0.bn3.bias', 'base_model._feature_blocks.layer4.0.bn3.running_mean', 'base_model._feature_blocks.layer4.0.bn3.running_var', 'base_model._feature_blocks.layer4.0.bn3.num_batches_tracked', 'base_model._feature_blocks.layer4.0.downsample.0.weight', 'base_model._feature_blocks.layer4.0.downsample.1.weight', 'base_model._feature_blocks.layer4.0.downsample.1.bias', 'base_model._feature_blocks.layer4.0.downsample.1.running_mean', 'base_model._feature_blocks.layer4.0.downsample.1.running_var', 'base_model._feature_blocks.layer4.0.downsample.1.num_batches_tracked', 'base_model._feature_blocks.layer4.1.conv1.weight', 'base_model._feature_blocks.layer4.1.bn1.weight', 'base_model._feature_blocks.layer4.1.bn1.bias', 'base_model._feature_blocks.layer4.1.bn1.running_mean', 'base_model._feature_blocks.layer4.1.bn1.running_var', 'base_model._feature_blocks.layer4.1.bn1.num_batches_tracked', 'base_model._feature_blocks.layer4.1.conv2.weight', 'base_model._feature_blocks.layer4.1.bn2.weight', 'base_model._feature_blocks.layer4.1.bn2.bias', 'base_model._feature_blocks.layer4.1.bn2.running_mean', 'base_model._feature_blocks.layer4.1.bn2.running_var', 'base_model._feature_blocks.layer4.1.bn2.num_batches_tracked', 'base_model._feature_blocks.layer4.1.conv3.weight', 'base_model._feature_blocks.layer4.1.bn3.weight', 'base_model._feature_blocks.layer4.1.bn3.bias', 'base_model._feature_blocks.layer4.1.bn3.running_mean', 'base_model._feature_blocks.layer4.1.bn3.running_var', 'base_model._feature_blocks.layer4.1.bn3.num_batches_tracked', 'base_model._feature_blocks.layer4.2.conv1.weight', 'base_model._feature_blocks.layer4.2.bn1.weight', 'base_model._feature_blocks.layer4.2.bn1.bias', 'base_model._feature_blocks.layer4.2.bn1.running_mean', 'base_model._feature_blocks.layer4.2.bn1.running_var', 'base_model._feature_blocks.layer4.2.bn1.num_batches_tracked', 'base_model._feature_blocks.layer4.2.conv2.weight', 'base_model._feature_blocks.layer4.2.bn2.weight', 'base_model._feature_blocks.layer4.2.bn2.bias', 'base_model._feature_blocks.layer4.2.bn2.running_mean', 'base_model._feature_blocks.layer4.2.bn2.running_var', 'base_model._feature_blocks.layer4.2.bn2.num_batches_tracked', 'base_model._feature_blocks.layer4.2.conv3.weight', 'base_model._feature_blocks.layer4.2.bn3.weight', 'base_model._feature_blocks.layer4.2.bn3.bias', 'base_model._feature_blocks.layer4.2.bn3.running_mean', 'base_model._feature_blocks.layer4.2.bn3.running_var', 'base_model._feature_blocks.layer4.2.bn3.num_batches_tracked'])"
            ]
          },
          "execution_count": 95,
          "metadata": {},
          "output_type": "execute_result"
        }
      ],
      "source": [
        "weights_fine[\"classy_state_dict\"][\"base_model\"][\"model\"][\"trunk\"].keys()\n",
        "# 'base_model._feature_blocks.layer1.1.conv2.weight'\n",
        "# \"model.trunk.base_model._feature_blocks.layer1.1.conv2.weight\""
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "_P81o02LGbRx",
        "outputId": "744d621c-9415-493b-d4d4-c97d960d8240"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "[tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True), tensor(True)]\n"
          ]
        }
      ],
      "source": [
        "print(list((weights_fine[\"classy_state_dict\"][\"base_model\"][\"model\"][\"trunk\"]['base_model._feature_blocks.layer1.1.conv2.weight'][i] == weights['layer1.1.conv2.weight'][i]).all() for i in range(63)))"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "O55ao8QmGbOo"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "HdlUfYoiGbM3"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "MAvxux36GbJu"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "i2bbIfnTGbHc"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "FOW5Xpc1GbFM"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "ny15TIPdGbCx"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "Iq3pxgPXGbAt"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "ZBjgE2FoP5CY",
        "outputId": "9a468954-eb47-4142-e637-391e2229da8e"
      },
      "outputs": [
        {
          "data": {
            "text/plain": [
              "odict_keys(['0.channel_bn.weight', '0.channel_bn.bias', '0.channel_bn.running_mean', '0.channel_bn.running_var', '0.channel_bn.num_batches_tracked', '0.clf.clf.0.weight', '0.clf.clf.0.bias'])"
            ]
          },
          "execution_count": 15,
          "metadata": {},
          "output_type": "execute_result"
        }
      ],
      "source": [
        "weights_fine[\"classy_state_dict\"][\"base_model\"][\"model\"][\"heads\"].keys()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "fWFqi_YBTboY",
        "outputId": "8b65227b-5120-4564-8a83-dde9b6f34c63"
      },
      "outputs": [
        {
          "data": {
            "text/plain": [
              "OrderedDict([('0.channel_bn.weight',\n",
              "              tensor([0.9998, 1.0005, 0.9999,  ..., 0.9997, 1.0006, 0.9998])),\n",
              "             ('0.channel_bn.bias',\n",
              "              tensor([ 9.9867e-05, -3.8489e-04, -3.0766e-04,  ..., -1.4030e-03,\n",
              "                       2.4626e-03,  2.2532e-03])),\n",
              "             ('0.channel_bn.running_mean',\n",
              "              tensor([0.2238, 1.1536, 0.5294,  ..., 0.2779, 0.1010, 0.2715])),\n",
              "             ('0.channel_bn.running_var',\n",
              "              tensor([0.0308, 0.3914, 0.0656,  ..., 0.0433, 0.0140, 0.0228])),\n",
              "             ('0.channel_bn.num_batches_tracked', tensor(938)),\n",
              "             ('0.clf.clf.0.weight',\n",
              "              tensor([[-0.0122, -0.0241, -0.0210,  ..., -0.0123, -0.0067, -0.0121],\n",
              "                      [-0.0103, -0.0022,  0.0225,  ..., -0.0041,  0.0174, -0.0038],\n",
              "                      [ 0.0040,  0.0027, -0.0244,  ..., -0.0141,  0.0334,  0.0059],\n",
              "                      ...,\n",
              "                      [-0.0175, -0.0161, -0.0039,  ..., -0.0259, -0.0079, -0.0166],\n",
              "                      [ 0.0196, -0.0266, -0.0120,  ..., -0.0199, -0.0092, -0.0073],\n",
              "                      [ 0.0088,  0.0156,  0.0167,  ..., -0.0203, -0.0129, -0.0096]])),\n",
              "             ('0.clf.clf.0.bias',\n",
              "              tensor([-0.0557, -0.0497,  0.0645, -0.0296, -0.0325, -0.0054,  0.0049,  0.0192,\n",
              "                       0.0123,  0.0538]))])"
            ]
          },
          "execution_count": 16,
          "metadata": {},
          "output_type": "execute_result"
        }
      ],
      "source": [
        "weights[\"classy_state_dict\"][\"base_model\"][\"model\"][\"heads\"]\n",
        "# running_mean and runnin_var parameters are here."
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 35
        },
        "id": "F2uqb9dqT_0g",
        "outputId": "4ec49f58-ae88-4052-ab7b-4264d5e5a6cc"
      },
      "outputs": [
        {
          "data": {
            "application/vnd.google.colaboratory.intrinsic+json": {
              "type": "string"
            },
            "text/plain": [
              "'heads.0.channel_bn.weight'"
            ]
          },
          "execution_count": 17,
          "metadata": {},
          "output_type": "execute_result"
        }
      ],
      "source": [
        "list(dict(model.model.named_parameters()).keys())[-4]"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "b9glnreUT_xW",
        "outputId": "8e463405-5663-4896-98e3-4bdccfd0efe8"
      },
      "outputs": [
        {
          "data": {
            "text/plain": [
              "Parameter containing:\n",
              "tensor([0.9998, 1.0005, 0.9999,  ..., 0.9997, 1.0006, 0.9998], device='cuda:0')"
            ]
          },
          "execution_count": 18,
          "metadata": {},
          "output_type": "execute_result"
        }
      ],
      "source": [
        "dict(model.model.named_parameters())[\"heads.0.channel_bn.weight\"]"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "ukL3Lc7aT_vR"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "zEO3BussP49f"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "h8it6CkUvy8H"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": 1,
      "metadata": {
        "id": "4WaMBNljQy2d"
      },
      "outputs": [
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "2023-02-21 21:42:09.992469: I tensorflow/core/util/util.cc:169] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.\n"
          ]
        },
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "<pad> Wie alte sind Sie?</s>\n"
          ]
        }
      ],
      "source": [
        "from transformers import T5Tokenizer, T5ForConditionalGeneration\n",
        "\n",
        "tokenizer = T5Tokenizer.from_pretrained(\"google/flan-t5-large\")\n",
        "model = T5ForConditionalGeneration.from_pretrained(\"google/flan-t5-large\", device_map=\"auto\")\n",
        "\n",
        "input_text = \"translate English to German: How old are you?\"\n",
        "input_ids = tokenizer(input_text, return_tensors=\"pt\").input_ids.to(\"cuda\")\n",
        "\n",
        "outputs = model.generate(input_ids)\n",
        "print(tokenizer.decode(outputs[0]))"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 2,
      "metadata": {},
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "\u001b[0;31mSignature:\u001b[0m\n",
            "\u001b[0mmodel\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgenerate\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0minputs\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mtorch\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mTensor\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mmax_length\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mmin_length\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mdo_sample\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mbool\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mearly_stopping\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mbool\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mnum_beams\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mtemperature\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mfloat\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mtop_k\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mtop_p\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mfloat\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mtypical_p\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mfloat\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mrepetition_penalty\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mfloat\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mbad_words_ids\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mIterable\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mforce_words_ids\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mIterable\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mIterable\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mIterable\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mbos_token_id\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mpad_token_id\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0meos_token_id\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mlength_penalty\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mfloat\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mno_repeat_ngram_size\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mencoder_no_repeat_ngram_size\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mnum_return_sequences\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mmax_time\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mfloat\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mmax_new_tokens\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mdecoder_start_token_id\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0muse_cache\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mbool\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mnum_beam_groups\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mdiversity_penalty\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mfloat\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mprefix_allowed_tokens_fn\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mCallable\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtorch\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mTensor\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mList\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mlogits_processor\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mtransformers\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgeneration_logits_process\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mLogitsProcessorList\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mrenormalize_logits\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mbool\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mstopping_criteria\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mtransformers\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgeneration_stopping_criteria\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mStoppingCriteriaList\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mconstraints\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mList\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mtransformers\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgeneration_beam_constraints\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mConstraint\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0moutput_attentions\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mbool\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0moutput_hidden_states\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mbool\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0moutput_scores\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mbool\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mreturn_dict_in_generate\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mbool\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mforced_bos_token_id\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mforced_eos_token_id\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mremove_invalid_values\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mbool\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0msynced_gpus\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mbool\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mFalse\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0mexponential_decay_length_penalty\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mTuple\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mfloat\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mNoneType\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m    \u001b[0;34m**\u001b[0m\u001b[0mmodel_kwargs\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\n",
            "\u001b[0;34m\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m->\u001b[0m \u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mtransformers\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgeneration_utils\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mGreedySearchEncoderDecoderOutput\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtransformers\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgeneration_utils\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mGreedySearchDecoderOnlyOutput\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtransformers\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgeneration_utils\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mSampleEncoderDecoderOutput\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtransformers\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgeneration_utils\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mSampleDecoderOnlyOutput\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtransformers\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgeneration_utils\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mBeamSearchEncoderDecoderOutput\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtransformers\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgeneration_utils\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mBeamSearchDecoderOnlyOutput\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtransformers\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgeneration_utils\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mBeamSampleEncoderDecoderOutput\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtransformers\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgeneration_utils\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mBeamSampleDecoderOnlyOutput\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtorch\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mLongTensor\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
            "\u001b[0;31mDocstring:\u001b[0m\n",
            "Generates sequences of token ids for models with a language modeling head. The method supports the following\n",
            "generation methods for text-decoder, text-to-text, speech-to-text, and vision-to-text models:\n",
            "\n",
            "    - *greedy decoding* by calling [`~generation_utils.GenerationMixin.greedy_search`] if `num_beams=1` and\n",
            "      `do_sample=False`.\n",
            "    - *multinomial sampling* by calling [`~generation_utils.GenerationMixin.sample`] if `num_beams=1` and\n",
            "      `do_sample=True`.\n",
            "    - *beam-search decoding* by calling [`~generation_utils.GenerationMixin.beam_search`] if `num_beams>1` and\n",
            "      `do_sample=False`.\n",
            "    - *beam-search multinomial sampling* by calling [`~generation_utils.GenerationMixin.beam_sample`] if\n",
            "      `num_beams>1` and `do_sample=True`.\n",
            "    - *diverse beam-search decoding* by calling [`~generation_utils.GenerationMixin.group_beam_search`], if\n",
            "      `num_beams>1` and `num_beam_groups>1`.\n",
            "    - *constrained beam-search decoding* by calling\n",
            "      [`~generation_utils.GenerationMixin.constrained_beam_search`], if `constraints!=None` or\n",
            "      `force_words_ids!=None`.\n",
            "\n",
            "<Tip warning={true}>\n",
            "\n",
            "Apart from `inputs`, all the arguments below will default to the value of the attribute of the same name as\n",
            "defined in the model's config (`config.json`) which in turn defaults to the\n",
            "[`~modeling_utils.PretrainedConfig`] of the model.\n",
            "\n",
            "</Tip>\n",
            "\n",
            "Most of these parameters are explained in more detail in [this blog\n",
            "post](https://huggingface.co/blog/how-to-generate).\n",
            "\n",
            "Parameters:\n",
            "    inputs (`torch.Tensor` of varying shape depending on the modality, *optional*):\n",
            "        The sequence used as a prompt for the generation or as model inputs to the encoder. If `None` the\n",
            "        method initializes it with `bos_token_id` and a batch size of 1. For decoder-only models `inputs`\n",
            "        should of in the format of `input_ids`. For encoder-decoder models *inputs* can represent any of\n",
            "        `input_ids`, `input_values`, `input_features`, or `pixel_values`.\n",
            "    max_length (`int`, *optional*, defaults to `model.config.max_length`):\n",
            "        The maximum length of the sequence to be generated.\n",
            "    max_new_tokens (`int`, *optional*, defaults to None):\n",
            "        The maximum numbers of tokens to generate, ignore the current number of tokens. Use either\n",
            "        `max_new_tokens` or `max_length` but not both, they serve the same purpose.\n",
            "    min_length (`int`, *optional*, defaults to 10):\n",
            "        The minimum length of the sequence to be generated.\n",
            "    do_sample (`bool`, *optional*, defaults to `False`):\n",
            "        Whether or not to use sampling ; use greedy decoding otherwise.\n",
            "    early_stopping (`bool`, *optional*, defaults to `False`):\n",
            "        Whether to stop the beam search when at least `num_beams` sentences are finished per batch or not.\n",
            "    num_beams (`int`, *optional*, defaults to 1):\n",
            "        Number of beams for beam search. 1 means no beam search.\n",
            "    temperature (`float`, *optional*, defaults to 1.0):\n",
            "        The value used to module the next token probabilities.\n",
            "    top_k (`int`, *optional*, defaults to 50):\n",
            "        The number of highest probability vocabulary tokens to keep for top-k-filtering.\n",
            "    top_p (`float`, *optional*, defaults to 1.0):\n",
            "        If set to float < 1, only the most probable tokens with probabilities that add up to `top_p` or higher\n",
            "        are kept for generation.\n",
            "    typical_p (`float`, *optional*, defaults to 1.0):\n",
            "        The amount of probability mass from the original distribution to be considered in typical decoding. If\n",
            "        set to 1.0 it takes no effect. See [this paper](https://arxiv.org/pdf/2202.00666.pdf) for more details.\n",
            "    repetition_penalty (`float`, *optional*, defaults to 1.0):\n",
            "        The parameter for repetition penalty. 1.0 means no penalty. See [this\n",
            "        paper](https://arxiv.org/pdf/1909.05858.pdf) for more details.\n",
            "    pad_token_id (`int`, *optional*):\n",
            "        The id of the *padding* token.\n",
            "    bos_token_id (`int`, *optional*):\n",
            "        The id of the *beginning-of-sequence* token.\n",
            "    eos_token_id (`int`, *optional*):\n",
            "        The id of the *end-of-sequence* token.\n",
            "    length_penalty (`float`, *optional*, defaults to 1.0):\n",
            "         Exponential penalty to the length. 1.0 means that the beam score is penalized by the sequence length.\n",
            "         0.0 means no penalty. Set to values < 0.0 in order to encourage the model to generate longer\n",
            "         sequences, to a value > 0.0 in order to encourage the model to produce shorter sequences.\n",
            "    no_repeat_ngram_size (`int`, *optional*, defaults to 0):\n",
            "        If set to int > 0, all ngrams of that size can only occur once.\n",
            "    encoder_no_repeat_ngram_size (`int`, *optional*, defaults to 0):\n",
            "        If set to int > 0, all ngrams of that size that occur in the `encoder_input_ids` cannot occur in the\n",
            "        `decoder_input_ids`.\n",
            "    bad_words_ids(`List[List[int]]`, *optional*):\n",
            "        List of token ids that are not allowed to be generated. In order to get the token ids of the words that\n",
            "        should not appear in the generated text, use `tokenizer(bad_words, add_prefix_space=True,\n",
            "        add_special_tokens=False).input_ids`.\n",
            "    force_words_ids(`List[List[int]]` or `List[List[List[int]]]`, *optional*):\n",
            "        List of token ids that must be generated. If given a `List[List[int]]`, this is treated as a simple\n",
            "        list of words that must be included, the opposite to `bad_words_ids`. If given `List[List[List[int]]]`,\n",
            "        this triggers a [disjunctive constraint](https://github.com/huggingface/transformers/issues/14081),\n",
            "        where one can allow different forms of each word.\n",
            "    num_return_sequences(`int`, *optional*, defaults to 1):\n",
            "        The number of independently computed returned sequences for each element in the batch.\n",
            "    max_time(`float`, *optional*, defaults to None):\n",
            "        The maximum amount of time you allow the computation to run for in seconds. generation will still\n",
            "        finish the current pass after allocated time has been passed.\n",
            "    attention_mask (`torch.LongTensor` of shape `(batch_size, sequence_length)`, *optional*):\n",
            "        Mask to avoid performing attention on padding token indices. Mask values are in `[0, 1]`, 1 for tokens\n",
            "        that are not masked, and 0 for masked tokens. If not provided, will default to a tensor the same shape\n",
            "        as `input_ids` that masks the pad token. [What are attention masks?](../glossary#attention-mask)\n",
            "    decoder_start_token_id (`int`, *optional*):\n",
            "        If an encoder-decoder model starts decoding with a different token than *bos*, the id of that token.\n",
            "    use_cache: (`bool`, *optional*, defaults to `True`):\n",
            "        Whether or not the model should use the past last key/values attentions (if applicable to the model) to\n",
            "        speed up decoding.\n",
            "    num_beam_groups (`int`, *optional*, defaults to 1):\n",
            "        Number of groups to divide `num_beams` into in order to ensure diversity among different groups of\n",
            "        beams. [this paper](https://arxiv.org/pdf/1610.02424.pdf) for more details.\n",
            "    diversity_penalty (`float`, *optional*, defaults to 0.0):\n",
            "        This value is subtracted from a beam's score if it generates a token same as any beam from other group\n",
            "        at a particular time. Note that `diversity_penalty` is only effective if `group beam search` is\n",
            "        enabled.\n",
            "    prefix_allowed_tokens_fn (`Callable[[int, torch.Tensor], List[int]]`, *optional*):\n",
            "        If provided, this function constraints the beam search to allowed tokens only at each step. If not\n",
            "        provided no constraint is applied. This function takes 2 arguments: the batch ID `batch_id` and\n",
            "        `input_ids`. It has to return a list with the allowed tokens for the next generation step conditioned\n",
            "        on the batch ID `batch_id` and the previously generated tokens `inputs_ids`. This argument is useful\n",
            "        for constrained generation conditioned on the prefix, as described in [Autoregressive Entity\n",
            "        Retrieval](https://arxiv.org/abs/2010.00904).\n",
            "    logits_processor (`LogitsProcessorList`, *optional*):\n",
            "         Custom logits processors that complement the default logits processors built from arguments and a\n",
            "         model's config. If a logit processor is passed that is already created with the arguments or a model's\n",
            "         config an error is thrown. This feature is intended for advanced users.\n",
            "    renormalize_logits: (`bool`, *optional*, defaults to `False`):\n",
            "        Whether to renormalize the logits after applying all the logits processors or warpers (including the\n",
            "        custom ones). It's highly recommended to set this flag to `True` as the search algorithms suppose the\n",
            "        score logits are normalized but some logit processors or warpers break the normalization.\n",
            "    stopping_criteria (`StoppingCriteriaList`, *optional*):\n",
            "         Custom stopping criteria that complement the default stopping criteria built from arguments and a\n",
            "         model's config. If a stopping criteria is passed that is already created with the arguments or a\n",
            "         model's config an error is thrown. This feature is intended for advanced users.\n",
            "    constraints (`List[Constraint]`, *optional*):\n",
            "         Custom constraints that can be added to the generation to ensure that the output will contain the use\n",
            "         of certain tokens as defined by `Constraint` objects, in the most sensible way possible.\n",
            "    output_attentions (`bool`, *optional*, defaults to `False`):\n",
            "        Whether or not to return the attentions tensors of all attention layers. See `attentions` under\n",
            "        returned tensors for more details.\n",
            "    output_hidden_states (`bool`, *optional*, defaults to `False`):\n",
            "        Whether or not to return the hidden states of all layers. See `hidden_states` under returned tensors\n",
            "        for more details.\n",
            "    output_scores (`bool`, *optional*, defaults to `False`):\n",
            "        Whether or not to return the prediction scores. See `scores` under returned tensors for more details.\n",
            "    return_dict_in_generate (`bool`, *optional*, defaults to `False`):\n",
            "        Whether or not to return a [`~utils.ModelOutput`] instead of a plain tuple.\n",
            "    forced_bos_token_id (`int`, *optional*):\n",
            "        The id of the token to force as the first generated token after the `decoder_start_token_id`. Useful\n",
            "        for multilingual models like [mBART](../model_doc/mbart) where the first generated token needs to be\n",
            "        the target language token.\n",
            "    forced_eos_token_id (`int`, *optional*):\n",
            "        The id of the token to force as the last generated token when `max_length` is reached.\n",
            "    remove_invalid_values (`bool`, *optional*):\n",
            "        Whether to remove possible *nan* and *inf* outputs of the model to prevent the generation method to\n",
            "        crash. Note that using `remove_invalid_values` can slow down generation.\n",
            "    synced_gpus (`bool`, *optional*, defaults to `False`):\n",
            "        Whether to continue running the while loop until max_length (needed for ZeRO stage 3)\n",
            "    exponential_decay_length_penalty (`tuple(int, float)`, *optional*):\n",
            "        This Tuple adds an exponentially increasing length penalty, after a certain amount of tokens have been\n",
            "        generated. The tuple shall consist of: `(start_index, decay_factor)` where `start_index` indicates\n",
            "        where penalty starts and `decay_factor` represents the factor of exponential decay\n",
            "\n",
            "    model_kwargs:\n",
            "        Additional model specific kwargs will be forwarded to the `forward` function of the model. If the model\n",
            "        is an encoder-decoder model, encoder specific kwargs should not be prefixed and decoder specific kwargs\n",
            "        should be prefixed with *decoder_*.\n",
            "\n",
            "Return:\n",
            "    [`~utils.ModelOutput`] or `torch.LongTensor`: A [`~utils.ModelOutput`] (if `return_dict_in_generate=True`\n",
            "    or when `config.return_dict_in_generate=True`) or a `torch.FloatTensor`.\n",
            "\n",
            "        If the model is *not* an encoder-decoder model (`model.config.is_encoder_decoder=False`), the possible\n",
            "        [`~utils.ModelOutput`] types are:\n",
            "\n",
            "            - [`~generation_utils.GreedySearchDecoderOnlyOutput`],\n",
            "            - [`~generation_utils.SampleDecoderOnlyOutput`],\n",
            "            - [`~generation_utils.BeamSearchDecoderOnlyOutput`],\n",
            "            - [`~generation_utils.BeamSampleDecoderOnlyOutput`]\n",
            "\n",
            "        If the model is an encoder-decoder model (`model.config.is_encoder_decoder=True`), the possible\n",
            "        [`~utils.ModelOutput`] types are:\n",
            "\n",
            "            - [`~generation_utils.GreedySearchEncoderDecoderOutput`],\n",
            "            - [`~generation_utils.SampleEncoderDecoderOutput`],\n",
            "            - [`~generation_utils.BeamSearchEncoderDecoderOutput`],\n",
            "            - [`~generation_utils.BeamSampleEncoderDecoderOutput`]\n",
            "\n",
            "Examples:\n",
            "\n",
            "Greedy Decoding:\n",
            "\n",
            "```python\n",
            ">>> from transformers import AutoTokenizer, AutoModelForCausalLM\n",
            "\n",
            ">>> tokenizer = AutoTokenizer.from_pretrained(\"gpt2\")\n",
            ">>> model = AutoModelForCausalLM.from_pretrained(\"gpt2\")\n",
            "\n",
            ">>> prompt = \"Today I believe we can finally\"\n",
            ">>> input_ids = tokenizer(prompt, return_tensors=\"pt\").input_ids\n",
            "\n",
            ">>> # generate up to 30 tokens\n",
            ">>> outputs = model.generate(input_ids, do_sample=False, max_length=30)\n",
            ">>> tokenizer.batch_decode(outputs, skip_special_tokens=True)\n",
            "['Today I believe we can finally get to the point where we can make a difference in the lives of the people of the United States of America.\\n']\n",
            "```\n",
            "\n",
            "Multinomial Sampling:\n",
            "\n",
            "```python\n",
            ">>> from transformers import AutoTokenizer, AutoModelForCausalLM\n",
            ">>> import torch\n",
            "\n",
            ">>> tokenizer = AutoTokenizer.from_pretrained(\"gpt2\")\n",
            ">>> model = AutoModelForCausalLM.from_pretrained(\"gpt2\")\n",
            "\n",
            ">>> prompt = \"Today I believe we can finally\"\n",
            ">>> input_ids = tokenizer(prompt, return_tensors=\"pt\").input_ids\n",
            "\n",
            ">>> # sample up to 30 tokens\n",
            ">>> torch.manual_seed(0)  # doctest: +IGNORE_RESULT\n",
            ">>> outputs = model.generate(input_ids, do_sample=True, max_length=30)\n",
            ">>> tokenizer.batch_decode(outputs, skip_special_tokens=True)\n",
            "['Today I believe we can finally get rid of discrimination,\" said Rep. Mark Pocan (D-Wis.).\\n\\n\"Just look at the']\n",
            "```\n",
            "\n",
            "Beam-search decoding:\n",
            "\n",
            "```python\n",
            ">>> from transformers import AutoTokenizer, AutoModelForSeq2SeqLM\n",
            "\n",
            ">>> tokenizer = AutoTokenizer.from_pretrained(\"Helsinki-NLP/opus-mt-en-de\")\n",
            ">>> model = AutoModelForSeq2SeqLM.from_pretrained(\"Helsinki-NLP/opus-mt-en-de\")\n",
            "\n",
            ">>> sentence = \"Paris is one of the densest populated areas in Europe.\"\n",
            ">>> input_ids = tokenizer(sentence, return_tensors=\"pt\").input_ids\n",
            "\n",
            ">>> outputs = model.generate(input_ids)\n",
            ">>> tokenizer.batch_decode(outputs, skip_special_tokens=True)\n",
            "['Paris ist eines der dichtesten besiedelten Gebiete Europas.']\n",
            "```\n",
            "\u001b[0;31mFile:\u001b[0m      ~/anaconda3/envs/nlp_lite/lib/python3.8/site-packages/transformers/generation_utils.py\n",
            "\u001b[0;31mType:\u001b[0m      method\n"
          ]
        }
      ],
      "source": [
        "?model.generate"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {},
      "outputs": [],
      "source": [
        "pred = ['cat', 'cat', 'the', 'is']\n",
        "gt = ['cat', 'the', 'road', 'is']\n",
        "\n",
        "pred = set(list(pred))\n",
        "gt = set(list(gt))\n",
        "\n",
        "def subs_overlap(pred, gt):\n",
        "    ans = 0.0\n",
        "    for p in pred:\n",
        "        if p in gt:\n",
        "            ans += 1.0\n",
        "    return ans / len(pred)\n",
        "\n",
        "subs_overlap(pred, gt)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {},
      "outputs": [],
      "source": [
        "# qstat all the job that are queried\n",
        "\n",
        "!qsstat -u $USER | grep -v \"job-ID\" | awk '{print $1}' | xargs -I {qsstat -u $USER | grep -v \"job-ID\" | awk '{print $1}' | xargs -I {} qdel {}} qdel {}"
      ]
    }
  ],
  "metadata": {
    "accelerator": "GPU",
    "colab": {
      "provenance": []
    },
    "gpuClass": "standard",
    "kernelspec": {
      "display_name": "Python 3.8.12 ('nlp_lite')",
      "language": "python",
      "name": "python3"
    },
    "language_info": {
      "codemirror_mode": {
        "name": "ipython",
        "version": 3
      },
      "file_extension": ".py",
      "mimetype": "text/x-python",
      "name": "python",
      "nbconvert_exporter": "python",
      "pygments_lexer": "ipython3",
      "version": "3.8.12"
    },
    "vscode": {
      "interpreter": {
        "hash": "1b561071db17c4e9f20bafb28e072113f0a8643294a26e1354618f8374742fb0"
      }
    },
    "widgets": {
      "application/vnd.jupyter.widget-state+json": {
        "01fbe0cab1144cd3a3946b487da67a76": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "ProgressStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "ProgressStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "bar_color": null,
            "description_width": ""
          }
        },
        "04ed3be3e4ee4a8b8169e46e1680d149": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HBoxModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HBoxModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HBoxView",
            "box_style": "",
            "children": [
              "IPY_MODEL_b457bc23a8e64915baf0ba3c2a6b47fd",
              "IPY_MODEL_d9553549b2d345049e107ec6f784f18b",
              "IPY_MODEL_8f3d7ac36d934bf3b5866872410298eb"
            ],
            "layout": "IPY_MODEL_86a29711e44a4cf3b495d5b5889a59e7"
          }
        },
        "0ea01ccede9e4b5c9da043e764b8ff33": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "103c139cbdfe4b3b85e0a9a5514a6f9f": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_4d20a6f8e0444109a59f967c52f54401",
            "placeholder": "​",
            "style": "IPY_MODEL_0ea01ccede9e4b5c9da043e764b8ff33",
            "value": ""
          }
        },
        "13be9d99438d4e91b8fb0935feeb04d6": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "169ffc9494474b17b93ebf8467993673": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "ProgressStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "ProgressStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "bar_color": null,
            "description_width": ""
          }
        },
        "1987475dc3e147c195f7ac285657fa2b": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HBoxModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HBoxModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HBoxView",
            "box_style": "",
            "children": [
              "IPY_MODEL_103c139cbdfe4b3b85e0a9a5514a6f9f",
              "IPY_MODEL_4ce75f7cd5614e43b14f7ce27d7d8808",
              "IPY_MODEL_6974105051a3492585f5e5d8f47a702e"
            ],
            "layout": "IPY_MODEL_b4c3831ca0c841f4b4a9ad718e0f222f"
          }
        },
        "1a3ce30907f7454d84516066700749a3": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "33cbf5dbac8c45c0bb6a9a44028e4ea3": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "35b9c446ca3f44fd93025b18ad6e07cd": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_d18449be12ec4a61acd4b5f22e6f9b75",
            "placeholder": "​",
            "style": "IPY_MODEL_6064004fabc648d0b5b035274d5c3425",
            "value": ""
          }
        },
        "486af1494c654b9b917d5f67a33f8f18": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "FloatProgressModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "FloatProgressModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "ProgressView",
            "bar_style": "success",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_13be9d99438d4e91b8fb0935feeb04d6",
            "max": 28881,
            "min": 0,
            "orientation": "horizontal",
            "style": "IPY_MODEL_169ffc9494474b17b93ebf8467993673",
            "value": 28881
          }
        },
        "4ce75f7cd5614e43b14f7ce27d7d8808": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "FloatProgressModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "FloatProgressModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "ProgressView",
            "bar_style": "success",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_707369e8ef3d4e7c8add8703e90a5f1c",
            "max": 4542,
            "min": 0,
            "orientation": "horizontal",
            "style": "IPY_MODEL_b5e2ab3980f34a9db83e9dfc37234ec5",
            "value": 4542
          }
        },
        "4d20a6f8e0444109a59f967c52f54401": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "5402033b366e4fbbaea81cf8faf8eccf": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "58474f7c3b064736b1792d0dadc0b3fc": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "5f94b05328da4e23adc15f7f6eb4e937": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "6064004fabc648d0b5b035274d5c3425": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "6974105051a3492585f5e5d8f47a702e": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_f95058a5b1624167832c9c339f3a0074",
            "placeholder": "​",
            "style": "IPY_MODEL_1a3ce30907f7454d84516066700749a3",
            "value": " 5120/? [00:00&lt;00:00, 372891.76it/s]"
          }
        },
        "6b657966bd90498dac074b3f8d9ee6d1": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "707369e8ef3d4e7c8add8703e90a5f1c": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "7280424dedbb407e8ac139f9adbf60a8": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HBoxModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HBoxModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HBoxView",
            "box_style": "",
            "children": [
              "IPY_MODEL_97889e1a72d149479b042b4b24cdef3d",
              "IPY_MODEL_486af1494c654b9b917d5f67a33f8f18",
              "IPY_MODEL_75a3d4f67843440491448f273df1392a"
            ],
            "layout": "IPY_MODEL_d10bd232bca94aa686ea6be815cd3948"
          }
        },
        "75a3d4f67843440491448f273df1392a": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_ac99589b5ed04cef8fb0cfd651686525",
            "placeholder": "​",
            "style": "IPY_MODEL_5402033b366e4fbbaea81cf8faf8eccf",
            "value": " 29696/? [00:00&lt;00:00, 1060205.92it/s]"
          }
        },
        "7dbb7fe18d0f4aed8f72eaaea1ee67a8": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "82daabde61c945309fb19be31a7ef7d5": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "ProgressStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "ProgressStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "bar_color": null,
            "description_width": ""
          }
        },
        "86a29711e44a4cf3b495d5b5889a59e7": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "8f3d7ac36d934bf3b5866872410298eb": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_5f94b05328da4e23adc15f7f6eb4e937",
            "placeholder": "​",
            "style": "IPY_MODEL_fbf834b6b8564382b09cfe3b82dfd28c",
            "value": " 9913344/? [00:00&lt;00:00, 71893737.30it/s]"
          }
        },
        "97889e1a72d149479b042b4b24cdef3d": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_ff53d6bf93034731a3f36eedb3bbf6a4",
            "placeholder": "​",
            "style": "IPY_MODEL_6b657966bd90498dac074b3f8d9ee6d1",
            "value": ""
          }
        },
        "9faf373ea16e487a8d7545efbe5ff404": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HBoxModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HBoxModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HBoxView",
            "box_style": "",
            "children": [
              "IPY_MODEL_35b9c446ca3f44fd93025b18ad6e07cd",
              "IPY_MODEL_9fea91ddc0154270a1fc79cd68217766",
              "IPY_MODEL_f88e1a88b4264fac8bb02b17b32a9f47"
            ],
            "layout": "IPY_MODEL_33cbf5dbac8c45c0bb6a9a44028e4ea3"
          }
        },
        "9fea91ddc0154270a1fc79cd68217766": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "FloatProgressModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "FloatProgressModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "ProgressView",
            "bar_style": "success",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_58474f7c3b064736b1792d0dadc0b3fc",
            "max": 1648877,
            "min": 0,
            "orientation": "horizontal",
            "style": "IPY_MODEL_01fbe0cab1144cd3a3946b487da67a76",
            "value": 1648877
          }
        },
        "ac99589b5ed04cef8fb0cfd651686525": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "b239237acd33488ca73c46163688249f": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "b457bc23a8e64915baf0ba3c2a6b47fd": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_d9bad2ff744e486aab9f90d9ae6b309e",
            "placeholder": "​",
            "style": "IPY_MODEL_efefeefc09464cd883d5b10927c6d49b",
            "value": ""
          }
        },
        "b4c3831ca0c841f4b4a9ad718e0f222f": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "b5e2ab3980f34a9db83e9dfc37234ec5": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "ProgressStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "ProgressStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "bar_color": null,
            "description_width": ""
          }
        },
        "d10bd232bca94aa686ea6be815cd3948": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "d18449be12ec4a61acd4b5f22e6f9b75": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "d9553549b2d345049e107ec6f784f18b": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "FloatProgressModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "FloatProgressModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "ProgressView",
            "bar_style": "success",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_7dbb7fe18d0f4aed8f72eaaea1ee67a8",
            "max": 9912422,
            "min": 0,
            "orientation": "horizontal",
            "style": "IPY_MODEL_82daabde61c945309fb19be31a7ef7d5",
            "value": 9912422
          }
        },
        "d9bad2ff744e486aab9f90d9ae6b309e": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "efefeefc09464cd883d5b10927c6d49b": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "f88e1a88b4264fac8bb02b17b32a9f47": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_fb0390b8a3384a68be7b0dc5a35093f3",
            "placeholder": "​",
            "style": "IPY_MODEL_b239237acd33488ca73c46163688249f",
            "value": " 1649664/? [00:00&lt;00:00, 33020866.25it/s]"
          }
        },
        "f95058a5b1624167832c9c339f3a0074": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "fb0390b8a3384a68be7b0dc5a35093f3": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "fbf834b6b8564382b09cfe3b82dfd28c": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "ff53d6bf93034731a3f36eedb3bbf6a4": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        }
      }
    }
  },
  "nbformat": 4,
  "nbformat_minor": 0
}
