{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {
    "collapsed": true,
    "jupyter": {
     "outputs_hidden": true
    },
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Collecting torch\n",
      "  Downloading torch-2.4.1-cp310-cp310-manylinux1_x86_64.whl.metadata (26 kB)\n",
      "Collecting torchvision\n",
      "  Downloading torchvision-0.19.1-cp310-cp310-manylinux1_x86_64.whl.metadata (6.0 kB)\n",
      "Collecting torchaudio\n",
      "  Downloading torchaudio-2.4.1-cp310-cp310-manylinux1_x86_64.whl.metadata (6.4 kB)\n",
      "Requirement already satisfied: filelock in /home/ec2-user/anaconda3/envs/python3/lib/python3.10/site-packages (from torch) (3.15.4)\n",
      "Requirement already satisfied: typing-extensions>=4.8.0 in /home/ec2-user/anaconda3/envs/python3/lib/python3.10/site-packages (from torch) (4.12.2)\n",
      "Requirement already satisfied: sympy in /home/ec2-user/anaconda3/envs/python3/lib/python3.10/site-packages (from torch) (1.13.0)\n",
      "Requirement already satisfied: networkx in /home/ec2-user/anaconda3/envs/python3/lib/python3.10/site-packages (from torch) (3.3)\n",
      "Requirement already satisfied: jinja2 in /home/ec2-user/anaconda3/envs/python3/lib/python3.10/site-packages (from torch) (3.1.4)\n",
      "Requirement already satisfied: fsspec in /home/ec2-user/anaconda3/envs/python3/lib/python3.10/site-packages (from torch) (2024.6.1)\n",
      "Collecting nvidia-cuda-nvrtc-cu12==12.1.105 (from torch)\n",
      "  Downloading nvidia_cuda_nvrtc_cu12-12.1.105-py3-none-manylinux1_x86_64.whl.metadata (1.5 kB)\n",
      "Collecting nvidia-cuda-runtime-cu12==12.1.105 (from torch)\n",
      "  Downloading nvidia_cuda_runtime_cu12-12.1.105-py3-none-manylinux1_x86_64.whl.metadata (1.5 kB)\n",
      "Collecting nvidia-cuda-cupti-cu12==12.1.105 (from torch)\n",
      "  Downloading nvidia_cuda_cupti_cu12-12.1.105-py3-none-manylinux1_x86_64.whl.metadata (1.6 kB)\n",
      "Collecting nvidia-cudnn-cu12==9.1.0.70 (from torch)\n",
      "  Downloading nvidia_cudnn_cu12-9.1.0.70-py3-none-manylinux2014_x86_64.whl.metadata (1.6 kB)\n",
      "Collecting nvidia-cublas-cu12==12.1.3.1 (from torch)\n",
      "  Downloading nvidia_cublas_cu12-12.1.3.1-py3-none-manylinux1_x86_64.whl.metadata (1.5 kB)\n",
      "Collecting nvidia-cufft-cu12==11.0.2.54 (from torch)\n",
      "  Downloading nvidia_cufft_cu12-11.0.2.54-py3-none-manylinux1_x86_64.whl.metadata (1.5 kB)\n",
      "Collecting nvidia-curand-cu12==10.3.2.106 (from torch)\n",
      "  Downloading nvidia_curand_cu12-10.3.2.106-py3-none-manylinux1_x86_64.whl.metadata (1.5 kB)\n",
      "Collecting nvidia-cusolver-cu12==11.4.5.107 (from torch)\n",
      "  Downloading nvidia_cusolver_cu12-11.4.5.107-py3-none-manylinux1_x86_64.whl.metadata (1.6 kB)\n",
      "Collecting nvidia-cusparse-cu12==12.1.0.106 (from torch)\n",
      "  Downloading nvidia_cusparse_cu12-12.1.0.106-py3-none-manylinux1_x86_64.whl.metadata (1.6 kB)\n",
      "Collecting nvidia-nccl-cu12==2.20.5 (from torch)\n",
      "  Downloading nvidia_nccl_cu12-2.20.5-py3-none-manylinux2014_x86_64.whl.metadata (1.8 kB)\n",
      "Collecting nvidia-nvtx-cu12==12.1.105 (from torch)\n",
      "  Downloading nvidia_nvtx_cu12-12.1.105-py3-none-manylinux1_x86_64.whl.metadata (1.7 kB)\n",
      "Collecting triton==3.0.0 (from torch)\n",
      "  Downloading triton-3.0.0-1-cp310-cp310-manylinux2014_x86_64.manylinux_2_17_x86_64.whl.metadata (1.3 kB)\n",
      "Collecting nvidia-nvjitlink-cu12 (from nvidia-cusolver-cu12==11.4.5.107->torch)\n",
      "  Downloading nvidia_nvjitlink_cu12-12.6.68-py3-none-manylinux2014_x86_64.whl.metadata (1.5 kB)\n",
      "Requirement already satisfied: numpy in /home/ec2-user/anaconda3/envs/python3/lib/python3.10/site-packages (from torchvision) (1.22.4)\n",
      "Requirement already satisfied: pillow!=8.3.*,>=5.3.0 in /home/ec2-user/anaconda3/envs/python3/lib/python3.10/site-packages (from torchvision) (10.4.0)\n",
      "Requirement already satisfied: MarkupSafe>=2.0 in /home/ec2-user/anaconda3/envs/python3/lib/python3.10/site-packages (from jinja2->torch) (2.1.5)\n",
      "Requirement already satisfied: mpmath<1.4,>=1.1.0 in /home/ec2-user/anaconda3/envs/python3/lib/python3.10/site-packages (from sympy->torch) (1.3.0)\n",
      "Downloading torch-2.4.1-cp310-cp310-manylinux1_x86_64.whl (797.1 MB)\n",
      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m797.1/797.1 MB\u001b[0m \u001b[31m1.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m:00:01\u001b[0m00:01\u001b[0m\n",
      "\u001b[?25hDownloading nvidia_cublas_cu12-12.1.3.1-py3-none-manylinux1_x86_64.whl (410.6 MB)\n",
      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m410.6/410.6 MB\u001b[0m \u001b[31m2.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m:00:01\u001b[0m00:01\u001b[0m\n",
      "\u001b[?25hDownloading nvidia_cuda_cupti_cu12-12.1.105-py3-none-manylinux1_x86_64.whl (14.1 MB)\n",
      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m14.1/14.1 MB\u001b[0m \u001b[31m40.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m:00:01\u001b[0m0:01\u001b[0m\n",
      "\u001b[?25hDownloading nvidia_cuda_nvrtc_cu12-12.1.105-py3-none-manylinux1_x86_64.whl (23.7 MB)\n",
      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m23.7/23.7 MB\u001b[0m \u001b[31m27.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m:00:01\u001b[0m00:01\u001b[0m\n",
      "\u001b[?25hDownloading nvidia_cuda_runtime_cu12-12.1.105-py3-none-manylinux1_x86_64.whl (823 kB)\n",
      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m823.6/823.6 kB\u001b[0m \u001b[31m17.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m\n",
      "\u001b[?25hDownloading nvidia_cudnn_cu12-9.1.0.70-py3-none-manylinux2014_x86_64.whl (664.8 MB)\n",
      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m664.8/664.8 MB\u001b[0m \u001b[31m1.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m:00:01\u001b[0m00:01\u001b[0m\n",
      "\u001b[?25hDownloading nvidia_cufft_cu12-11.0.2.54-py3-none-manylinux1_x86_64.whl (121.6 MB)\n",
      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m121.6/121.6 MB\u001b[0m \u001b[31m15.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
      "\u001b[?25hDownloading nvidia_curand_cu12-10.3.2.106-py3-none-manylinux1_x86_64.whl (56.5 MB)\n",
      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m56.5/56.5 MB\u001b[0m \u001b[31m24.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
      "\u001b[?25hDownloading nvidia_cusolver_cu12-11.4.5.107-py3-none-manylinux1_x86_64.whl (124.2 MB)\n",
      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m124.2/124.2 MB\u001b[0m \u001b[31m4.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m:00:01\u001b[0m00:01\u001b[0m\n",
      "\u001b[?25hDownloading nvidia_cusparse_cu12-12.1.0.106-py3-none-manylinux1_x86_64.whl (196.0 MB)\n",
      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m196.0/196.0 MB\u001b[0m \u001b[31m2.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m:00:01\u001b[0m00:01\u001b[0m\n",
      "\u001b[?25hDownloading nvidia_nccl_cu12-2.20.5-py3-none-manylinux2014_x86_64.whl (176.2 MB)\n",
      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m176.2/176.2 MB\u001b[0m \u001b[31m3.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m:00:01\u001b[0m00:01\u001b[0m\n",
      "\u001b[?25hDownloading nvidia_nvtx_cu12-12.1.105-py3-none-manylinux1_x86_64.whl (99 kB)\n",
      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m99.1/99.1 kB\u001b[0m \u001b[31m19.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
      "\u001b[?25hDownloading triton-3.0.0-1-cp310-cp310-manylinux2014_x86_64.manylinux_2_17_x86_64.whl (209.4 MB)\n",
      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m209.4/209.4 MB\u001b[0m \u001b[31m2.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m:00:01\u001b[0m00:01\u001b[0m\n",
      "\u001b[?25hDownloading torchvision-0.19.1-cp310-cp310-manylinux1_x86_64.whl (7.0 MB)\n",
      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m7.0/7.0 MB\u001b[0m \u001b[31m31.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
      "\u001b[?25hDownloading torchaudio-2.4.1-cp310-cp310-manylinux1_x86_64.whl (3.4 MB)\n",
      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m3.4/3.4 MB\u001b[0m \u001b[31m30.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
      "\u001b[?25hDownloading nvidia_nvjitlink_cu12-12.6.68-py3-none-manylinux2014_x86_64.whl (19.7 MB)\n",
      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m19.7/19.7 MB\u001b[0m \u001b[31m32.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
      "\u001b[?25hInstalling collected packages: triton, nvidia-nvtx-cu12, nvidia-nvjitlink-cu12, nvidia-nccl-cu12, nvidia-curand-cu12, nvidia-cufft-cu12, nvidia-cuda-runtime-cu12, nvidia-cuda-nvrtc-cu12, nvidia-cuda-cupti-cu12, nvidia-cublas-cu12, nvidia-cusparse-cu12, nvidia-cudnn-cu12, nvidia-cusolver-cu12, torch, torchvision, torchaudio\n",
      "Successfully installed nvidia-cublas-cu12-12.1.3.1 nvidia-cuda-cupti-cu12-12.1.105 nvidia-cuda-nvrtc-cu12-12.1.105 nvidia-cuda-runtime-cu12-12.1.105 nvidia-cudnn-cu12-9.1.0.70 nvidia-cufft-cu12-11.0.2.54 nvidia-curand-cu12-10.3.2.106 nvidia-cusolver-cu12-11.4.5.107 nvidia-cusparse-cu12-12.1.0.106 nvidia-nccl-cu12-2.20.5 nvidia-nvjitlink-cu12-12.6.68 nvidia-nvtx-cu12-12.1.105 torch-2.4.1 torchaudio-2.4.1 torchvision-0.19.1 triton-3.0.0\n",
      "fatal: destination path 'apex' already exists and is not an empty directory.\n",
      "/home/ec2-user/SageMaker/FAST_CIFAR10/apex\n",
      "Found existing installation: packaging 21.3\n",
      "Uninstalling packaging-21.3:\n",
      "  Successfully uninstalled packaging-21.3\n",
      "Collecting packaging\n",
      "  Using cached packaging-24.1-py3-none-any.whl.metadata (3.2 kB)\n",
      "Using cached packaging-24.1-py3-none-any.whl (53 kB)\n",
      "Installing collected packages: packaging\n",
      "\u001b[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. This behaviour is the source of the following dependency conflicts.\n",
      "astropy 6.1.0 requires numpy>=1.23, but you have numpy 1.22.4 which is incompatible.\n",
      "scikit-image 0.24.0 requires numpy>=1.23, but you have numpy 1.22.4 which is incompatible.\n",
      "sparkmagic 0.21.0 requires pandas<2.0.0,>=0.17.1, but you have pandas 2.2.2 which is incompatible.\n",
      "sphinx 8.0.2 requires docutils<0.22,>=0.20, but you have docutils 0.16 which is incompatible.\u001b[0m\u001b[31m\n",
      "\u001b[0mSuccessfully installed packaging-24.1\n",
      "Using pip 23.3.2 from /home/ec2-user/anaconda3/envs/python3/lib/python3.10/site-packages/pip (python 3.10)\n",
      "\u001b[33mDEPRECATION: --build-option and --global-option are deprecated. pip 24.0 will enforce this behaviour change. A possible replacement is to use --config-settings. Discussion can be found at https://github.com/pypa/pip/issues/11859\u001b[0m\u001b[33m\n",
      "\u001b[0m\u001b[33mWARNING: Implying --no-binary=:all: due to the presence of --build-option / --global-option.\u001b[0m\u001b[33m\n",
      "\u001b[0mProcessing /home/ec2-user/SageMaker/FAST_CIFAR10/apex\n",
      "  Running command Preparing metadata (pyproject.toml)\n",
      "\n",
      "\n",
      "  torch.__version__  = 2.4.1+cu121\n",
      "\n",
      "\n",
      "  running dist_info\n",
      "  creating /tmp/pip-modern-metadata-zncr1nej/apex.egg-info\n",
      "  writing /tmp/pip-modern-metadata-zncr1nej/apex.egg-info/PKG-INFO\n",
      "  writing dependency_links to /tmp/pip-modern-metadata-zncr1nej/apex.egg-info/dependency_links.txt\n",
      "  writing requirements to /tmp/pip-modern-metadata-zncr1nej/apex.egg-info/requires.txt\n",
      "  writing top-level names to /tmp/pip-modern-metadata-zncr1nej/apex.egg-info/top_level.txt\n",
      "  writing manifest file '/tmp/pip-modern-metadata-zncr1nej/apex.egg-info/SOURCES.txt'\n",
      "  reading manifest file '/tmp/pip-modern-metadata-zncr1nej/apex.egg-info/SOURCES.txt'\n",
      "  adding license file 'LICENSE'\n",
      "  writing manifest file '/tmp/pip-modern-metadata-zncr1nej/apex.egg-info/SOURCES.txt'\n",
      "  creating '/tmp/pip-modern-metadata-zncr1nej/apex-0.1.dist-info'\n",
      "  Preparing metadata (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n",
      "Requirement already satisfied: packaging>20.6 in /home/ec2-user/anaconda3/envs/python3/lib/python3.10/site-packages (from apex==0.1) (24.1)\n",
      "Building wheels for collected packages: apex\n",
      "\u001b[33m  WARNING: Ignoring --global-option when building apex using PEP 517\u001b[0m\u001b[33m\n",
      "\u001b[0m  Running command Building wheel for apex (pyproject.toml)\n",
      "\n",
      "\n",
      "  torch.__version__  = 2.4.1+cu121\n",
      "\n",
      "\n",
      "  running bdist_wheel\n",
      "  running build\n",
      "  running build_py\n",
      "  copying apex/_autocast_utils.py -> build/lib/apex\n",
      "  copying apex/__init__.py -> build/lib/apex\n",
      "  copying apex/transformer/enums.py -> build/lib/apex/transformer\n",
      "  copying apex/transformer/_ucc_util.py -> build/lib/apex/transformer\n",
      "  copying apex/transformer/microbatches.py -> build/lib/apex/transformer\n",
      "  copying apex/transformer/utils.py -> build/lib/apex/transformer\n",
      "  copying apex/transformer/log_util.py -> build/lib/apex/transformer\n",
      "  copying apex/transformer/parallel_state.py -> build/lib/apex/transformer\n",
      "  copying apex/transformer/__init__.py -> build/lib/apex/transformer\n",
      "  copying apex/RNN/cells.py -> build/lib/apex/RNN\n",
      "  copying apex/RNN/models.py -> build/lib/apex/RNN\n",
      "  copying apex/RNN/__init__.py -> build/lib/apex/RNN\n",
      "  copying apex/RNN/RNNBackend.py -> build/lib/apex/RNN\n",
      "  copying apex/fp16_utils/fp16_optimizer.py -> build/lib/apex/fp16_utils\n",
      "  copying apex/fp16_utils/loss_scaler.py -> build/lib/apex/fp16_utils\n",
      "  copying apex/fp16_utils/__init__.py -> build/lib/apex/fp16_utils\n",
      "  copying apex/fp16_utils/fp16util.py -> build/lib/apex/fp16_utils\n",
      "  copying apex/mlp/mlp.py -> build/lib/apex/mlp\n",
      "  copying apex/mlp/__init__.py -> build/lib/apex/mlp\n",
      "  copying apex/fused_dense/fused_dense.py -> build/lib/apex/fused_dense\n",
      "  copying apex/fused_dense/__init__.py -> build/lib/apex/fused_dense\n",
      "  copying apex/parallel/LARC.py -> build/lib/apex/parallel\n",
      "  copying apex/parallel/multiproc.py -> build/lib/apex/parallel\n",
      "  copying apex/parallel/sync_batchnorm.py -> build/lib/apex/parallel\n",
      "  copying apex/parallel/optimized_sync_batchnorm.py -> build/lib/apex/parallel\n",
      "  copying apex/parallel/optimized_sync_batchnorm_kernel.py -> build/lib/apex/parallel\n",
      "  copying apex/parallel/distributed.py -> build/lib/apex/parallel\n",
      "  copying apex/parallel/__init__.py -> build/lib/apex/parallel\n",
      "  copying apex/parallel/sync_batchnorm_kernel.py -> build/lib/apex/parallel\n",
      "  copying apex/amp/scaler.py -> build/lib/apex/amp\n",
      "  copying apex/amp/__version__.py -> build/lib/apex/amp\n",
      "  copying apex/amp/handle.py -> build/lib/apex/amp\n",
      "  copying apex/amp/opt.py -> build/lib/apex/amp\n",
      "  copying apex/amp/compat.py -> build/lib/apex/amp\n",
      "  copying apex/amp/_process_optimizer.py -> build/lib/apex/amp\n",
      "  copying apex/amp/wrap.py -> build/lib/apex/amp\n",
      "  copying apex/amp/utils.py -> build/lib/apex/amp\n",
      "  copying apex/amp/_initialize.py -> build/lib/apex/amp\n",
      "  copying apex/amp/__init__.py -> build/lib/apex/amp\n",
      "  copying apex/amp/frontend.py -> build/lib/apex/amp\n",
      "  copying apex/amp/_amp_state.py -> build/lib/apex/amp\n",
      "  copying apex/amp/amp.py -> build/lib/apex/amp\n",
      "  copying apex/amp/rnn_compat.py -> build/lib/apex/amp\n",
      "  copying apex/contrib/__init__.py -> build/lib/apex/contrib\n",
      "  copying apex/optimizers/fused_novograd.py -> build/lib/apex/optimizers\n",
      "  copying apex/optimizers/fused_lamb.py -> build/lib/apex/optimizers\n",
      "  copying apex/optimizers/fused_adam.py -> build/lib/apex/optimizers\n",
      "  copying apex/optimizers/fused_adagrad.py -> build/lib/apex/optimizers\n",
      "  copying apex/optimizers/fused_mixed_precision_lamb.py -> build/lib/apex/optimizers\n",
      "  copying apex/optimizers/fused_sgd.py -> build/lib/apex/optimizers\n",
      "  copying apex/optimizers/__init__.py -> build/lib/apex/optimizers\n",
      "  copying apex/multi_tensor_apply/multi_tensor_apply.py -> build/lib/apex/multi_tensor_apply\n",
      "  copying apex/multi_tensor_apply/__init__.py -> build/lib/apex/multi_tensor_apply\n",
      "  copying apex/normalization/fused_layer_norm.py -> build/lib/apex/normalization\n",
      "  copying apex/normalization/__init__.py -> build/lib/apex/normalization\n",
      "  copying apex/transformer/tensor_parallel/layers.py -> build/lib/apex/transformer/tensor_parallel\n",
      "  copying apex/transformer/tensor_parallel/memory.py -> build/lib/apex/transformer/tensor_parallel\n",
      "  copying apex/transformer/tensor_parallel/random.py -> build/lib/apex/transformer/tensor_parallel\n",
      "  copying apex/transformer/tensor_parallel/cross_entropy.py -> build/lib/apex/transformer/tensor_parallel\n",
      "  copying apex/transformer/tensor_parallel/utils.py -> build/lib/apex/transformer/tensor_parallel\n",
      "  copying apex/transformer/tensor_parallel/__init__.py -> build/lib/apex/transformer/tensor_parallel\n",
      "  copying apex/transformer/tensor_parallel/mappings.py -> build/lib/apex/transformer/tensor_parallel\n",
      "  copying apex/transformer/tensor_parallel/data.py -> build/lib/apex/transformer/tensor_parallel\n",
      "  copying apex/transformer/layers/layer_norm.py -> build/lib/apex/transformer/layers\n",
      "  copying apex/transformer/layers/__init__.py -> build/lib/apex/transformer/layers\n",
      "  copying apex/transformer/_data/_batchsampler.py -> build/lib/apex/transformer/_data\n",
      "  copying apex/transformer/_data/__init__.py -> build/lib/apex/transformer/_data\n",
      "  copying apex/transformer/pipeline_parallel/_timers.py -> build/lib/apex/transformer/pipeline_parallel\n",
      "  copying apex/transformer/pipeline_parallel/utils.py -> build/lib/apex/transformer/pipeline_parallel\n",
      "  copying apex/transformer/pipeline_parallel/__init__.py -> build/lib/apex/transformer/pipeline_parallel\n",
      "  copying apex/transformer/pipeline_parallel/p2p_communication.py -> build/lib/apex/transformer/pipeline_parallel\n",
      "  copying apex/transformer/testing/global_vars.py -> build/lib/apex/transformer/testing\n",
      "  copying apex/transformer/testing/distributed_test_base.py -> build/lib/apex/transformer/testing\n",
      "  copying apex/transformer/testing/arguments.py -> build/lib/apex/transformer/testing\n",
      "  copying apex/transformer/testing/standalone_gpt.py -> build/lib/apex/transformer/testing\n",
      "  copying apex/transformer/testing/standalone_transformer_lm.py -> build/lib/apex/transformer/testing\n",
      "  copying apex/transformer/testing/commons.py -> build/lib/apex/transformer/testing\n",
      "  copying apex/transformer/testing/__init__.py -> build/lib/apex/transformer/testing\n",
      "  copying apex/transformer/testing/standalone_bert.py -> build/lib/apex/transformer/testing\n",
      "  copying apex/transformer/amp/grad_scaler.py -> build/lib/apex/transformer/amp\n",
      "  copying apex/transformer/amp/__init__.py -> build/lib/apex/transformer/amp\n",
      "  copying apex/transformer/functional/fused_softmax.py -> build/lib/apex/transformer/functional\n",
      "  copying apex/transformer/functional/fused_rope.py -> build/lib/apex/transformer/functional\n",
      "  copying apex/transformer/functional/__init__.py -> build/lib/apex/transformer/functional\n",
      "  copying apex/transformer/pipeline_parallel/schedules/fwd_bwd_no_pipelining.py -> build/lib/apex/transformer/pipeline_parallel/schedules\n",
      "  copying apex/transformer/pipeline_parallel/schedules/fwd_bwd_pipelining_with_interleaving.py -> build/lib/apex/transformer/pipeline_parallel/schedules\n",
      "  copying apex/transformer/pipeline_parallel/schedules/fwd_bwd_pipelining_without_interleaving.py -> build/lib/apex/transformer/pipeline_parallel/schedules\n",
      "  copying apex/transformer/pipeline_parallel/schedules/__init__.py -> build/lib/apex/transformer/pipeline_parallel/schedules\n",
      "  copying apex/transformer/pipeline_parallel/schedules/common.py -> build/lib/apex/transformer/pipeline_parallel/schedules\n",
      "  copying apex/amp/lists/tensor_overrides.py -> build/lib/apex/amp/lists\n",
      "  copying apex/amp/lists/functional_overrides.py -> build/lib/apex/amp/lists\n",
      "  copying apex/amp/lists/__init__.py -> build/lib/apex/amp/lists\n",
      "  copying apex/amp/lists/torch_overrides.py -> build/lib/apex/amp/lists\n",
      "  copying apex/contrib/gpu_direct_storage/__init__.py -> build/lib/apex/contrib/gpu_direct_storage\n",
      "  copying apex/contrib/index_mul_2d/__init__.py -> build/lib/apex/contrib/index_mul_2d\n",
      "  copying apex/contrib/index_mul_2d/index_mul_2d.py -> build/lib/apex/contrib/index_mul_2d\n",
      "  copying apex/contrib/conv_bias_relu/conv_bias_relu.py -> build/lib/apex/contrib/conv_bias_relu\n",
      "  copying apex/contrib/conv_bias_relu/__init__.py -> build/lib/apex/contrib/conv_bias_relu\n",
      "  copying apex/contrib/clip_grad/__init__.py -> build/lib/apex/contrib/clip_grad\n",
      "  copying apex/contrib/clip_grad/clip_grad.py -> build/lib/apex/contrib/clip_grad\n",
      "  copying apex/contrib/groupbn/batch_norm.py -> build/lib/apex/contrib/groupbn\n",
      "  copying apex/contrib/groupbn/__init__.py -> build/lib/apex/contrib/groupbn\n",
      "  copying apex/contrib/group_norm/group_norm.py -> build/lib/apex/contrib/group_norm\n",
      "  copying apex/contrib/group_norm/__init__.py -> build/lib/apex/contrib/group_norm\n",
      "  copying apex/contrib/fmha/__init__.py -> build/lib/apex/contrib/fmha\n",
      "  copying apex/contrib/fmha/fmha.py -> build/lib/apex/contrib/fmha\n",
      "  copying apex/contrib/openfold_triton/layer_norm.py -> build/lib/apex/contrib/openfold_triton\n",
      "  copying apex/contrib/openfold_triton/mha.py -> build/lib/apex/contrib/openfold_triton\n",
      "  copying apex/contrib/openfold_triton/_layer_norm_config_hopper.py -> build/lib/apex/contrib/openfold_triton\n",
      "  copying apex/contrib/openfold_triton/_layer_norm_config_ampere.py -> build/lib/apex/contrib/openfold_triton\n",
      "  copying apex/contrib/openfold_triton/fused_adam_swa.py -> build/lib/apex/contrib/openfold_triton\n",
      "  copying apex/contrib/openfold_triton/_layer_norm_forward_kernels.py -> build/lib/apex/contrib/openfold_triton\n",
      "  copying apex/contrib/openfold_triton/_layer_norm_backward_kernels.py -> build/lib/apex/contrib/openfold_triton\n",
      "  copying apex/contrib/openfold_triton/__init__.py -> build/lib/apex/contrib/openfold_triton\n",
      "  copying apex/contrib/openfold_triton/_mha_kernel.py -> build/lib/apex/contrib/openfold_triton\n",
      "  copying apex/contrib/multihead_attn/encdec_multihead_attn.py -> build/lib/apex/contrib/multihead_attn\n",
      "  copying apex/contrib/multihead_attn/mask_softmax_dropout_func.py -> build/lib/apex/contrib/multihead_attn\n",
      "  copying apex/contrib/multihead_attn/self_multihead_attn.py -> build/lib/apex/contrib/multihead_attn\n",
      "  copying apex/contrib/multihead_attn/fast_encdec_multihead_attn_func.py -> build/lib/apex/contrib/multihead_attn\n",
      "  copying apex/contrib/multihead_attn/fast_encdec_multihead_attn_norm_add_func.py -> build/lib/apex/contrib/multihead_attn\n",
      "  copying apex/contrib/multihead_attn/fast_self_multihead_attn_func.py -> build/lib/apex/contrib/multihead_attn\n",
      "  copying apex/contrib/multihead_attn/encdec_multihead_attn_func.py -> build/lib/apex/contrib/multihead_attn\n",
      "  copying apex/contrib/multihead_attn/self_multihead_attn_func.py -> build/lib/apex/contrib/multihead_attn\n",
      "  copying apex/contrib/multihead_attn/__init__.py -> build/lib/apex/contrib/multihead_attn\n",
      "  copying apex/contrib/multihead_attn/fast_self_multihead_attn_norm_add_func.py -> build/lib/apex/contrib/multihead_attn\n",
      "  copying apex/contrib/layer_norm/layer_norm.py -> build/lib/apex/contrib/layer_norm\n",
      "  copying apex/contrib/layer_norm/__init__.py -> build/lib/apex/contrib/layer_norm\n",
      "  copying apex/contrib/nccl_allocator/nccl_allocator.py -> build/lib/apex/contrib/nccl_allocator\n",
      "  copying apex/contrib/nccl_allocator/__init__.py -> build/lib/apex/contrib/nccl_allocator\n",
      "  copying apex/contrib/bottleneck/bottleneck.py -> build/lib/apex/contrib/bottleneck\n",
      "  copying apex/contrib/bottleneck/test.py -> build/lib/apex/contrib/bottleneck\n",
      "  copying apex/contrib/bottleneck/halo_exchangers.py -> build/lib/apex/contrib/bottleneck\n",
      "  copying apex/contrib/bottleneck/__init__.py -> build/lib/apex/contrib/bottleneck\n",
      "  copying apex/contrib/cudnn_gbn/batch_norm.py -> build/lib/apex/contrib/cudnn_gbn\n",
      "  copying apex/contrib/cudnn_gbn/__init__.py -> build/lib/apex/contrib/cudnn_gbn\n",
      "  copying apex/contrib/peer_memory/peer_halo_exchanger_1d.py -> build/lib/apex/contrib/peer_memory\n",
      "  copying apex/contrib/peer_memory/peer_memory.py -> build/lib/apex/contrib/peer_memory\n",
      "  copying apex/contrib/peer_memory/__init__.py -> build/lib/apex/contrib/peer_memory\n",
      "  copying apex/contrib/focal_loss/focal_loss.py -> build/lib/apex/contrib/focal_loss\n",
      "  copying apex/contrib/focal_loss/__init__.py -> build/lib/apex/contrib/focal_loss\n",
      "  copying apex/contrib/sparsity/permutation_lib.py -> build/lib/apex/contrib/sparsity\n",
      "  copying apex/contrib/sparsity/asp.py -> build/lib/apex/contrib/sparsity\n",
      "  copying apex/contrib/sparsity/sparse_masklib.py -> build/lib/apex/contrib/sparsity\n",
      "  copying apex/contrib/sparsity/__init__.py -> build/lib/apex/contrib/sparsity\n",
      "  copying apex/contrib/test/__init__.py -> build/lib/apex/contrib/test\n",
      "  copying apex/contrib/optimizers/fused_lamb.py -> build/lib/apex/contrib/optimizers\n",
      "  copying apex/contrib/optimizers/fused_adam.py -> build/lib/apex/contrib/optimizers\n",
      "  copying apex/contrib/optimizers/fp16_optimizer.py -> build/lib/apex/contrib/optimizers\n",
      "  copying apex/contrib/optimizers/distributed_fused_adam.py -> build/lib/apex/contrib/optimizers\n",
      "  copying apex/contrib/optimizers/distributed_fused_lamb.py -> build/lib/apex/contrib/optimizers\n",
      "  copying apex/contrib/optimizers/fused_sgd.py -> build/lib/apex/contrib/optimizers\n",
      "  copying apex/contrib/optimizers/__init__.py -> build/lib/apex/contrib/optimizers\n",
      "  copying apex/contrib/xentropy/softmax_xentropy.py -> build/lib/apex/contrib/xentropy\n",
      "  copying apex/contrib/xentropy/__init__.py -> build/lib/apex/contrib/xentropy\n",
      "  copying apex/contrib/transducer/_transducer_ref.py -> build/lib/apex/contrib/transducer\n",
      "  copying apex/contrib/transducer/__init__.py -> build/lib/apex/contrib/transducer\n",
      "  copying apex/contrib/transducer/transducer.py -> build/lib/apex/contrib/transducer\n",
      "  copying apex/contrib/sparsity/permutation_search_kernels/exhaustive_search.py -> build/lib/apex/contrib/sparsity/permutation_search_kernels\n",
      "  copying apex/contrib/sparsity/permutation_search_kernels/permutation_utilities.py -> build/lib/apex/contrib/sparsity/permutation_search_kernels\n",
      "  copying apex/contrib/sparsity/permutation_search_kernels/call_permutation_search_kernels.py -> build/lib/apex/contrib/sparsity/permutation_search_kernels\n",
      "  copying apex/contrib/sparsity/permutation_search_kernels/channel_swap.py -> build/lib/apex/contrib/sparsity/permutation_search_kernels\n",
      "  copying apex/contrib/sparsity/permutation_search_kernels/__init__.py -> build/lib/apex/contrib/sparsity/permutation_search_kernels\n",
      "  copying apex/contrib/test/index_mul_2d/test_index_mul_2d.py -> build/lib/apex/contrib/test/index_mul_2d\n",
      "  copying apex/contrib/test/index_mul_2d/__init__.py -> build/lib/apex/contrib/test/index_mul_2d\n",
      "  copying apex/contrib/test/conv_bias_relu/test_conv_bias_relu.py -> build/lib/apex/contrib/test/conv_bias_relu\n",
      "  copying apex/contrib/test/conv_bias_relu/__init__.py -> build/lib/apex/contrib/test/conv_bias_relu\n",
      "  copying apex/contrib/test/clip_grad/test_clip_grad.py -> build/lib/apex/contrib/test/clip_grad\n",
      "  copying apex/contrib/test/clip_grad/__init__.py -> build/lib/apex/contrib/test/clip_grad\n",
      "  copying apex/contrib/test/group_norm/test_group_norm.py -> build/lib/apex/contrib/test/group_norm\n",
      "  copying apex/contrib/test/group_norm/__init__.py -> build/lib/apex/contrib/test/group_norm\n",
      "  copying apex/contrib/test/fmha/test_fmha.py -> build/lib/apex/contrib/test/fmha\n",
      "  copying apex/contrib/test/fmha/__init__.py -> build/lib/apex/contrib/test/fmha\n",
      "  copying apex/contrib/test/multihead_attn/test_encdec_multihead_attn.py -> build/lib/apex/contrib/test/multihead_attn\n",
      "  copying apex/contrib/test/multihead_attn/test_self_multihead_attn_norm_add.py -> build/lib/apex/contrib/test/multihead_attn\n",
      "  copying apex/contrib/test/multihead_attn/test_encdec_multihead_attn_norm_add.py -> build/lib/apex/contrib/test/multihead_attn\n",
      "  copying apex/contrib/test/multihead_attn/test_fast_self_multihead_attn_bias.py -> build/lib/apex/contrib/test/multihead_attn\n",
      "  copying apex/contrib/test/multihead_attn/test_self_multihead_attn.py -> build/lib/apex/contrib/test/multihead_attn\n",
      "  copying apex/contrib/test/multihead_attn/test_mha_fused_softmax.py -> build/lib/apex/contrib/test/multihead_attn\n",
      "  copying apex/contrib/test/multihead_attn/__init__.py -> build/lib/apex/contrib/test/multihead_attn\n",
      "  copying apex/contrib/test/layer_norm/test_fast_layer_norm.py -> build/lib/apex/contrib/test/layer_norm\n",
      "  copying apex/contrib/test/layer_norm/__init__.py -> build/lib/apex/contrib/test/layer_norm\n",
      "  copying apex/contrib/test/bottleneck/test_bottleneck_module.py -> build/lib/apex/contrib/test/bottleneck\n",
      "  copying apex/contrib/test/bottleneck/__init__.py -> build/lib/apex/contrib/test/bottleneck\n",
      "  copying apex/contrib/test/cudnn_gbn/test_cudnn_gbn_with_two_gpus.py -> build/lib/apex/contrib/test/cudnn_gbn\n",
      "  copying apex/contrib/test/cudnn_gbn/__init__.py -> build/lib/apex/contrib/test/cudnn_gbn\n",
      "  copying apex/contrib/test/peer_memory/test_peer_halo_exchange_module.py -> build/lib/apex/contrib/test/peer_memory\n",
      "  copying apex/contrib/test/peer_memory/__init__.py -> build/lib/apex/contrib/test/peer_memory\n",
      "  copying apex/contrib/test/focal_loss/test_focal_loss.py -> build/lib/apex/contrib/test/focal_loss\n",
      "  copying apex/contrib/test/focal_loss/__init__.py -> build/lib/apex/contrib/test/focal_loss\n",
      "  copying apex/contrib/test/optimizers/test_dist_adam.py -> build/lib/apex/contrib/test/optimizers\n",
      "  copying apex/contrib/test/optimizers/test_distributed_fused_lamb.py -> build/lib/apex/contrib/test/optimizers\n",
      "  copying apex/contrib/test/optimizers/__init__.py -> build/lib/apex/contrib/test/optimizers\n",
      "  copying apex/contrib/test/xentropy/test_label_smoothing.py -> build/lib/apex/contrib/test/xentropy\n",
      "  copying apex/contrib/test/xentropy/__init__.py -> build/lib/apex/contrib/test/xentropy\n",
      "  copying apex/contrib/test/transducer/test_transducer_loss.py -> build/lib/apex/contrib/test/transducer\n",
      "  copying apex/contrib/test/transducer/__init__.py -> build/lib/apex/contrib/test/transducer\n",
      "  copying apex/contrib/test/transducer/test_transducer_joint.py -> build/lib/apex/contrib/test/transducer\n",
      "  installing to build/bdist.linux-x86_64/wheel\n",
      "  running install\n",
      "  running install_lib\n",
      "  creating build/bdist.linux-x86_64/wheel\n",
      "  creating build/bdist.linux-x86_64/wheel/apex\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/transformer\n",
      "  copying build/lib/apex/transformer/enums.py -> build/bdist.linux-x86_64/wheel/apex/transformer\n",
      "  copying build/lib/apex/transformer/_ucc_util.py -> build/bdist.linux-x86_64/wheel/apex/transformer\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/transformer/tensor_parallel\n",
      "  copying build/lib/apex/transformer/tensor_parallel/layers.py -> build/bdist.linux-x86_64/wheel/apex/transformer/tensor_parallel\n",
      "  copying build/lib/apex/transformer/tensor_parallel/memory.py -> build/bdist.linux-x86_64/wheel/apex/transformer/tensor_parallel\n",
      "  copying build/lib/apex/transformer/tensor_parallel/random.py -> build/bdist.linux-x86_64/wheel/apex/transformer/tensor_parallel\n",
      "  copying build/lib/apex/transformer/tensor_parallel/cross_entropy.py -> build/bdist.linux-x86_64/wheel/apex/transformer/tensor_parallel\n",
      "  copying build/lib/apex/transformer/tensor_parallel/utils.py -> build/bdist.linux-x86_64/wheel/apex/transformer/tensor_parallel\n",
      "  copying build/lib/apex/transformer/tensor_parallel/__init__.py -> build/bdist.linux-x86_64/wheel/apex/transformer/tensor_parallel\n",
      "  copying build/lib/apex/transformer/tensor_parallel/mappings.py -> build/bdist.linux-x86_64/wheel/apex/transformer/tensor_parallel\n",
      "  copying build/lib/apex/transformer/tensor_parallel/data.py -> build/bdist.linux-x86_64/wheel/apex/transformer/tensor_parallel\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/transformer/layers\n",
      "  copying build/lib/apex/transformer/layers/layer_norm.py -> build/bdist.linux-x86_64/wheel/apex/transformer/layers\n",
      "  copying build/lib/apex/transformer/layers/__init__.py -> build/bdist.linux-x86_64/wheel/apex/transformer/layers\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/transformer/_data\n",
      "  copying build/lib/apex/transformer/_data/_batchsampler.py -> build/bdist.linux-x86_64/wheel/apex/transformer/_data\n",
      "  copying build/lib/apex/transformer/_data/__init__.py -> build/bdist.linux-x86_64/wheel/apex/transformer/_data\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/transformer/pipeline_parallel\n",
      "  copying build/lib/apex/transformer/pipeline_parallel/_timers.py -> build/bdist.linux-x86_64/wheel/apex/transformer/pipeline_parallel\n",
      "  copying build/lib/apex/transformer/pipeline_parallel/utils.py -> build/bdist.linux-x86_64/wheel/apex/transformer/pipeline_parallel\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/transformer/pipeline_parallel/schedules\n",
      "  copying build/lib/apex/transformer/pipeline_parallel/schedules/fwd_bwd_no_pipelining.py -> build/bdist.linux-x86_64/wheel/apex/transformer/pipeline_parallel/schedules\n",
      "  copying build/lib/apex/transformer/pipeline_parallel/schedules/fwd_bwd_pipelining_with_interleaving.py -> build/bdist.linux-x86_64/wheel/apex/transformer/pipeline_parallel/schedules\n",
      "  copying build/lib/apex/transformer/pipeline_parallel/schedules/fwd_bwd_pipelining_without_interleaving.py -> build/bdist.linux-x86_64/wheel/apex/transformer/pipeline_parallel/schedules\n",
      "  copying build/lib/apex/transformer/pipeline_parallel/schedules/__init__.py -> build/bdist.linux-x86_64/wheel/apex/transformer/pipeline_parallel/schedules\n",
      "  copying build/lib/apex/transformer/pipeline_parallel/schedules/common.py -> build/bdist.linux-x86_64/wheel/apex/transformer/pipeline_parallel/schedules\n",
      "  copying build/lib/apex/transformer/pipeline_parallel/__init__.py -> build/bdist.linux-x86_64/wheel/apex/transformer/pipeline_parallel\n",
      "  copying build/lib/apex/transformer/pipeline_parallel/p2p_communication.py -> build/bdist.linux-x86_64/wheel/apex/transformer/pipeline_parallel\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/transformer/testing\n",
      "  copying build/lib/apex/transformer/testing/global_vars.py -> build/bdist.linux-x86_64/wheel/apex/transformer/testing\n",
      "  copying build/lib/apex/transformer/testing/distributed_test_base.py -> build/bdist.linux-x86_64/wheel/apex/transformer/testing\n",
      "  copying build/lib/apex/transformer/testing/arguments.py -> build/bdist.linux-x86_64/wheel/apex/transformer/testing\n",
      "  copying build/lib/apex/transformer/testing/standalone_gpt.py -> build/bdist.linux-x86_64/wheel/apex/transformer/testing\n",
      "  copying build/lib/apex/transformer/testing/standalone_transformer_lm.py -> build/bdist.linux-x86_64/wheel/apex/transformer/testing\n",
      "  copying build/lib/apex/transformer/testing/commons.py -> build/bdist.linux-x86_64/wheel/apex/transformer/testing\n",
      "  copying build/lib/apex/transformer/testing/__init__.py -> build/bdist.linux-x86_64/wheel/apex/transformer/testing\n",
      "  copying build/lib/apex/transformer/testing/standalone_bert.py -> build/bdist.linux-x86_64/wheel/apex/transformer/testing\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/transformer/amp\n",
      "  copying build/lib/apex/transformer/amp/grad_scaler.py -> build/bdist.linux-x86_64/wheel/apex/transformer/amp\n",
      "  copying build/lib/apex/transformer/amp/__init__.py -> build/bdist.linux-x86_64/wheel/apex/transformer/amp\n",
      "  copying build/lib/apex/transformer/microbatches.py -> build/bdist.linux-x86_64/wheel/apex/transformer\n",
      "  copying build/lib/apex/transformer/utils.py -> build/bdist.linux-x86_64/wheel/apex/transformer\n",
      "  copying build/lib/apex/transformer/log_util.py -> build/bdist.linux-x86_64/wheel/apex/transformer\n",
      "  copying build/lib/apex/transformer/parallel_state.py -> build/bdist.linux-x86_64/wheel/apex/transformer\n",
      "  copying build/lib/apex/transformer/__init__.py -> build/bdist.linux-x86_64/wheel/apex/transformer\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/transformer/functional\n",
      "  copying build/lib/apex/transformer/functional/fused_softmax.py -> build/bdist.linux-x86_64/wheel/apex/transformer/functional\n",
      "  copying build/lib/apex/transformer/functional/fused_rope.py -> build/bdist.linux-x86_64/wheel/apex/transformer/functional\n",
      "  copying build/lib/apex/transformer/functional/__init__.py -> build/bdist.linux-x86_64/wheel/apex/transformer/functional\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/RNN\n",
      "  copying build/lib/apex/RNN/cells.py -> build/bdist.linux-x86_64/wheel/apex/RNN\n",
      "  copying build/lib/apex/RNN/models.py -> build/bdist.linux-x86_64/wheel/apex/RNN\n",
      "  copying build/lib/apex/RNN/__init__.py -> build/bdist.linux-x86_64/wheel/apex/RNN\n",
      "  copying build/lib/apex/RNN/RNNBackend.py -> build/bdist.linux-x86_64/wheel/apex/RNN\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/fp16_utils\n",
      "  copying build/lib/apex/fp16_utils/fp16_optimizer.py -> build/bdist.linux-x86_64/wheel/apex/fp16_utils\n",
      "  copying build/lib/apex/fp16_utils/loss_scaler.py -> build/bdist.linux-x86_64/wheel/apex/fp16_utils\n",
      "  copying build/lib/apex/fp16_utils/__init__.py -> build/bdist.linux-x86_64/wheel/apex/fp16_utils\n",
      "  copying build/lib/apex/fp16_utils/fp16util.py -> build/bdist.linux-x86_64/wheel/apex/fp16_utils\n",
      "  copying build/lib/apex/_autocast_utils.py -> build/bdist.linux-x86_64/wheel/apex\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/mlp\n",
      "  copying build/lib/apex/mlp/mlp.py -> build/bdist.linux-x86_64/wheel/apex/mlp\n",
      "  copying build/lib/apex/mlp/__init__.py -> build/bdist.linux-x86_64/wheel/apex/mlp\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/fused_dense\n",
      "  copying build/lib/apex/fused_dense/fused_dense.py -> build/bdist.linux-x86_64/wheel/apex/fused_dense\n",
      "  copying build/lib/apex/fused_dense/__init__.py -> build/bdist.linux-x86_64/wheel/apex/fused_dense\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/parallel\n",
      "  copying build/lib/apex/parallel/LARC.py -> build/bdist.linux-x86_64/wheel/apex/parallel\n",
      "  copying build/lib/apex/parallel/multiproc.py -> build/bdist.linux-x86_64/wheel/apex/parallel\n",
      "  copying build/lib/apex/parallel/sync_batchnorm.py -> build/bdist.linux-x86_64/wheel/apex/parallel\n",
      "  copying build/lib/apex/parallel/optimized_sync_batchnorm.py -> build/bdist.linux-x86_64/wheel/apex/parallel\n",
      "  copying build/lib/apex/parallel/optimized_sync_batchnorm_kernel.py -> build/bdist.linux-x86_64/wheel/apex/parallel\n",
      "  copying build/lib/apex/parallel/distributed.py -> build/bdist.linux-x86_64/wheel/apex/parallel\n",
      "  copying build/lib/apex/parallel/__init__.py -> build/bdist.linux-x86_64/wheel/apex/parallel\n",
      "  copying build/lib/apex/parallel/sync_batchnorm_kernel.py -> build/bdist.linux-x86_64/wheel/apex/parallel\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/amp\n",
      "  copying build/lib/apex/amp/scaler.py -> build/bdist.linux-x86_64/wheel/apex/amp\n",
      "  copying build/lib/apex/amp/__version__.py -> build/bdist.linux-x86_64/wheel/apex/amp\n",
      "  copying build/lib/apex/amp/handle.py -> build/bdist.linux-x86_64/wheel/apex/amp\n",
      "  copying build/lib/apex/amp/opt.py -> build/bdist.linux-x86_64/wheel/apex/amp\n",
      "  copying build/lib/apex/amp/compat.py -> build/bdist.linux-x86_64/wheel/apex/amp\n",
      "  copying build/lib/apex/amp/_process_optimizer.py -> build/bdist.linux-x86_64/wheel/apex/amp\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/amp/lists\n",
      "  copying build/lib/apex/amp/lists/tensor_overrides.py -> build/bdist.linux-x86_64/wheel/apex/amp/lists\n",
      "  copying build/lib/apex/amp/lists/functional_overrides.py -> build/bdist.linux-x86_64/wheel/apex/amp/lists\n",
      "  copying build/lib/apex/amp/lists/__init__.py -> build/bdist.linux-x86_64/wheel/apex/amp/lists\n",
      "  copying build/lib/apex/amp/lists/torch_overrides.py -> build/bdist.linux-x86_64/wheel/apex/amp/lists\n",
      "  copying build/lib/apex/amp/wrap.py -> build/bdist.linux-x86_64/wheel/apex/amp\n",
      "  copying build/lib/apex/amp/utils.py -> build/bdist.linux-x86_64/wheel/apex/amp\n",
      "  copying build/lib/apex/amp/_initialize.py -> build/bdist.linux-x86_64/wheel/apex/amp\n",
      "  copying build/lib/apex/amp/__init__.py -> build/bdist.linux-x86_64/wheel/apex/amp\n",
      "  copying build/lib/apex/amp/frontend.py -> build/bdist.linux-x86_64/wheel/apex/amp\n",
      "  copying build/lib/apex/amp/_amp_state.py -> build/bdist.linux-x86_64/wheel/apex/amp\n",
      "  copying build/lib/apex/amp/amp.py -> build/bdist.linux-x86_64/wheel/apex/amp\n",
      "  copying build/lib/apex/amp/rnn_compat.py -> build/bdist.linux-x86_64/wheel/apex/amp\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/gpu_direct_storage\n",
      "  copying build/lib/apex/contrib/gpu_direct_storage/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/gpu_direct_storage\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/index_mul_2d\n",
      "  copying build/lib/apex/contrib/index_mul_2d/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/index_mul_2d\n",
      "  copying build/lib/apex/contrib/index_mul_2d/index_mul_2d.py -> build/bdist.linux-x86_64/wheel/apex/contrib/index_mul_2d\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/conv_bias_relu\n",
      "  copying build/lib/apex/contrib/conv_bias_relu/conv_bias_relu.py -> build/bdist.linux-x86_64/wheel/apex/contrib/conv_bias_relu\n",
      "  copying build/lib/apex/contrib/conv_bias_relu/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/conv_bias_relu\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/clip_grad\n",
      "  copying build/lib/apex/contrib/clip_grad/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/clip_grad\n",
      "  copying build/lib/apex/contrib/clip_grad/clip_grad.py -> build/bdist.linux-x86_64/wheel/apex/contrib/clip_grad\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/groupbn\n",
      "  copying build/lib/apex/contrib/groupbn/batch_norm.py -> build/bdist.linux-x86_64/wheel/apex/contrib/groupbn\n",
      "  copying build/lib/apex/contrib/groupbn/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/groupbn\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/group_norm\n",
      "  copying build/lib/apex/contrib/group_norm/group_norm.py -> build/bdist.linux-x86_64/wheel/apex/contrib/group_norm\n",
      "  copying build/lib/apex/contrib/group_norm/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/group_norm\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/fmha\n",
      "  copying build/lib/apex/contrib/fmha/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/fmha\n",
      "  copying build/lib/apex/contrib/fmha/fmha.py -> build/bdist.linux-x86_64/wheel/apex/contrib/fmha\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/openfold_triton\n",
      "  copying build/lib/apex/contrib/openfold_triton/layer_norm.py -> build/bdist.linux-x86_64/wheel/apex/contrib/openfold_triton\n",
      "  copying build/lib/apex/contrib/openfold_triton/mha.py -> build/bdist.linux-x86_64/wheel/apex/contrib/openfold_triton\n",
      "  copying build/lib/apex/contrib/openfold_triton/_layer_norm_config_hopper.py -> build/bdist.linux-x86_64/wheel/apex/contrib/openfold_triton\n",
      "  copying build/lib/apex/contrib/openfold_triton/_layer_norm_config_ampere.py -> build/bdist.linux-x86_64/wheel/apex/contrib/openfold_triton\n",
      "  copying build/lib/apex/contrib/openfold_triton/fused_adam_swa.py -> build/bdist.linux-x86_64/wheel/apex/contrib/openfold_triton\n",
      "  copying build/lib/apex/contrib/openfold_triton/_layer_norm_forward_kernels.py -> build/bdist.linux-x86_64/wheel/apex/contrib/openfold_triton\n",
      "  copying build/lib/apex/contrib/openfold_triton/_layer_norm_backward_kernels.py -> build/bdist.linux-x86_64/wheel/apex/contrib/openfold_triton\n",
      "  copying build/lib/apex/contrib/openfold_triton/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/openfold_triton\n",
      "  copying build/lib/apex/contrib/openfold_triton/_mha_kernel.py -> build/bdist.linux-x86_64/wheel/apex/contrib/openfold_triton\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/multihead_attn\n",
      "  copying build/lib/apex/contrib/multihead_attn/encdec_multihead_attn.py -> build/bdist.linux-x86_64/wheel/apex/contrib/multihead_attn\n",
      "  copying build/lib/apex/contrib/multihead_attn/mask_softmax_dropout_func.py -> build/bdist.linux-x86_64/wheel/apex/contrib/multihead_attn\n",
      "  copying build/lib/apex/contrib/multihead_attn/self_multihead_attn.py -> build/bdist.linux-x86_64/wheel/apex/contrib/multihead_attn\n",
      "  copying build/lib/apex/contrib/multihead_attn/fast_encdec_multihead_attn_func.py -> build/bdist.linux-x86_64/wheel/apex/contrib/multihead_attn\n",
      "  copying build/lib/apex/contrib/multihead_attn/fast_encdec_multihead_attn_norm_add_func.py -> build/bdist.linux-x86_64/wheel/apex/contrib/multihead_attn\n",
      "  copying build/lib/apex/contrib/multihead_attn/fast_self_multihead_attn_func.py -> build/bdist.linux-x86_64/wheel/apex/contrib/multihead_attn\n",
      "  copying build/lib/apex/contrib/multihead_attn/encdec_multihead_attn_func.py -> build/bdist.linux-x86_64/wheel/apex/contrib/multihead_attn\n",
      "  copying build/lib/apex/contrib/multihead_attn/self_multihead_attn_func.py -> build/bdist.linux-x86_64/wheel/apex/contrib/multihead_attn\n",
      "  copying build/lib/apex/contrib/multihead_attn/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/multihead_attn\n",
      "  copying build/lib/apex/contrib/multihead_attn/fast_self_multihead_attn_norm_add_func.py -> build/bdist.linux-x86_64/wheel/apex/contrib/multihead_attn\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/layer_norm\n",
      "  copying build/lib/apex/contrib/layer_norm/layer_norm.py -> build/bdist.linux-x86_64/wheel/apex/contrib/layer_norm\n",
      "  copying build/lib/apex/contrib/layer_norm/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/layer_norm\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/nccl_allocator\n",
      "  copying build/lib/apex/contrib/nccl_allocator/nccl_allocator.py -> build/bdist.linux-x86_64/wheel/apex/contrib/nccl_allocator\n",
      "  copying build/lib/apex/contrib/nccl_allocator/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/nccl_allocator\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/bottleneck\n",
      "  copying build/lib/apex/contrib/bottleneck/bottleneck.py -> build/bdist.linux-x86_64/wheel/apex/contrib/bottleneck\n",
      "  copying build/lib/apex/contrib/bottleneck/test.py -> build/bdist.linux-x86_64/wheel/apex/contrib/bottleneck\n",
      "  copying build/lib/apex/contrib/bottleneck/halo_exchangers.py -> build/bdist.linux-x86_64/wheel/apex/contrib/bottleneck\n",
      "  copying build/lib/apex/contrib/bottleneck/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/bottleneck\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/cudnn_gbn\n",
      "  copying build/lib/apex/contrib/cudnn_gbn/batch_norm.py -> build/bdist.linux-x86_64/wheel/apex/contrib/cudnn_gbn\n",
      "  copying build/lib/apex/contrib/cudnn_gbn/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/cudnn_gbn\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/peer_memory\n",
      "  copying build/lib/apex/contrib/peer_memory/peer_halo_exchanger_1d.py -> build/bdist.linux-x86_64/wheel/apex/contrib/peer_memory\n",
      "  copying build/lib/apex/contrib/peer_memory/peer_memory.py -> build/bdist.linux-x86_64/wheel/apex/contrib/peer_memory\n",
      "  copying build/lib/apex/contrib/peer_memory/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/peer_memory\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/focal_loss\n",
      "  copying build/lib/apex/contrib/focal_loss/focal_loss.py -> build/bdist.linux-x86_64/wheel/apex/contrib/focal_loss\n",
      "  copying build/lib/apex/contrib/focal_loss/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/focal_loss\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/sparsity\n",
      "  copying build/lib/apex/contrib/sparsity/permutation_lib.py -> build/bdist.linux-x86_64/wheel/apex/contrib/sparsity\n",
      "  copying build/lib/apex/contrib/sparsity/asp.py -> build/bdist.linux-x86_64/wheel/apex/contrib/sparsity\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/sparsity/permutation_search_kernels\n",
      "  copying build/lib/apex/contrib/sparsity/permutation_search_kernels/exhaustive_search.py -> build/bdist.linux-x86_64/wheel/apex/contrib/sparsity/permutation_search_kernels\n",
      "  copying build/lib/apex/contrib/sparsity/permutation_search_kernels/permutation_utilities.py -> build/bdist.linux-x86_64/wheel/apex/contrib/sparsity/permutation_search_kernels\n",
      "  copying build/lib/apex/contrib/sparsity/permutation_search_kernels/call_permutation_search_kernels.py -> build/bdist.linux-x86_64/wheel/apex/contrib/sparsity/permutation_search_kernels\n",
      "  copying build/lib/apex/contrib/sparsity/permutation_search_kernels/channel_swap.py -> build/bdist.linux-x86_64/wheel/apex/contrib/sparsity/permutation_search_kernels\n",
      "  copying build/lib/apex/contrib/sparsity/permutation_search_kernels/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/sparsity/permutation_search_kernels\n",
      "  copying build/lib/apex/contrib/sparsity/sparse_masklib.py -> build/bdist.linux-x86_64/wheel/apex/contrib/sparsity\n",
      "  copying build/lib/apex/contrib/sparsity/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/sparsity\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/test\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/test/index_mul_2d\n",
      "  copying build/lib/apex/contrib/test/index_mul_2d/test_index_mul_2d.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/index_mul_2d\n",
      "  copying build/lib/apex/contrib/test/index_mul_2d/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/index_mul_2d\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/test/conv_bias_relu\n",
      "  copying build/lib/apex/contrib/test/conv_bias_relu/test_conv_bias_relu.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/conv_bias_relu\n",
      "  copying build/lib/apex/contrib/test/conv_bias_relu/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/conv_bias_relu\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/test/clip_grad\n",
      "  copying build/lib/apex/contrib/test/clip_grad/test_clip_grad.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/clip_grad\n",
      "  copying build/lib/apex/contrib/test/clip_grad/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/clip_grad\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/test/group_norm\n",
      "  copying build/lib/apex/contrib/test/group_norm/test_group_norm.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/group_norm\n",
      "  copying build/lib/apex/contrib/test/group_norm/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/group_norm\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/test/fmha\n",
      "  copying build/lib/apex/contrib/test/fmha/test_fmha.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/fmha\n",
      "  copying build/lib/apex/contrib/test/fmha/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/fmha\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/test/multihead_attn\n",
      "  copying build/lib/apex/contrib/test/multihead_attn/test_encdec_multihead_attn.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/multihead_attn\n",
      "  copying build/lib/apex/contrib/test/multihead_attn/test_self_multihead_attn_norm_add.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/multihead_attn\n",
      "  copying build/lib/apex/contrib/test/multihead_attn/test_encdec_multihead_attn_norm_add.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/multihead_attn\n",
      "  copying build/lib/apex/contrib/test/multihead_attn/test_fast_self_multihead_attn_bias.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/multihead_attn\n",
      "  copying build/lib/apex/contrib/test/multihead_attn/test_self_multihead_attn.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/multihead_attn\n",
      "  copying build/lib/apex/contrib/test/multihead_attn/test_mha_fused_softmax.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/multihead_attn\n",
      "  copying build/lib/apex/contrib/test/multihead_attn/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/multihead_attn\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/test/layer_norm\n",
      "  copying build/lib/apex/contrib/test/layer_norm/test_fast_layer_norm.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/layer_norm\n",
      "  copying build/lib/apex/contrib/test/layer_norm/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/layer_norm\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/test/bottleneck\n",
      "  copying build/lib/apex/contrib/test/bottleneck/test_bottleneck_module.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/bottleneck\n",
      "  copying build/lib/apex/contrib/test/bottleneck/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/bottleneck\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/test/cudnn_gbn\n",
      "  copying build/lib/apex/contrib/test/cudnn_gbn/test_cudnn_gbn_with_two_gpus.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/cudnn_gbn\n",
      "  copying build/lib/apex/contrib/test/cudnn_gbn/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/cudnn_gbn\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/test/peer_memory\n",
      "  copying build/lib/apex/contrib/test/peer_memory/test_peer_halo_exchange_module.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/peer_memory\n",
      "  copying build/lib/apex/contrib/test/peer_memory/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/peer_memory\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/test/focal_loss\n",
      "  copying build/lib/apex/contrib/test/focal_loss/test_focal_loss.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/focal_loss\n",
      "  copying build/lib/apex/contrib/test/focal_loss/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/focal_loss\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/test/optimizers\n",
      "  copying build/lib/apex/contrib/test/optimizers/test_dist_adam.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/optimizers\n",
      "  copying build/lib/apex/contrib/test/optimizers/test_distributed_fused_lamb.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/optimizers\n",
      "  copying build/lib/apex/contrib/test/optimizers/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/optimizers\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/test/xentropy\n",
      "  copying build/lib/apex/contrib/test/xentropy/test_label_smoothing.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/xentropy\n",
      "  copying build/lib/apex/contrib/test/xentropy/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/xentropy\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/test/transducer\n",
      "  copying build/lib/apex/contrib/test/transducer/test_transducer_loss.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/transducer\n",
      "  copying build/lib/apex/contrib/test/transducer/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/transducer\n",
      "  copying build/lib/apex/contrib/test/transducer/test_transducer_joint.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test/transducer\n",
      "  copying build/lib/apex/contrib/test/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/test\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/optimizers\n",
      "  copying build/lib/apex/contrib/optimizers/fused_lamb.py -> build/bdist.linux-x86_64/wheel/apex/contrib/optimizers\n",
      "  copying build/lib/apex/contrib/optimizers/fused_adam.py -> build/bdist.linux-x86_64/wheel/apex/contrib/optimizers\n",
      "  copying build/lib/apex/contrib/optimizers/fp16_optimizer.py -> build/bdist.linux-x86_64/wheel/apex/contrib/optimizers\n",
      "  copying build/lib/apex/contrib/optimizers/distributed_fused_adam.py -> build/bdist.linux-x86_64/wheel/apex/contrib/optimizers\n",
      "  copying build/lib/apex/contrib/optimizers/distributed_fused_lamb.py -> build/bdist.linux-x86_64/wheel/apex/contrib/optimizers\n",
      "  copying build/lib/apex/contrib/optimizers/fused_sgd.py -> build/bdist.linux-x86_64/wheel/apex/contrib/optimizers\n",
      "  copying build/lib/apex/contrib/optimizers/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/optimizers\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/xentropy\n",
      "  copying build/lib/apex/contrib/xentropy/softmax_xentropy.py -> build/bdist.linux-x86_64/wheel/apex/contrib/xentropy\n",
      "  copying build/lib/apex/contrib/xentropy/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/xentropy\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/contrib/transducer\n",
      "  copying build/lib/apex/contrib/transducer/_transducer_ref.py -> build/bdist.linux-x86_64/wheel/apex/contrib/transducer\n",
      "  copying build/lib/apex/contrib/transducer/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib/transducer\n",
      "  copying build/lib/apex/contrib/transducer/transducer.py -> build/bdist.linux-x86_64/wheel/apex/contrib/transducer\n",
      "  copying build/lib/apex/contrib/__init__.py -> build/bdist.linux-x86_64/wheel/apex/contrib\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/optimizers\n",
      "  copying build/lib/apex/optimizers/fused_novograd.py -> build/bdist.linux-x86_64/wheel/apex/optimizers\n",
      "  copying build/lib/apex/optimizers/fused_lamb.py -> build/bdist.linux-x86_64/wheel/apex/optimizers\n",
      "  copying build/lib/apex/optimizers/fused_adam.py -> build/bdist.linux-x86_64/wheel/apex/optimizers\n",
      "  copying build/lib/apex/optimizers/fused_adagrad.py -> build/bdist.linux-x86_64/wheel/apex/optimizers\n",
      "  copying build/lib/apex/optimizers/fused_mixed_precision_lamb.py -> build/bdist.linux-x86_64/wheel/apex/optimizers\n",
      "  copying build/lib/apex/optimizers/fused_sgd.py -> build/bdist.linux-x86_64/wheel/apex/optimizers\n",
      "  copying build/lib/apex/optimizers/__init__.py -> build/bdist.linux-x86_64/wheel/apex/optimizers\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/multi_tensor_apply\n",
      "  copying build/lib/apex/multi_tensor_apply/multi_tensor_apply.py -> build/bdist.linux-x86_64/wheel/apex/multi_tensor_apply\n",
      "  copying build/lib/apex/multi_tensor_apply/__init__.py -> build/bdist.linux-x86_64/wheel/apex/multi_tensor_apply\n",
      "  copying build/lib/apex/__init__.py -> build/bdist.linux-x86_64/wheel/apex\n",
      "  creating build/bdist.linux-x86_64/wheel/apex/normalization\n",
      "  copying build/lib/apex/normalization/fused_layer_norm.py -> build/bdist.linux-x86_64/wheel/apex/normalization\n",
      "  copying build/lib/apex/normalization/__init__.py -> build/bdist.linux-x86_64/wheel/apex/normalization\n",
      "  running install_egg_info\n",
      "  running egg_info\n",
      "  writing apex.egg-info/PKG-INFO\n",
      "  writing dependency_links to apex.egg-info/dependency_links.txt\n",
      "  writing requirements to apex.egg-info/requires.txt\n",
      "  writing top-level names to apex.egg-info/top_level.txt\n",
      "  reading manifest file 'apex.egg-info/SOURCES.txt'\n",
      "  adding license file 'LICENSE'\n",
      "  writing manifest file 'apex.egg-info/SOURCES.txt'\n",
      "  Copying apex.egg-info to build/bdist.linux-x86_64/wheel/apex-0.1-py3.10.egg-info\n",
      "  running install_scripts\n",
      "  creating build/bdist.linux-x86_64/wheel/apex-0.1.dist-info/WHEEL\n",
      "  creating '/tmp/pip-wheel-9vbarcid/.tmp-nkpflb3v/apex-0.1-py3-none-any.whl' and adding 'build/bdist.linux-x86_64/wheel' to it\n",
      "  adding 'apex/__init__.py'\n",
      "  adding 'apex/_autocast_utils.py'\n",
      "  adding 'apex/RNN/RNNBackend.py'\n",
      "  adding 'apex/RNN/__init__.py'\n",
      "  adding 'apex/RNN/cells.py'\n",
      "  adding 'apex/RNN/models.py'\n",
      "  adding 'apex/amp/__init__.py'\n",
      "  adding 'apex/amp/__version__.py'\n",
      "  adding 'apex/amp/_amp_state.py'\n",
      "  adding 'apex/amp/_initialize.py'\n",
      "  adding 'apex/amp/_process_optimizer.py'\n",
      "  adding 'apex/amp/amp.py'\n",
      "  adding 'apex/amp/compat.py'\n",
      "  adding 'apex/amp/frontend.py'\n",
      "  adding 'apex/amp/handle.py'\n",
      "  adding 'apex/amp/opt.py'\n",
      "  adding 'apex/amp/rnn_compat.py'\n",
      "  adding 'apex/amp/scaler.py'\n",
      "  adding 'apex/amp/utils.py'\n",
      "  adding 'apex/amp/wrap.py'\n",
      "  adding 'apex/amp/lists/__init__.py'\n",
      "  adding 'apex/amp/lists/functional_overrides.py'\n",
      "  adding 'apex/amp/lists/tensor_overrides.py'\n",
      "  adding 'apex/amp/lists/torch_overrides.py'\n",
      "  adding 'apex/contrib/__init__.py'\n",
      "  adding 'apex/contrib/bottleneck/__init__.py'\n",
      "  adding 'apex/contrib/bottleneck/bottleneck.py'\n",
      "  adding 'apex/contrib/bottleneck/halo_exchangers.py'\n",
      "  adding 'apex/contrib/bottleneck/test.py'\n",
      "  adding 'apex/contrib/clip_grad/__init__.py'\n",
      "  adding 'apex/contrib/clip_grad/clip_grad.py'\n",
      "  adding 'apex/contrib/conv_bias_relu/__init__.py'\n",
      "  adding 'apex/contrib/conv_bias_relu/conv_bias_relu.py'\n",
      "  adding 'apex/contrib/cudnn_gbn/__init__.py'\n",
      "  adding 'apex/contrib/cudnn_gbn/batch_norm.py'\n",
      "  adding 'apex/contrib/fmha/__init__.py'\n",
      "  adding 'apex/contrib/fmha/fmha.py'\n",
      "  adding 'apex/contrib/focal_loss/__init__.py'\n",
      "  adding 'apex/contrib/focal_loss/focal_loss.py'\n",
      "  adding 'apex/contrib/gpu_direct_storage/__init__.py'\n",
      "  adding 'apex/contrib/group_norm/__init__.py'\n",
      "  adding 'apex/contrib/group_norm/group_norm.py'\n",
      "  adding 'apex/contrib/groupbn/__init__.py'\n",
      "  adding 'apex/contrib/groupbn/batch_norm.py'\n",
      "  adding 'apex/contrib/index_mul_2d/__init__.py'\n",
      "  adding 'apex/contrib/index_mul_2d/index_mul_2d.py'\n",
      "  adding 'apex/contrib/layer_norm/__init__.py'\n",
      "  adding 'apex/contrib/layer_norm/layer_norm.py'\n",
      "  adding 'apex/contrib/multihead_attn/__init__.py'\n",
      "  adding 'apex/contrib/multihead_attn/encdec_multihead_attn.py'\n",
      "  adding 'apex/contrib/multihead_attn/encdec_multihead_attn_func.py'\n",
      "  adding 'apex/contrib/multihead_attn/fast_encdec_multihead_attn_func.py'\n",
      "  adding 'apex/contrib/multihead_attn/fast_encdec_multihead_attn_norm_add_func.py'\n",
      "  adding 'apex/contrib/multihead_attn/fast_self_multihead_attn_func.py'\n",
      "  adding 'apex/contrib/multihead_attn/fast_self_multihead_attn_norm_add_func.py'\n",
      "  adding 'apex/contrib/multihead_attn/mask_softmax_dropout_func.py'\n",
      "  adding 'apex/contrib/multihead_attn/self_multihead_attn.py'\n",
      "  adding 'apex/contrib/multihead_attn/self_multihead_attn_func.py'\n",
      "  adding 'apex/contrib/nccl_allocator/__init__.py'\n",
      "  adding 'apex/contrib/nccl_allocator/nccl_allocator.py'\n",
      "  adding 'apex/contrib/openfold_triton/__init__.py'\n",
      "  adding 'apex/contrib/openfold_triton/_layer_norm_backward_kernels.py'\n",
      "  adding 'apex/contrib/openfold_triton/_layer_norm_config_ampere.py'\n",
      "  adding 'apex/contrib/openfold_triton/_layer_norm_config_hopper.py'\n",
      "  adding 'apex/contrib/openfold_triton/_layer_norm_forward_kernels.py'\n",
      "  adding 'apex/contrib/openfold_triton/_mha_kernel.py'\n",
      "  adding 'apex/contrib/openfold_triton/fused_adam_swa.py'\n",
      "  adding 'apex/contrib/openfold_triton/layer_norm.py'\n",
      "  adding 'apex/contrib/openfold_triton/mha.py'\n",
      "  adding 'apex/contrib/optimizers/__init__.py'\n",
      "  adding 'apex/contrib/optimizers/distributed_fused_adam.py'\n",
      "  adding 'apex/contrib/optimizers/distributed_fused_lamb.py'\n",
      "  adding 'apex/contrib/optimizers/fp16_optimizer.py'\n",
      "  adding 'apex/contrib/optimizers/fused_adam.py'\n",
      "  adding 'apex/contrib/optimizers/fused_lamb.py'\n",
      "  adding 'apex/contrib/optimizers/fused_sgd.py'\n",
      "  adding 'apex/contrib/peer_memory/__init__.py'\n",
      "  adding 'apex/contrib/peer_memory/peer_halo_exchanger_1d.py'\n",
      "  adding 'apex/contrib/peer_memory/peer_memory.py'\n",
      "  adding 'apex/contrib/sparsity/__init__.py'\n",
      "  adding 'apex/contrib/sparsity/asp.py'\n",
      "  adding 'apex/contrib/sparsity/permutation_lib.py'\n",
      "  adding 'apex/contrib/sparsity/sparse_masklib.py'\n",
      "  adding 'apex/contrib/sparsity/permutation_search_kernels/__init__.py'\n",
      "  adding 'apex/contrib/sparsity/permutation_search_kernels/call_permutation_search_kernels.py'\n",
      "  adding 'apex/contrib/sparsity/permutation_search_kernels/channel_swap.py'\n",
      "  adding 'apex/contrib/sparsity/permutation_search_kernels/exhaustive_search.py'\n",
      "  adding 'apex/contrib/sparsity/permutation_search_kernels/permutation_utilities.py'\n",
      "  adding 'apex/contrib/test/__init__.py'\n",
      "  adding 'apex/contrib/test/bottleneck/__init__.py'\n",
      "  adding 'apex/contrib/test/bottleneck/test_bottleneck_module.py'\n",
      "  adding 'apex/contrib/test/clip_grad/__init__.py'\n",
      "  adding 'apex/contrib/test/clip_grad/test_clip_grad.py'\n",
      "  adding 'apex/contrib/test/conv_bias_relu/__init__.py'\n",
      "  adding 'apex/contrib/test/conv_bias_relu/test_conv_bias_relu.py'\n",
      "  adding 'apex/contrib/test/cudnn_gbn/__init__.py'\n",
      "  adding 'apex/contrib/test/cudnn_gbn/test_cudnn_gbn_with_two_gpus.py'\n",
      "  adding 'apex/contrib/test/fmha/__init__.py'\n",
      "  adding 'apex/contrib/test/fmha/test_fmha.py'\n",
      "  adding 'apex/contrib/test/focal_loss/__init__.py'\n",
      "  adding 'apex/contrib/test/focal_loss/test_focal_loss.py'\n",
      "  adding 'apex/contrib/test/group_norm/__init__.py'\n",
      "  adding 'apex/contrib/test/group_norm/test_group_norm.py'\n",
      "  adding 'apex/contrib/test/index_mul_2d/__init__.py'\n",
      "  adding 'apex/contrib/test/index_mul_2d/test_index_mul_2d.py'\n",
      "  adding 'apex/contrib/test/layer_norm/__init__.py'\n",
      "  adding 'apex/contrib/test/layer_norm/test_fast_layer_norm.py'\n",
      "  adding 'apex/contrib/test/multihead_attn/__init__.py'\n",
      "  adding 'apex/contrib/test/multihead_attn/test_encdec_multihead_attn.py'\n",
      "  adding 'apex/contrib/test/multihead_attn/test_encdec_multihead_attn_norm_add.py'\n",
      "  adding 'apex/contrib/test/multihead_attn/test_fast_self_multihead_attn_bias.py'\n",
      "  adding 'apex/contrib/test/multihead_attn/test_mha_fused_softmax.py'\n",
      "  adding 'apex/contrib/test/multihead_attn/test_self_multihead_attn.py'\n",
      "  adding 'apex/contrib/test/multihead_attn/test_self_multihead_attn_norm_add.py'\n",
      "  adding 'apex/contrib/test/optimizers/__init__.py'\n",
      "  adding 'apex/contrib/test/optimizers/test_dist_adam.py'\n",
      "  adding 'apex/contrib/test/optimizers/test_distributed_fused_lamb.py'\n",
      "  adding 'apex/contrib/test/peer_memory/__init__.py'\n",
      "  adding 'apex/contrib/test/peer_memory/test_peer_halo_exchange_module.py'\n",
      "  adding 'apex/contrib/test/transducer/__init__.py'\n",
      "  adding 'apex/contrib/test/transducer/test_transducer_joint.py'\n",
      "  adding 'apex/contrib/test/transducer/test_transducer_loss.py'\n",
      "  adding 'apex/contrib/test/xentropy/__init__.py'\n",
      "  adding 'apex/contrib/test/xentropy/test_label_smoothing.py'\n",
      "  adding 'apex/contrib/transducer/__init__.py'\n",
      "  adding 'apex/contrib/transducer/_transducer_ref.py'\n",
      "  adding 'apex/contrib/transducer/transducer.py'\n",
      "  adding 'apex/contrib/xentropy/__init__.py'\n",
      "  adding 'apex/contrib/xentropy/softmax_xentropy.py'\n",
      "  adding 'apex/fp16_utils/__init__.py'\n",
      "  adding 'apex/fp16_utils/fp16_optimizer.py'\n",
      "  adding 'apex/fp16_utils/fp16util.py'\n",
      "  adding 'apex/fp16_utils/loss_scaler.py'\n",
      "  adding 'apex/fused_dense/__init__.py'\n",
      "  adding 'apex/fused_dense/fused_dense.py'\n",
      "  adding 'apex/mlp/__init__.py'\n",
      "  adding 'apex/mlp/mlp.py'\n",
      "  adding 'apex/multi_tensor_apply/__init__.py'\n",
      "  adding 'apex/multi_tensor_apply/multi_tensor_apply.py'\n",
      "  adding 'apex/normalization/__init__.py'\n",
      "  adding 'apex/normalization/fused_layer_norm.py'\n",
      "  adding 'apex/optimizers/__init__.py'\n",
      "  adding 'apex/optimizers/fused_adagrad.py'\n",
      "  adding 'apex/optimizers/fused_adam.py'\n",
      "  adding 'apex/optimizers/fused_lamb.py'\n",
      "  adding 'apex/optimizers/fused_mixed_precision_lamb.py'\n",
      "  adding 'apex/optimizers/fused_novograd.py'\n",
      "  adding 'apex/optimizers/fused_sgd.py'\n",
      "  adding 'apex/parallel/LARC.py'\n",
      "  adding 'apex/parallel/__init__.py'\n",
      "  adding 'apex/parallel/distributed.py'\n",
      "  adding 'apex/parallel/multiproc.py'\n",
      "  adding 'apex/parallel/optimized_sync_batchnorm.py'\n",
      "  adding 'apex/parallel/optimized_sync_batchnorm_kernel.py'\n",
      "  adding 'apex/parallel/sync_batchnorm.py'\n",
      "  adding 'apex/parallel/sync_batchnorm_kernel.py'\n",
      "  adding 'apex/transformer/__init__.py'\n",
      "  adding 'apex/transformer/_ucc_util.py'\n",
      "  adding 'apex/transformer/enums.py'\n",
      "  adding 'apex/transformer/log_util.py'\n",
      "  adding 'apex/transformer/microbatches.py'\n",
      "  adding 'apex/transformer/parallel_state.py'\n",
      "  adding 'apex/transformer/utils.py'\n",
      "  adding 'apex/transformer/_data/__init__.py'\n",
      "  adding 'apex/transformer/_data/_batchsampler.py'\n",
      "  adding 'apex/transformer/amp/__init__.py'\n",
      "  adding 'apex/transformer/amp/grad_scaler.py'\n",
      "  adding 'apex/transformer/functional/__init__.py'\n",
      "  adding 'apex/transformer/functional/fused_rope.py'\n",
      "  adding 'apex/transformer/functional/fused_softmax.py'\n",
      "  adding 'apex/transformer/layers/__init__.py'\n",
      "  adding 'apex/transformer/layers/layer_norm.py'\n",
      "  adding 'apex/transformer/pipeline_parallel/__init__.py'\n",
      "  adding 'apex/transformer/pipeline_parallel/_timers.py'\n",
      "  adding 'apex/transformer/pipeline_parallel/p2p_communication.py'\n",
      "  adding 'apex/transformer/pipeline_parallel/utils.py'\n",
      "  adding 'apex/transformer/pipeline_parallel/schedules/__init__.py'\n",
      "  adding 'apex/transformer/pipeline_parallel/schedules/common.py'\n",
      "  adding 'apex/transformer/pipeline_parallel/schedules/fwd_bwd_no_pipelining.py'\n",
      "  adding 'apex/transformer/pipeline_parallel/schedules/fwd_bwd_pipelining_with_interleaving.py'\n",
      "  adding 'apex/transformer/pipeline_parallel/schedules/fwd_bwd_pipelining_without_interleaving.py'\n",
      "  adding 'apex/transformer/tensor_parallel/__init__.py'\n",
      "  adding 'apex/transformer/tensor_parallel/cross_entropy.py'\n",
      "  adding 'apex/transformer/tensor_parallel/data.py'\n",
      "  adding 'apex/transformer/tensor_parallel/layers.py'\n",
      "  adding 'apex/transformer/tensor_parallel/mappings.py'\n",
      "  adding 'apex/transformer/tensor_parallel/memory.py'\n",
      "  adding 'apex/transformer/tensor_parallel/random.py'\n",
      "  adding 'apex/transformer/tensor_parallel/utils.py'\n",
      "  adding 'apex/transformer/testing/__init__.py'\n",
      "  adding 'apex/transformer/testing/arguments.py'\n",
      "  adding 'apex/transformer/testing/commons.py'\n",
      "  adding 'apex/transformer/testing/distributed_test_base.py'\n",
      "  adding 'apex/transformer/testing/global_vars.py'\n",
      "  adding 'apex/transformer/testing/standalone_bert.py'\n",
      "  adding 'apex/transformer/testing/standalone_gpt.py'\n",
      "  adding 'apex/transformer/testing/standalone_transformer_lm.py'\n",
      "  adding 'apex-0.1.dist-info/LICENSE'\n",
      "  adding 'apex-0.1.dist-info/METADATA'\n",
      "  adding 'apex-0.1.dist-info/WHEEL'\n",
      "  adding 'apex-0.1.dist-info/top_level.txt'\n",
      "  adding 'apex-0.1.dist-info/RECORD'\n",
      "  removing build/bdist.linux-x86_64/wheel\n",
      "  Building wheel for apex (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n",
      "  Created wheel for apex: filename=apex-0.1-py3-none-any.whl size=403781 sha256=274d8ff0fc327081a0cf7023066ea4fc9ba93252091622b6cb4e870ffd7319c3\n",
      "  Stored in directory: /tmp/pip-ephem-wheel-cache-hooazz12/wheels/52/e1/eb/d2274c2728a27d95954a616b430844bf1a248da9f2317330e9\n",
      "Successfully built apex\n",
      "Installing collected packages: apex\n",
      "Successfully installed apex-0.1\n"
     ]
    }
   ],
   "source": [
    "! pip3 install torch torchvision torchaudio\n",
    "! git clone https://github.com/NVIDIA/apex\n",
    "%cd apex\n",
    "! pip uninstall packaging -y\n",
    "! pip install packaging \n",
    "! pip install -v --disable-pip-version-check --no-cache-dir --no-build-isolation --global-option=\"--cpp_ext\" --global-option=\"--cuda_ext\" ./\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "import argparse\n",
    "import copy\n",
    "import logging\n",
    "import os\n",
    "import time\n",
    "\n",
    "import numpy as np\n",
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n",
    "from apex import amp\n",
    "\n",
    "from preact_resnet import PreActResNet18\n",
    "from utils import (upper_limit, lower_limit, std, clamp, get_loaders,\n",
    "    attack_pgd, evaluate_pgd, evaluate_standard)\n",
    "\n",
    "logger = logging.getLogger(__name__)\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "def get_args():\n",
    "    parser = argparse.ArgumentParser()\n",
    "    parser.add_argument('--batch-size', default=128, type=int)\n",
    "    parser.add_argument('--data-dir', default='../../cifar-data', type=str)\n",
    "    parser.add_argument('--epochs', default=30, type=int)\n",
    "    parser.add_argument('--lr-schedule', default='cyclic', choices=['cyclic', 'multistep'])\n",
    "    parser.add_argument('--lr-min', default=0., type=float) # 0.0\n",
    "    parser.add_argument('--lr-max', default=0.2, type=float) # 0.2\n",
    "    parser.add_argument('--weight-decay', default=5e-4, type=float)\n",
    "    parser.add_argument('--momentum', default=0.9, type=float)\n",
    "    #parser.add_argument('--epsilon', default=8, type=int)\n",
    "    #parser.add_argument('--alpha', default=10, type=float, help='Step size')\n",
    "    parser.add_argument('--delta-init', default='random', choices=['zero', 'random', 'previous'],\n",
    "        help='Perturbation initialization method')\n",
    "    parser.add_argument('--out-dir', default='train_fgsm_output', type=str, help='Output directory')\n",
    "    parser.add_argument('--seed', default=0, type=int, help='Random seed')\n",
    "    parser.add_argument('--early-stop', action='store_true', help='Early stop if overfitting occurs')\n",
    "    parser.add_argument('--opt-level', default='O2', type=str, choices=['O0', 'O1', 'O2'],\n",
    "        help='O0 is FP32 training, O1 is Mixed Precision, and O2 is \"Almost FP16\" Mixed Precision')\n",
    "    parser.add_argument('--loss-scale', default='1.0', type=str, choices=['1.0', 'dynamic'],\n",
    "        help='If loss_scale is \"dynamic\", adaptively adjust the loss scale over time')\n",
    "    parser.add_argument('--master-weights', action='store_true',\n",
    "        help='Maintain FP32 master weights to accompany any FP16 model weights, not applicable for O1 opt level')\n",
    "    args, unknown = parser.parse_known_args()\n",
    "\n",
    "    return args"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "8 10.0\n",
      "Files already downloaded and verified\n",
      "Files already downloaded and verified\n",
      "train_idx_check =  1249038303\n",
      "test_idx_check =  4955575\n",
      "load data ...\n",
      "Epoch \t Seconds \t LR \t \t Train Loss \t Train Acc\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/ec2-user/anaconda3/envs/python3/lib/python3.10/site-packages/apex/amp/scaler.py:56: UserWarning: The torch.cuda.*DtypeTensor constructors are no longer recommended. It's best to use methods such as torch.tensor(data, dtype=*, device='cuda') to create tensors. (Triggered internally at ../torch/csrc/tensor/python_tensor.cpp:78.)\n",
      "  self._overflow_buf = torch.cuda.IntTensor([0])\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 \t 30.3 \t \t 0.0133 \t 2.1963 \t 0.1691\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/ec2-user/anaconda3/envs/python3/lib/python3.10/site-packages/torch/optim/lr_scheduler.py:1613: UserWarning: To get the last learning rate computed by the scheduler, please use `get_last_lr()`.\n",
      "  _warn_get_lr_called_within_step(self)\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1 \t 30.0 \t \t 0.0267 \t 1.9403 \t 0.2648\n",
      "2 \t 30.1 \t \t 0.0400 \t 1.8435 \t 0.3010\n",
      "3 \t 30.1 \t \t 0.0533 \t 1.7588 \t 0.3308\n",
      "4 \t 30.2 \t \t 0.0667 \t 1.6810 \t 0.3580\n",
      "5 \t 30.2 \t \t 0.0800 \t 1.6055 \t 0.3855\n",
      "6 \t 30.2 \t \t 0.0933 \t 1.5415 \t 0.4128\n",
      "7 \t 30.2 \t \t 0.1067 \t 1.4959 \t 0.4299\n",
      "8 \t 30.2 \t \t 0.1200 \t 1.4586 \t 0.4396\n",
      "9 \t 30.2 \t \t 0.1333 \t 1.4249 \t 0.4518\n",
      "10 \t 30.2 \t \t 0.1467 \t 1.4000 \t 0.4645\n",
      "11 \t 30.2 \t \t 0.1600 \t 1.3773 \t 0.4737\n",
      "12 \t 30.2 \t \t 0.1733 \t 1.3583 \t 0.4782\n",
      "13 \t 30.2 \t \t 0.1867 \t 1.3521 \t 0.4817\n",
      "14 \t 30.2 \t \t 0.2000 \t 1.3354 \t 0.4831\n",
      "15 \t 30.2 \t \t 0.1867 \t 1.3268 \t 0.4864\n",
      "16 \t 30.2 \t \t 0.1733 \t 1.2987 \t 0.4979\n",
      "17 \t 30.2 \t \t 0.1600 \t 1.2814 \t 0.5047\n",
      "18 \t 30.2 \t \t 0.1467 \t 1.2586 \t 0.5142\n",
      "19 \t 30.2 \t \t 0.1333 \t 1.2331 \t 0.5233\n",
      "20 \t 30.2 \t \t 0.1200 \t 1.2119 \t 0.5282\n",
      "21 \t 30.2 \t \t 0.1067 \t 1.1836 \t 0.5379\n",
      "22 \t 30.2 \t \t 0.0933 \t 1.1561 \t 0.5497\n",
      "23 \t 30.2 \t \t 0.0800 \t 1.1142 \t 0.5615\n",
      "24 \t 30.2 \t \t 0.0667 \t 1.0837 \t 0.5740\n",
      "25 \t 30.3 \t \t 0.0533 \t 1.0301 \t 0.5920\n",
      "26 \t 30.3 \t \t 0.0400 \t 0.9725 \t 0.6154\n",
      "27 \t 30.3 \t \t 0.0267 \t 0.9013 \t 0.6388\n",
      "28 \t 30.3 \t \t 0.0133 \t 0.7999 \t 0.6810\n",
      "29 \t 30.3 \t \t 0.0000 \t 0.6771 \t 0.7299\n",
      "Total train time: 15.1024 minutes\n",
      "0 / 8\n",
      "1 / 8\n",
      "2 / 8\n",
      "3 / 8\n",
      "4 / 8\n",
      "5 / 8\n",
      "6 / 8\n",
      "7 / 8\n",
      "Test Loss \t Test Acc \t PGD Loss \t PGD Acc\n",
      "0.5240 \t 0.8300 \t 0.9665 \t 0.4200\n",
      "Total evaluation time: 6.1618 minutes\n",
      "6 7.5\n",
      "Files already downloaded and verified\n",
      "Files already downloaded and verified\n",
      "train_idx_check =  1249038303\n",
      "test_idx_check =  4955575\n",
      "load data ...\n",
      "Epoch \t Seconds \t LR \t \t Train Loss \t Train Acc\n",
      "0 \t 30.3 \t \t 0.0133 \t 2.1318 \t 0.1916\n",
      "1 \t 30.3 \t \t 0.0267 \t 1.8404 \t 0.3018\n",
      "2 \t 30.3 \t \t 0.0400 \t 1.7182 \t 0.3480\n",
      "3 \t 30.3 \t \t 0.0533 \t 1.6127 \t 0.3873\n",
      "4 \t 30.3 \t \t 0.0667 \t 1.5242 \t 0.4212\n",
      "5 \t 30.3 \t \t 0.0800 \t 1.4395 \t 0.4518\n",
      "6 \t 30.3 \t \t 0.0933 \t 1.3732 \t 0.4771\n",
      "7 \t 30.3 \t \t 0.1067 \t 1.3299 \t 0.4958\n",
      "8 \t 30.3 \t \t 0.1200 \t 1.2910 \t 0.5072\n",
      "9 \t 30.3 \t \t 0.1333 \t 1.2574 \t 0.5201\n",
      "10 \t 30.2 \t \t 0.1467 \t 1.2309 \t 0.5299\n",
      "11 \t 30.3 \t \t 0.1600 \t 1.2118 \t 0.5378\n",
      "12 \t 30.2 \t \t 0.1733 \t 1.1947 \t 0.5443\n",
      "13 \t 30.3 \t \t 0.1867 \t 1.1882 \t 0.5463\n",
      "14 \t 30.3 \t \t 0.2000 \t 1.1754 \t 0.5493\n",
      "15 \t 30.3 \t \t 0.1867 \t 1.1659 \t 0.5541\n",
      "16 \t 30.2 \t \t 0.1733 \t 1.1323 \t 0.5663\n",
      "17 \t 30.2 \t \t 0.1600 \t 1.1191 \t 0.5679\n",
      "18 \t 30.2 \t \t 0.1467 \t 1.0884 \t 0.5811\n",
      "19 \t 30.3 \t \t 0.1333 \t 1.0656 \t 0.5903\n",
      "20 \t 30.3 \t \t 0.1200 \t 1.0475 \t 0.5946\n",
      "21 \t 30.2 \t \t 0.1067 \t 1.0095 \t 0.6080\n",
      "22 \t 30.2 \t \t 0.0933 \t 0.9803 \t 0.6200\n",
      "23 \t 30.2 \t \t 0.0800 \t 0.9443 \t 0.6321\n",
      "24 \t 30.2 \t \t 0.0667 \t 0.9049 \t 0.6480\n",
      "25 \t 30.3 \t \t 0.0533 \t 0.8520 \t 0.6690\n",
      "26 \t 30.2 \t \t 0.0400 \t 0.7968 \t 0.6888\n",
      "27 \t 30.2 \t \t 0.0267 \t 0.7222 \t 0.7173\n",
      "28 \t 30.2 \t \t 0.0133 \t 0.6193 \t 0.7582\n",
      "29 \t 30.2 \t \t 0.0000 \t 0.4972 \t 0.8066\n",
      "Total train time: 15.1282 minutes\n",
      "0 / 8\n",
      "1 / 8\n",
      "2 / 8\n",
      "3 / 8\n",
      "4 / 8\n",
      "5 / 8\n",
      "6 / 8\n",
      "7 / 8\n",
      "Test Loss \t Test Acc \t PGD Loss \t PGD Acc\n",
      "0.4262 \t 0.8580 \t 0.9864 \t 0.3690\n",
      "Total evaluation time: 6.1471 minutes\n",
      "4 5.0\n",
      "Files already downloaded and verified\n",
      "Files already downloaded and verified\n",
      "train_idx_check =  1249038303\n",
      "test_idx_check =  4955575\n",
      "load data ...\n",
      "Epoch \t Seconds \t LR \t \t Train Loss \t Train Acc\n",
      "0 \t 30.3 \t \t 0.0133 \t 2.0448 \t 0.2228\n",
      "1 \t 30.3 \t \t 0.0267 \t 1.7035 \t 0.3548\n",
      "2 \t 30.3 \t \t 0.0400 \t 1.5447 \t 0.4171\n",
      "3 \t 30.3 \t \t 0.0533 \t 1.4159 \t 0.4672\n",
      "4 \t 30.3 \t \t 0.0667 \t 1.3203 \t 0.4989\n",
      "5 \t 30.2 \t \t 0.0800 \t 1.2310 \t 0.5345\n",
      "6 \t 30.3 \t \t 0.0933 \t 1.1678 \t 0.5615\n",
      "7 \t 30.2 \t \t 0.1067 \t 1.1241 \t 0.5801\n",
      "8 \t 30.3 \t \t 0.1200 \t 1.0846 \t 0.5926\n",
      "9 \t 30.2 \t \t 0.1333 \t 1.0499 \t 0.6038\n",
      "10 \t 30.2 \t \t 0.1467 \t 1.0274 \t 0.6133\n",
      "11 \t 30.2 \t \t 0.1600 \t 1.0102 \t 0.6200\n",
      "12 \t 30.2 \t \t 0.1733 \t 0.9930 \t 0.6251\n",
      "13 \t 30.2 \t \t 0.1867 \t 0.9924 \t 0.6251\n",
      "14 \t 30.2 \t \t 0.2000 \t 0.9755 \t 0.6324\n",
      "15 \t 30.2 \t \t 0.1867 \t 0.9638 \t 0.6364\n",
      "16 \t 30.2 \t \t 0.1733 \t 0.9363 \t 0.6472\n",
      "17 \t 30.2 \t \t 0.1600 \t 0.9201 \t 0.6516\n",
      "18 \t 30.3 \t \t 0.1467 \t 0.8909 \t 0.6633\n",
      "19 \t 30.2 \t \t 0.1333 \t 0.8641 \t 0.6727\n",
      "20 \t 30.2 \t \t 0.1200 \t 0.8406 \t 0.6822\n",
      "21 \t 30.2 \t \t 0.1067 \t 0.8089 \t 0.6922\n",
      "22 \t 30.2 \t \t 0.0933 \t 0.7773 \t 0.7029\n",
      "23 \t 30.2 \t \t 0.0800 \t 0.7386 \t 0.7196\n",
      "24 \t 30.2 \t \t 0.0667 \t 0.6997 \t 0.7333\n",
      "25 \t 30.2 \t \t 0.0533 \t 0.6492 \t 0.7528\n",
      "26 \t 30.2 \t \t 0.0400 \t 0.5937 \t 0.7734\n",
      "27 \t 30.2 \t \t 0.0267 \t 0.5188 \t 0.8044\n",
      "28 \t 30.2 \t \t 0.0133 \t 0.4235 \t 0.8407\n",
      "29 \t 30.2 \t \t 0.0000 \t 0.3138 \t 0.8860\n",
      "Total train time: 15.1147 minutes\n",
      "0 / 8\n",
      "1 / 8\n",
      "2 / 8\n",
      "3 / 8\n",
      "4 / 8\n",
      "5 / 8\n",
      "6 / 8\n",
      "7 / 8\n",
      "Test Loss \t Test Acc \t PGD Loss \t PGD Acc\n",
      "0.3302 \t 0.8820 \t 1.1036 \t 0.2920\n",
      "Total evaluation time: 6.1457 minutes\n",
      "2 2.5\n",
      "Files already downloaded and verified\n",
      "Files already downloaded and verified\n",
      "train_idx_check =  1249038303\n",
      "test_idx_check =  4955575\n",
      "load data ...\n",
      "Epoch \t Seconds \t LR \t \t Train Loss \t Train Acc\n",
      "0 \t 30.4 \t \t 0.0133 \t 1.9129 \t 0.2700\n",
      "1 \t 30.4 \t \t 0.0267 \t 1.4889 \t 0.4452\n",
      "2 \t 30.3 \t \t 0.0400 \t 1.2751 \t 0.5240\n",
      "3 \t 30.3 \t \t 0.0533 \t 1.1336 \t 0.5787\n",
      "4 \t 30.3 \t \t 0.0667 \t 1.0408 \t 0.6154\n",
      "5 \t 30.3 \t \t 0.0800 \t 0.9563 \t 0.6460\n",
      "6 \t 30.3 \t \t 0.0933 \t 0.8971 \t 0.6685\n",
      "7 \t 30.3 \t \t 0.1067 \t 0.8546 \t 0.6864\n",
      "8 \t 30.3 \t \t 0.1200 \t 0.8169 \t 0.6997\n",
      "9 \t 30.2 \t \t 0.1333 \t 0.7828 \t 0.7121\n",
      "10 \t 30.2 \t \t 0.1467 \t 0.7691 \t 0.7165\n",
      "11 \t 30.3 \t \t 0.1600 \t 0.7548 \t 0.7229\n",
      "12 \t 30.3 \t \t 0.1733 \t 0.7424 \t 0.7285\n",
      "13 \t 30.3 \t \t 0.1867 \t 0.7452 \t 0.7267\n",
      "14 \t 30.3 \t \t 0.2000 \t 0.7319 \t 0.7310\n",
      "15 \t 30.2 \t \t 0.1867 \t 0.7184 \t 0.7368\n",
      "16 \t 30.3 \t \t 0.1733 \t 0.6935 \t 0.7439\n",
      "17 \t 30.3 \t \t 0.1600 \t 0.6745 \t 0.7518\n",
      "18 \t 30.3 \t \t 0.1467 \t 0.6482 \t 0.7609\n",
      "19 \t 30.2 \t \t 0.1333 \t 0.6295 \t 0.7669\n",
      "20 \t 30.3 \t \t 0.1200 \t 0.6036 \t 0.7782\n",
      "21 \t 30.2 \t \t 0.1067 \t 0.5761 \t 0.7889\n",
      "22 \t 30.2 \t \t 0.0933 \t 0.5466 \t 0.7976\n",
      "23 \t 30.2 \t \t 0.0800 \t 0.5161 \t 0.8089\n",
      "24 \t 30.3 \t \t 0.0667 \t 0.4781 \t 0.8245\n",
      "25 \t 30.2 \t \t 0.0533 \t 0.4337 \t 0.8429\n",
      "26 \t 30.2 \t \t 0.0400 \t 0.3773 \t 0.8630\n",
      "27 \t 30.2 \t \t 0.0267 \t 0.3162 \t 0.8870\n",
      "28 \t 30.2 \t \t 0.0133 \t 0.2349 \t 0.9174\n",
      "29 \t 30.2 \t \t 0.0000 \t 0.1561 \t 0.9485\n",
      "Total train time: 15.1304 minutes\n",
      "0 / 8\n",
      "1 / 8\n",
      "2 / 8\n",
      "3 / 8\n",
      "4 / 8\n",
      "5 / 8\n",
      "6 / 8\n",
      "7 / 8\n",
      "Test Loss \t Test Acc \t PGD Loss \t PGD Acc\n",
      "0.2649 \t 0.9120 \t 1.5647 \t 0.1700\n",
      "Total evaluation time: 6.1527 minutes\n",
      "0 0.0\n",
      "Files already downloaded and verified\n",
      "Files already downloaded and verified\n",
      "train_idx_check =  1249038303\n",
      "test_idx_check =  4955575\n",
      "load data ...\n",
      "Epoch \t Seconds \t LR \t \t Train Loss \t Train Acc\n",
      "0 \t 30.4 \t \t 0.0133 \t 1.6064 \t 0.4080\n",
      "1 \t 30.4 \t \t 0.0267 \t 1.0104 \t 0.6379\n",
      "2 \t 30.4 \t \t 0.0400 \t 0.7633 \t 0.7320\n",
      "3 \t 30.4 \t \t 0.0533 \t 0.6339 \t 0.7797\n",
      "4 \t 30.3 \t \t 0.0667 \t 0.5647 \t 0.8064\n",
      "5 \t 30.3 \t \t 0.0800 \t 0.5065 \t 0.8245\n",
      "6 \t 30.3 \t \t 0.0933 \t 0.4603 \t 0.8416\n",
      "7 \t 30.3 \t \t 0.1067 \t 0.4325 \t 0.8507\n",
      "8 \t 30.3 \t \t 0.1200 \t 0.4119 \t 0.8578\n",
      "9 \t 30.3 \t \t 0.1333 \t 0.3939 \t 0.8655\n",
      "10 \t 30.3 \t \t 0.1467 \t 0.3953 \t 0.8651\n",
      "11 \t 30.3 \t \t 0.1600 \t 0.3911 \t 0.8644\n",
      "12 \t 30.3 \t \t 0.1733 \t 0.3878 \t 0.8679\n",
      "13 \t 30.3 \t \t 0.1867 \t 0.3848 \t 0.8695\n",
      "14 \t 30.3 \t \t 0.2000 \t 0.3845 \t 0.8689\n",
      "15 \t 30.3 \t \t 0.1867 \t 0.3807 \t 0.8687\n",
      "16 \t 30.3 \t \t 0.1733 \t 0.3614 \t 0.8769\n",
      "17 \t 30.3 \t \t 0.1600 \t 0.3486 \t 0.8820\n",
      "18 \t 30.3 \t \t 0.1467 \t 0.3272 \t 0.8881\n",
      "19 \t 30.2 \t \t 0.1333 \t 0.3117 \t 0.8942\n",
      "20 \t 30.3 \t \t 0.1200 \t 0.2981 \t 0.8976\n",
      "21 \t 30.3 \t \t 0.1067 \t 0.2863 \t 0.9018\n",
      "22 \t 30.3 \t \t 0.0933 \t 0.2620 \t 0.9112\n",
      "23 \t 30.3 \t \t 0.0800 \t 0.2396 \t 0.9180\n",
      "24 \t 30.3 \t \t 0.0667 \t 0.2139 \t 0.9272\n",
      "25 \t 30.3 \t \t 0.0533 \t 0.1853 \t 0.9371\n",
      "26 \t 30.3 \t \t 0.0400 \t 0.1550 \t 0.9474\n",
      "27 \t 30.2 \t \t 0.0267 \t 0.1160 \t 0.9618\n",
      "28 \t 30.2 \t \t 0.0133 \t 0.0720 \t 0.9767\n",
      "29 \t 30.2 \t \t 0.0000 \t 0.0394 \t 0.9881\n",
      "Total train time: 15.1489 minutes\n",
      "0 / 8\n",
      "1 / 8\n",
      "2 / 8\n",
      "3 / 8\n",
      "4 / 8\n",
      "5 / 8\n",
      "6 / 8\n",
      "7 / 8\n",
      "Test Loss \t Test Acc \t PGD Loss \t PGD Acc\n",
      "0.2051 \t 0.9440 \t 8.6513 \t 0.0000\n",
      "Total evaluation time: 0.4773 minutes\n"
     ]
    }
   ],
   "source": [
    "epsilon_lst = [8, 6, 4, 2]\n",
    "for epsilon_raw in epsilon_lst:\n",
    "    alpha = epsilon_raw * 1.25 \n",
    "    print(epsilon_raw, alpha)\n",
    "    args = get_args()\n",
    "    if not os.path.exists(args.out_dir):\n",
    "        os.mkdir(args.out_dir)\n",
    "    logfile = os.path.join(args.out_dir, 'output.log')\n",
    "    if os.path.exists(logfile):\n",
    "        os.remove(logfile)\n",
    "\n",
    "    logging.basicConfig(\n",
    "        format='[%(asctime)s] - %(message)s',\n",
    "        datefmt='%Y/%m/%d %H:%M:%S',\n",
    "        level=logging.INFO,\n",
    "        filename= os.path.join(args.out_dir, 'output.log')\n",
    "        )\n",
    "    logger.info(args)\n",
    "\n",
    "    np.random.seed(args.seed)\n",
    "    torch.manual_seed(args.seed)\n",
    "    torch.cuda.manual_seed(args.seed)\n",
    "\n",
    "\n",
    "    train_loader, test_loader = get_loaders(args.data_dir, args.batch_size)\n",
    "    print('load data ...')\n",
    "    epsilon = (epsilon_raw / 255.) / std\n",
    "    alpha = (alpha / 255.) / std\n",
    "    pgd_alpha = (2 / 255.) / std\n",
    "\n",
    "    model = PreActResNet18().cuda()\n",
    "    model.train()\n",
    "\n",
    "    opt = torch.optim.SGD(model.parameters(), lr=args.lr_max, momentum=args.momentum, weight_decay=args.weight_decay)\n",
    "    amp_args = dict(opt_level=args.opt_level, loss_scale=args.loss_scale, verbosity=False)\n",
    "    if args.opt_level == 'O2':\n",
    "        amp_args['master_weights'] = args.master_weights\n",
    "    model, opt = amp.initialize(model, opt, **amp_args)\n",
    "    criterion = nn.CrossEntropyLoss()\n",
    "\n",
    "    if args.delta_init == 'previous':\n",
    "        delta = torch.zeros(args.batch_size, 3, 32, 32).cuda()\n",
    "\n",
    "    lr_steps = args.epochs * len(train_loader)\n",
    "    if args.lr_schedule == 'cyclic':\n",
    "        scheduler = torch.optim.lr_scheduler.CyclicLR(opt, base_lr=args.lr_min, max_lr=args.lr_max,\n",
    "            step_size_up=lr_steps / 2, step_size_down=lr_steps / 2)\n",
    "    elif args.lr_schedule == 'multistep':\n",
    "        scheduler = torch.optim.lr_scheduler.MultiStepLR(opt, milestones=[lr_steps / 2, lr_steps * 3 / 4], gamma=0.1)\n",
    "\n",
    "    # Training\n",
    "    prev_robust_acc = 0.\n",
    "    start_train_time = time.time()\n",
    "    logger.info('Epoch \\t Seconds \\t LR \\t \\t Train Loss \\t Train Acc')\n",
    "    print('Epoch \\t Seconds \\t LR \\t \\t Train Loss \\t Train Acc')\n",
    "    for epoch in range(args.epochs):\n",
    "        start_epoch_time = time.time()\n",
    "        train_loss = 0\n",
    "        train_acc = 0\n",
    "        train_n = 0\n",
    "        for i, (X, y) in enumerate(train_loader):\n",
    "            X, y = X.cuda(), y.cuda()\n",
    "            # solving inner max \n",
    "            if i == 0:\n",
    "                first_batch = (X, y)\n",
    "            if args.delta_init != 'previous':\n",
    "                delta = torch.zeros_like(X).cuda()\n",
    "            if args.delta_init == 'random':\n",
    "                for j in range(len(epsilon)):\n",
    "                    delta[:, j, :, :].uniform_(-epsilon[j][0][0].item(), epsilon[j][0][0].item())\n",
    "                delta.data = clamp(delta, lower_limit - X, upper_limit - X)\n",
    "            delta.requires_grad = True\n",
    "            output = model(X + delta[:X.size(0)])\n",
    "\n",
    "            # solving outer min via SGD\n",
    "            loss = F.cross_entropy(output, y)\n",
    "            with amp.scale_loss(loss, opt) as scaled_loss:\n",
    "                scaled_loss.backward()\n",
    "            grad = delta.grad.detach()\n",
    "            delta.data = clamp(delta + alpha * torch.sign(grad), -epsilon, epsilon)\n",
    "            delta.data[:X.size(0)] = clamp(delta[:X.size(0)], lower_limit - X, upper_limit - X)\n",
    "            delta = delta.detach()\n",
    "            output = model(X + delta[:X.size(0)])\n",
    "            loss = criterion(output, y)\n",
    "            opt.zero_grad()\n",
    "            with amp.scale_loss(loss, opt) as scaled_loss:\n",
    "                scaled_loss.backward()\n",
    "            opt.step()\n",
    "            train_loss += loss.item() * y.size(0)\n",
    "            train_acc += (output.max(1)[1] == y).sum().item()\n",
    "            train_n += y.size(0)\n",
    "            scheduler.step()\n",
    "        if args.early_stop:\n",
    "            # Check current PGD robustness of model using random minibatch\n",
    "            X, y = first_batch\n",
    "            pgd_delta = attack_pgd(model, X, y, epsilon, pgd_alpha, 5, 1, opt)\n",
    "            with torch.no_grad():\n",
    "                output = model(clamp(X + pgd_delta[:X.size(0)], lower_limit, upper_limit))\n",
    "            robust_acc = (output.max(1)[1] == y).sum().item() / y.size(0)\n",
    "            if robust_acc - prev_robust_acc < -0.2:\n",
    "                break\n",
    "            prev_robust_acc = robust_acc\n",
    "            best_state_dict = copy.deepcopy(model.state_dict())\n",
    "        epoch_time = time.time()\n",
    "        lr = scheduler.get_lr()[0]\n",
    "        logger.info('%d \\t %.1f \\t \\t %.4f \\t %.4f \\t %.4f', epoch, epoch_time - start_epoch_time, lr, train_loss/train_n, train_acc/train_n)\n",
    "        print('%d \\t %.1f \\t \\t %.4f \\t %.4f \\t %.4f' % (epoch, epoch_time - start_epoch_time, lr, train_loss/train_n, train_acc/train_n))\n",
    "    train_time = time.time()\n",
    "    if not args.early_stop:\n",
    "        best_state_dict = model.state_dict()\n",
    "    torch.save(best_state_dict, os.path.join(args.out_dir, '9_25_robust_model_epsilon_' + str(epsilon_raw) + '.pth'))\n",
    "    logger.info('Total train time: %.4f minutes', (train_time - start_train_time)/60)\n",
    "    print('Total train time: %.4f minutes' % ((train_time - start_train_time)/60))\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "conda_python3",
   "language": "python",
   "name": "conda_python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.14"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
