{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "db99a9af",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/ec2-user/miniconda3/envs/baselines/lib/python3.11/site-packages/pydantic/_internal/_generate_schema.py:2249: UnsupportedFieldAttributeWarning: The 'repr' attribute with value False was provided to the `Field()` function, which has no effect in the context it was used. 'repr' is field-specific metadata, and can only be attached to a model field using `Annotated` metadata or by assignment. This may have happened because an `Annotated` type alias using the `type` statement was used, or if the `Field()` function was attached to a single member of a union type.\n",
      "  warnings.warn(\n",
      "/home/ec2-user/miniconda3/envs/baselines/lib/python3.11/site-packages/pydantic/_internal/_generate_schema.py:2249: UnsupportedFieldAttributeWarning: The 'frozen' attribute with value True was provided to the `Field()` function, which has no effect in the context it was used. 'frozen' is field-specific metadata, and can only be attached to a model field using `Annotated` metadata or by assignment. This may have happened because an `Annotated` type alias using the `type` statement was used, or if the `Field()` function was attached to a single member of a union type.\n",
      "  warnings.warn(\n"
     ]
    }
   ],
   "source": [
    "from models.models import SCBM\n",
    "from calflops import calculate_flops\n",
    "from argparse import Namespace"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "cac4475f",
   "metadata": {},
   "outputs": [],
   "source": [
    "config = Namespace()\n",
    "config_model = Namespace()\n",
    "config_model.head_arch = 'linear'\n",
    "config_model.training_mode = 'joint'\n",
    "config_model.j_epochs = 50\n",
    "config_model.concept_learning = 'hard'\n",
    "config_model.num_monte_carlo = 100\n",
    "config_model.straight_through = True\n",
    "config_model.cov_type = 'amortized'\n",
    "\n",
    "data = Namespace()\n",
    "data.num_concepts = 700\n",
    "data.num_classes = 100\n",
    "data.model_type = \"resnet50\"\n",
    "\n",
    "config.model = config_model\n",
    "config.data = data\n",
    "\n",
    "\n",
    "model = SCBM(config=config)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "7ae2e268",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "------------------------------------- Calculate Flops Results -------------------------------------\n",
      "Notations:\n",
      "number of parameters (Params), number of multiply-accumulate operations(MACs),\n",
      "number of floating-point operations (FLOPs), floating-point operations per second (FLOPS),\n",
      "fwd FLOPs (model forward propagation FLOPs), bwd FLOPs (model backward propagation FLOPs),\n",
      "default model backpropagation takes 2.00 times as much computation as forward propagation.\n",
      "\n",
      "Total Training Params:                                                  527.73 M\n",
      "fwd MACs:                                                               8.6857 GMACs\n",
      "fwd FLOPs:                                                              17.4368 GFLOPS\n",
      "fwd+bwd MACs:                                                           26.057 GMACs\n",
      "fwd+bwd FLOPs:                                                          52.3105 GFLOPS\n",
      "\n",
      "-------------------------------- Detailed Calculated FLOPs Results --------------------------------\n",
      "Each module caculated is listed after its name in the following order: \n",
      "params, percentage of total params, MACs, percentage of total MACs, FLOPS, percentage of total FLOPs\n",
      "\n",
      "Note: 1. A module can have torch.nn.module or torch.nn.functional to compute logits (e.g. CrossEntropyLoss). \n",
      " They are not counted as submodules in calflops and not to be printed out. However they make up the difference between a parent's MACs and the sum of its submodules'.\n",
      "2. Number of floating-point operations is a theoretical estimation, thus FLOPS computed using that could be larger than the maximum system throughput.\n",
      "\n",
      "SCBM(\n",
      "  527.73 M = 100% Params, 8.69 GMACs = 100% MACs, 17.44 GFLOPS = 100% FLOPs\n",
      "  (encoder_res): ResNet(\n",
      "    23.51 M = 4.4545% Params, 4.09 GMACs = 47.0561% MACs, 8.21 GFLOPS = 47.0671% FLOPs\n",
      "    (conv1): Conv2d(9.41 K = 0.0018% Params, 118.01 MMACs = 1.3587% MACs, 236.03 MFLOPS = 1.3536% FLOPs, 3, 64, kernel_size=(7, 7), stride=(2, 2), padding=(3, 3), bias=False)\n",
      "    (bn1): BatchNorm2d(128 = 0% Params, 0 MACs = 0% MACs, 1.61 MFLOPS = 0.0092% FLOPs, 64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "    (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 802.82 KFLOPS = 0.0046% FLOPs, inplace=True)\n",
      "    (maxpool): MaxPool2d(0 = 0% Params, 0 MACs = 0% MACs, 802.82 KFLOPS = 0.0046% FLOPs, kernel_size=3, stride=2, padding=1, dilation=1, ceil_mode=False)\n",
      "    (layer1): Sequential(\n",
      "      215.81 K = 0.0409% Params, 667.94 MMACs = 7.6902% MACs, 1.35 GFLOPS = 7.7327% FLOPs\n",
      "      (0): Bottleneck(\n",
      "        75.01 K = 0.0142% Params, 231.21 MMACs = 2.662% MACs, 467.64 MFLOPS = 2.6819% FLOPs\n",
      "        (conv1): Conv2d(4.1 K = 0.0008% Params, 12.85 MMACs = 0.1479% MACs, 25.69 MFLOPS = 0.1473% FLOPs, 64, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn1): BatchNorm2d(128 = 0% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv2): Conv2d(36.86 K = 0.007% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "        (bn2): BatchNorm2d(128 = 0% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv3): Conv2d(16.38 K = 0.0031% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 64, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn3): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 1.61 MFLOPS = 0.0092% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 1.2 MFLOPS = 0.0069% FLOPs, inplace=True)\n",
      "        (downsample): Sequential(\n",
      "          16.9 K = 0.0032% Params, 51.38 MMACs = 0.5916% MACs, 104.37 MFLOPS = 0.5985% FLOPs\n",
      "          (0): Conv2d(16.38 K = 0.0031% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 64, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (1): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 1.61 MFLOPS = 0.0092% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        )\n",
      "      )\n",
      "      (1): Bottleneck(\n",
      "        70.4 K = 0.0133% Params, 218.37 MMACs = 2.5141% MACs, 440.34 MFLOPS = 2.5254% FLOPs\n",
      "        (conv1): Conv2d(16.38 K = 0.0031% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 256, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn1): BatchNorm2d(128 = 0% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv2): Conv2d(36.86 K = 0.007% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "        (bn2): BatchNorm2d(128 = 0% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv3): Conv2d(16.38 K = 0.0031% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 64, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn3): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 1.61 MFLOPS = 0.0092% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 1.2 MFLOPS = 0.0069% FLOPs, inplace=True)\n",
      "      )\n",
      "      (2): Bottleneck(\n",
      "        70.4 K = 0.0133% Params, 218.37 MMACs = 2.5141% MACs, 440.34 MFLOPS = 2.5254% FLOPs\n",
      "        (conv1): Conv2d(16.38 K = 0.0031% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 256, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn1): BatchNorm2d(128 = 0% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv2): Conv2d(36.86 K = 0.007% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "        (bn2): BatchNorm2d(128 = 0% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv3): Conv2d(16.38 K = 0.0031% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 64, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn3): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 1.61 MFLOPS = 0.0092% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 1.2 MFLOPS = 0.0069% FLOPs, inplace=True)\n",
      "      )\n",
      "    )\n",
      "    (layer2): Sequential(\n",
      "      1.22 M = 0.2311% Params, 1.03 GMACs = 11.831% MACs, 2.06 GFLOPS = 11.8378% FLOPs\n",
      "      (0): Bottleneck(\n",
      "        379.39 K = 0.0719% Params, 372.51 MMACs = 4.2887% MACs, 748.53 MFLOPS = 4.2928% FLOPs\n",
      "        (conv1): Conv2d(32.77 K = 0.0062% Params, 102.76 MMACs = 1.1831% MACs, 205.52 MFLOPS = 1.1787% FLOPs, 256, 128, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn1): BatchNorm2d(256 = 0% Params, 0 MACs = 0% MACs, 802.82 KFLOPS = 0.0046% FLOPs, 128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv2): Conv2d(147.46 K = 0.0279% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 128, 128, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
      "        (bn2): BatchNorm2d(256 = 0% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv3): Conv2d(65.54 K = 0.0124% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 128, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn3): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 802.82 KFLOPS = 0.0046% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 903.17 KFLOPS = 0.0052% FLOPs, inplace=True)\n",
      "        (downsample): Sequential(\n",
      "          132.1 K = 0.025% Params, 102.76 MMACs = 1.1831% MACs, 206.32 MFLOPS = 1.1833% FLOPs\n",
      "          (0): Conv2d(131.07 K = 0.0248% Params, 102.76 MMACs = 1.1831% MACs, 205.52 MFLOPS = 1.1787% FLOPs, 256, 512, kernel_size=(1, 1), stride=(2, 2), bias=False)\n",
      "          (1): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 802.82 KFLOPS = 0.0046% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        )\n",
      "      )\n",
      "      (1): Bottleneck(\n",
      "        280.06 K = 0.0531% Params, 218.37 MMACs = 2.5141% MACs, 438.54 MFLOPS = 2.515% FLOPs\n",
      "        (conv1): Conv2d(65.54 K = 0.0124% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 512, 128, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn1): BatchNorm2d(256 = 0% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv2): Conv2d(147.46 K = 0.0279% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "        (bn2): BatchNorm2d(256 = 0% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv3): Conv2d(65.54 K = 0.0124% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 128, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn3): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 802.82 KFLOPS = 0.0046% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 602.11 KFLOPS = 0.0035% FLOPs, inplace=True)\n",
      "      )\n",
      "      (2): Bottleneck(\n",
      "        280.06 K = 0.0531% Params, 218.37 MMACs = 2.5141% MACs, 438.54 MFLOPS = 2.515% FLOPs\n",
      "        (conv1): Conv2d(65.54 K = 0.0124% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 512, 128, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn1): BatchNorm2d(256 = 0% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv2): Conv2d(147.46 K = 0.0279% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "        (bn2): BatchNorm2d(256 = 0% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv3): Conv2d(65.54 K = 0.0124% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 128, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn3): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 802.82 KFLOPS = 0.0046% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 602.11 KFLOPS = 0.0035% FLOPs, inplace=True)\n",
      "      )\n",
      "      (3): Bottleneck(\n",
      "        280.06 K = 0.0531% Params, 218.37 MMACs = 2.5141% MACs, 438.54 MFLOPS = 2.515% FLOPs\n",
      "        (conv1): Conv2d(65.54 K = 0.0124% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 512, 128, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn1): BatchNorm2d(256 = 0% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv2): Conv2d(147.46 K = 0.0279% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "        (bn2): BatchNorm2d(256 = 0% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv3): Conv2d(65.54 K = 0.0124% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 128, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn3): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 802.82 KFLOPS = 0.0046% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 602.11 KFLOPS = 0.0035% FLOPs, inplace=True)\n",
      "      )\n",
      "    )\n",
      "    (layer3): Sequential(\n",
      "      7.1 M = 1.3451% Params, 1.46 GMACs = 16.8592% MACs, 2.93 GFLOPS = 16.8319% FLOPs\n",
      "      (0): Bottleneck(\n",
      "        1.51 M = 0.2866% Params, 372.51 MMACs = 4.2887% MACs, 746.77 MFLOPS = 4.2827% FLOPs\n",
      "        (conv1): Conv2d(131.07 K = 0.0248% Params, 102.76 MMACs = 1.1831% MACs, 205.52 MFLOPS = 1.1787% FLOPs, 512, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn1): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv2): Conv2d(589.82 K = 0.1118% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 256, 256, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
      "        (bn2): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv3): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn3): BatchNorm2d(2.05 K = 0.0004% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 451.58 KFLOPS = 0.0026% FLOPs, inplace=True)\n",
      "        (downsample): Sequential(\n",
      "          526.34 K = 0.0997% Params, 102.76 MMACs = 1.1831% MACs, 205.92 MFLOPS = 1.181% FLOPs\n",
      "          (0): Conv2d(524.29 K = 0.0993% Params, 102.76 MMACs = 1.1831% MACs, 205.52 MFLOPS = 1.1787% FLOPs, 512, 1024, kernel_size=(1, 1), stride=(2, 2), bias=False)\n",
      "          (1): BatchNorm2d(2.05 K = 0.0004% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        )\n",
      "      )\n",
      "      (1): Bottleneck(\n",
      "        1.12 M = 0.2117% Params, 218.37 MMACs = 2.5141% MACs, 437.64 MFLOPS = 2.5098% FLOPs\n",
      "        (conv1): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 1024, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn1): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv2): Conv2d(589.82 K = 0.1118% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "        (bn2): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv3): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn3): BatchNorm2d(2.05 K = 0.0004% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 301.06 KFLOPS = 0.0017% FLOPs, inplace=True)\n",
      "      )\n",
      "      (2): Bottleneck(\n",
      "        1.12 M = 0.2117% Params, 218.37 MMACs = 2.5141% MACs, 437.64 MFLOPS = 2.5098% FLOPs\n",
      "        (conv1): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 1024, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn1): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv2): Conv2d(589.82 K = 0.1118% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "        (bn2): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv3): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn3): BatchNorm2d(2.05 K = 0.0004% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 301.06 KFLOPS = 0.0017% FLOPs, inplace=True)\n",
      "      )\n",
      "      (3): Bottleneck(\n",
      "        1.12 M = 0.2117% Params, 218.37 MMACs = 2.5141% MACs, 437.64 MFLOPS = 2.5098% FLOPs\n",
      "        (conv1): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 1024, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn1): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv2): Conv2d(589.82 K = 0.1118% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "        (bn2): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv3): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn3): BatchNorm2d(2.05 K = 0.0004% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 301.06 KFLOPS = 0.0017% FLOPs, inplace=True)\n",
      "      )\n",
      "      (4): Bottleneck(\n",
      "        1.12 M = 0.2117% Params, 218.37 MMACs = 2.5141% MACs, 437.64 MFLOPS = 2.5098% FLOPs\n",
      "        (conv1): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 1024, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn1): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv2): Conv2d(589.82 K = 0.1118% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "        (bn2): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv3): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn3): BatchNorm2d(2.05 K = 0.0004% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 301.06 KFLOPS = 0.0017% FLOPs, inplace=True)\n",
      "      )\n",
      "      (5): Bottleneck(\n",
      "        1.12 M = 0.2117% Params, 218.37 MMACs = 2.5141% MACs, 437.64 MFLOPS = 2.5098% FLOPs\n",
      "        (conv1): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 1024, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn1): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv2): Conv2d(589.82 K = 0.1118% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "        (bn2): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv3): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn3): BatchNorm2d(2.05 K = 0.0004% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 301.06 KFLOPS = 0.0017% FLOPs, inplace=True)\n",
      "      )\n",
      "    )\n",
      "    (layer4): Sequential(\n",
      "      14.96 M = 2.8357% Params, 809.24 MMACs = 9.3169% MACs, 1.62 GFLOPS = 9.2922% FLOPs\n",
      "      (0): Bottleneck(\n",
      "        6.04 M = 1.1444% Params, 372.51 MMACs = 4.2887% MACs, 745.89 MFLOPS = 4.2777% FLOPs\n",
      "        (conv1): Conv2d(524.29 K = 0.0993% Params, 102.76 MMACs = 1.1831% MACs, 205.52 MFLOPS = 1.1787% FLOPs, 1024, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn1): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv2): Conv2d(2.36 M = 0.4471% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 512, 512, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
      "        (bn2): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 50.18 KFLOPS = 0.0003% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv3): Conv2d(1.05 M = 0.1987% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 512, 2048, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn3): BatchNorm2d(4.1 K = 0.0008% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 2048, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 225.79 KFLOPS = 0.0013% FLOPs, inplace=True)\n",
      "        (downsample): Sequential(\n",
      "          2.1 M = 0.3982% Params, 102.76 MMACs = 1.1831% MACs, 205.72 MFLOPS = 1.1798% FLOPs\n",
      "          (0): Conv2d(2.1 M = 0.3974% Params, 102.76 MMACs = 1.1831% MACs, 205.52 MFLOPS = 1.1787% FLOPs, 1024, 2048, kernel_size=(1, 1), stride=(2, 2), bias=False)\n",
      "          (1): BatchNorm2d(4.1 K = 0.0008% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 2048, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        )\n",
      "      )\n",
      "      (1): Bottleneck(\n",
      "        4.46 M = 0.8456% Params, 218.37 MMACs = 2.5141% MACs, 437.18 MFLOPS = 2.5072% FLOPs\n",
      "        (conv1): Conv2d(1.05 M = 0.1987% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 2048, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn1): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 50.18 KFLOPS = 0.0003% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv2): Conv2d(2.36 M = 0.4471% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "        (bn2): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 50.18 KFLOPS = 0.0003% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv3): Conv2d(1.05 M = 0.1987% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 512, 2048, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn3): BatchNorm2d(4.1 K = 0.0008% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 2048, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 150.53 KFLOPS = 0.0009% FLOPs, inplace=True)\n",
      "      )\n",
      "      (2): Bottleneck(\n",
      "        4.46 M = 0.8456% Params, 218.37 MMACs = 2.5141% MACs, 437.18 MFLOPS = 2.5072% FLOPs\n",
      "        (conv1): Conv2d(1.05 M = 0.1987% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 2048, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn1): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 50.18 KFLOPS = 0.0003% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv2): Conv2d(2.36 M = 0.4471% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "        (bn2): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 50.18 KFLOPS = 0.0003% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (conv3): Conv2d(1.05 M = 0.1987% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 512, 2048, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "        (bn3): BatchNorm2d(4.1 K = 0.0008% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 2048, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "        (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 150.53 KFLOPS = 0.0009% FLOPs, inplace=True)\n",
      "      )\n",
      "    )\n",
      "    (avgpool): AdaptiveAvgPool2d(0 = 0% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, output_size=(1, 1))\n",
      "    (fc): Identity(0 = 0% Params, 0 MACs = 0% MACs, 0 FLOPS = 0% FLOPs)\n",
      "  )\n",
      "  (encoder): Sequential(\n",
      "    23.51 M = 4.4545% Params, 4.09 GMACs = 47.0561% MACs, 8.21 GFLOPS = 47.0671% FLOPs\n",
      "    (0): ResNet(\n",
      "      23.51 M = 4.4545% Params, 4.09 GMACs = 47.0561% MACs, 8.21 GFLOPS = 47.0671% FLOPs\n",
      "      (conv1): Conv2d(9.41 K = 0.0018% Params, 118.01 MMACs = 1.3587% MACs, 236.03 MFLOPS = 1.3536% FLOPs, 3, 64, kernel_size=(7, 7), stride=(2, 2), padding=(3, 3), bias=False)\n",
      "      (bn1): BatchNorm2d(128 = 0% Params, 0 MACs = 0% MACs, 1.61 MFLOPS = 0.0092% FLOPs, 64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "      (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 802.82 KFLOPS = 0.0046% FLOPs, inplace=True)\n",
      "      (maxpool): MaxPool2d(0 = 0% Params, 0 MACs = 0% MACs, 802.82 KFLOPS = 0.0046% FLOPs, kernel_size=3, stride=2, padding=1, dilation=1, ceil_mode=False)\n",
      "      (layer1): Sequential(\n",
      "        215.81 K = 0.0409% Params, 667.94 MMACs = 7.6902% MACs, 1.35 GFLOPS = 7.7327% FLOPs\n",
      "        (0): Bottleneck(\n",
      "          75.01 K = 0.0142% Params, 231.21 MMACs = 2.662% MACs, 467.64 MFLOPS = 2.6819% FLOPs\n",
      "          (conv1): Conv2d(4.1 K = 0.0008% Params, 12.85 MMACs = 0.1479% MACs, 25.69 MFLOPS = 0.1473% FLOPs, 64, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn1): BatchNorm2d(128 = 0% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv2): Conv2d(36.86 K = 0.007% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "          (bn2): BatchNorm2d(128 = 0% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv3): Conv2d(16.38 K = 0.0031% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 64, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn3): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 1.61 MFLOPS = 0.0092% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 1.2 MFLOPS = 0.0069% FLOPs, inplace=True)\n",
      "          (downsample): Sequential(\n",
      "            16.9 K = 0.0032% Params, 51.38 MMACs = 0.5916% MACs, 104.37 MFLOPS = 0.5985% FLOPs\n",
      "            (0): Conv2d(16.38 K = 0.0031% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 64, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "            (1): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 1.61 MFLOPS = 0.0092% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          )\n",
      "        )\n",
      "        (1): Bottleneck(\n",
      "          70.4 K = 0.0133% Params, 218.37 MMACs = 2.5141% MACs, 440.34 MFLOPS = 2.5254% FLOPs\n",
      "          (conv1): Conv2d(16.38 K = 0.0031% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 256, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn1): BatchNorm2d(128 = 0% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv2): Conv2d(36.86 K = 0.007% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "          (bn2): BatchNorm2d(128 = 0% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv3): Conv2d(16.38 K = 0.0031% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 64, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn3): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 1.61 MFLOPS = 0.0092% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 1.2 MFLOPS = 0.0069% FLOPs, inplace=True)\n",
      "        )\n",
      "        (2): Bottleneck(\n",
      "          70.4 K = 0.0133% Params, 218.37 MMACs = 2.5141% MACs, 440.34 MFLOPS = 2.5254% FLOPs\n",
      "          (conv1): Conv2d(16.38 K = 0.0031% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 256, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn1): BatchNorm2d(128 = 0% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv2): Conv2d(36.86 K = 0.007% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "          (bn2): BatchNorm2d(128 = 0% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv3): Conv2d(16.38 K = 0.0031% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 64, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn3): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 1.61 MFLOPS = 0.0092% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 1.2 MFLOPS = 0.0069% FLOPs, inplace=True)\n",
      "        )\n",
      "      )\n",
      "      (layer2): Sequential(\n",
      "        1.22 M = 0.2311% Params, 1.03 GMACs = 11.831% MACs, 2.06 GFLOPS = 11.8378% FLOPs\n",
      "        (0): Bottleneck(\n",
      "          379.39 K = 0.0719% Params, 372.51 MMACs = 4.2887% MACs, 748.53 MFLOPS = 4.2928% FLOPs\n",
      "          (conv1): Conv2d(32.77 K = 0.0062% Params, 102.76 MMACs = 1.1831% MACs, 205.52 MFLOPS = 1.1787% FLOPs, 256, 128, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn1): BatchNorm2d(256 = 0% Params, 0 MACs = 0% MACs, 802.82 KFLOPS = 0.0046% FLOPs, 128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv2): Conv2d(147.46 K = 0.0279% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 128, 128, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
      "          (bn2): BatchNorm2d(256 = 0% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv3): Conv2d(65.54 K = 0.0124% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 128, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn3): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 802.82 KFLOPS = 0.0046% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 903.17 KFLOPS = 0.0052% FLOPs, inplace=True)\n",
      "          (downsample): Sequential(\n",
      "            132.1 K = 0.025% Params, 102.76 MMACs = 1.1831% MACs, 206.32 MFLOPS = 1.1833% FLOPs\n",
      "            (0): Conv2d(131.07 K = 0.0248% Params, 102.76 MMACs = 1.1831% MACs, 205.52 MFLOPS = 1.1787% FLOPs, 256, 512, kernel_size=(1, 1), stride=(2, 2), bias=False)\n",
      "            (1): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 802.82 KFLOPS = 0.0046% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          )\n",
      "        )\n",
      "        (1): Bottleneck(\n",
      "          280.06 K = 0.0531% Params, 218.37 MMACs = 2.5141% MACs, 438.54 MFLOPS = 2.515% FLOPs\n",
      "          (conv1): Conv2d(65.54 K = 0.0124% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 512, 128, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn1): BatchNorm2d(256 = 0% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv2): Conv2d(147.46 K = 0.0279% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "          (bn2): BatchNorm2d(256 = 0% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv3): Conv2d(65.54 K = 0.0124% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 128, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn3): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 802.82 KFLOPS = 0.0046% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 602.11 KFLOPS = 0.0035% FLOPs, inplace=True)\n",
      "        )\n",
      "        (2): Bottleneck(\n",
      "          280.06 K = 0.0531% Params, 218.37 MMACs = 2.5141% MACs, 438.54 MFLOPS = 2.515% FLOPs\n",
      "          (conv1): Conv2d(65.54 K = 0.0124% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 512, 128, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn1): BatchNorm2d(256 = 0% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv2): Conv2d(147.46 K = 0.0279% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "          (bn2): BatchNorm2d(256 = 0% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv3): Conv2d(65.54 K = 0.0124% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 128, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn3): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 802.82 KFLOPS = 0.0046% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 602.11 KFLOPS = 0.0035% FLOPs, inplace=True)\n",
      "        )\n",
      "        (3): Bottleneck(\n",
      "          280.06 K = 0.0531% Params, 218.37 MMACs = 2.5141% MACs, 438.54 MFLOPS = 2.515% FLOPs\n",
      "          (conv1): Conv2d(65.54 K = 0.0124% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 512, 128, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn1): BatchNorm2d(256 = 0% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv2): Conv2d(147.46 K = 0.0279% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "          (bn2): BatchNorm2d(256 = 0% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv3): Conv2d(65.54 K = 0.0124% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 128, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn3): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 802.82 KFLOPS = 0.0046% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 602.11 KFLOPS = 0.0035% FLOPs, inplace=True)\n",
      "        )\n",
      "      )\n",
      "      (layer3): Sequential(\n",
      "        7.1 M = 1.3451% Params, 1.46 GMACs = 16.8592% MACs, 2.93 GFLOPS = 16.8319% FLOPs\n",
      "        (0): Bottleneck(\n",
      "          1.51 M = 0.2866% Params, 372.51 MMACs = 4.2887% MACs, 746.77 MFLOPS = 4.2827% FLOPs\n",
      "          (conv1): Conv2d(131.07 K = 0.0248% Params, 102.76 MMACs = 1.1831% MACs, 205.52 MFLOPS = 1.1787% FLOPs, 512, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn1): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv2): Conv2d(589.82 K = 0.1118% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 256, 256, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
      "          (bn2): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv3): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn3): BatchNorm2d(2.05 K = 0.0004% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 451.58 KFLOPS = 0.0026% FLOPs, inplace=True)\n",
      "          (downsample): Sequential(\n",
      "            526.34 K = 0.0997% Params, 102.76 MMACs = 1.1831% MACs, 205.92 MFLOPS = 1.181% FLOPs\n",
      "            (0): Conv2d(524.29 K = 0.0993% Params, 102.76 MMACs = 1.1831% MACs, 205.52 MFLOPS = 1.1787% FLOPs, 512, 1024, kernel_size=(1, 1), stride=(2, 2), bias=False)\n",
      "            (1): BatchNorm2d(2.05 K = 0.0004% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          )\n",
      "        )\n",
      "        (1): Bottleneck(\n",
      "          1.12 M = 0.2117% Params, 218.37 MMACs = 2.5141% MACs, 437.64 MFLOPS = 2.5098% FLOPs\n",
      "          (conv1): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 1024, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn1): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv2): Conv2d(589.82 K = 0.1118% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "          (bn2): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv3): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn3): BatchNorm2d(2.05 K = 0.0004% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 301.06 KFLOPS = 0.0017% FLOPs, inplace=True)\n",
      "        )\n",
      "        (2): Bottleneck(\n",
      "          1.12 M = 0.2117% Params, 218.37 MMACs = 2.5141% MACs, 437.64 MFLOPS = 2.5098% FLOPs\n",
      "          (conv1): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 1024, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn1): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv2): Conv2d(589.82 K = 0.1118% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "          (bn2): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv3): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn3): BatchNorm2d(2.05 K = 0.0004% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 301.06 KFLOPS = 0.0017% FLOPs, inplace=True)\n",
      "        )\n",
      "        (3): Bottleneck(\n",
      "          1.12 M = 0.2117% Params, 218.37 MMACs = 2.5141% MACs, 437.64 MFLOPS = 2.5098% FLOPs\n",
      "          (conv1): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 1024, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn1): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv2): Conv2d(589.82 K = 0.1118% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "          (bn2): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv3): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn3): BatchNorm2d(2.05 K = 0.0004% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 301.06 KFLOPS = 0.0017% FLOPs, inplace=True)\n",
      "        )\n",
      "        (4): Bottleneck(\n",
      "          1.12 M = 0.2117% Params, 218.37 MMACs = 2.5141% MACs, 437.64 MFLOPS = 2.5098% FLOPs\n",
      "          (conv1): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 1024, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn1): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv2): Conv2d(589.82 K = 0.1118% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "          (bn2): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv3): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn3): BatchNorm2d(2.05 K = 0.0004% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 301.06 KFLOPS = 0.0017% FLOPs, inplace=True)\n",
      "        )\n",
      "        (5): Bottleneck(\n",
      "          1.12 M = 0.2117% Params, 218.37 MMACs = 2.5141% MACs, 437.64 MFLOPS = 2.5098% FLOPs\n",
      "          (conv1): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 1024, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn1): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv2): Conv2d(589.82 K = 0.1118% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "          (bn2): BatchNorm2d(512 = 0.0001% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, 256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv3): Conv2d(262.14 K = 0.0497% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 256, 1024, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn3): BatchNorm2d(2.05 K = 0.0004% Params, 0 MACs = 0% MACs, 401.41 KFLOPS = 0.0023% FLOPs, 1024, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 301.06 KFLOPS = 0.0017% FLOPs, inplace=True)\n",
      "        )\n",
      "      )\n",
      "      (layer4): Sequential(\n",
      "        14.96 M = 2.8357% Params, 809.24 MMACs = 9.3169% MACs, 1.62 GFLOPS = 9.2922% FLOPs\n",
      "        (0): Bottleneck(\n",
      "          6.04 M = 1.1444% Params, 372.51 MMACs = 4.2887% MACs, 745.89 MFLOPS = 4.2777% FLOPs\n",
      "          (conv1): Conv2d(524.29 K = 0.0993% Params, 102.76 MMACs = 1.1831% MACs, 205.52 MFLOPS = 1.1787% FLOPs, 1024, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn1): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv2): Conv2d(2.36 M = 0.4471% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 512, 512, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
      "          (bn2): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 50.18 KFLOPS = 0.0003% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv3): Conv2d(1.05 M = 0.1987% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 512, 2048, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn3): BatchNorm2d(4.1 K = 0.0008% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 2048, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 225.79 KFLOPS = 0.0013% FLOPs, inplace=True)\n",
      "          (downsample): Sequential(\n",
      "            2.1 M = 0.3982% Params, 102.76 MMACs = 1.1831% MACs, 205.72 MFLOPS = 1.1798% FLOPs\n",
      "            (0): Conv2d(2.1 M = 0.3974% Params, 102.76 MMACs = 1.1831% MACs, 205.52 MFLOPS = 1.1787% FLOPs, 1024, 2048, kernel_size=(1, 1), stride=(2, 2), bias=False)\n",
      "            (1): BatchNorm2d(4.1 K = 0.0008% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 2048, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          )\n",
      "        )\n",
      "        (1): Bottleneck(\n",
      "          4.46 M = 0.8456% Params, 218.37 MMACs = 2.5141% MACs, 437.18 MFLOPS = 2.5072% FLOPs\n",
      "          (conv1): Conv2d(1.05 M = 0.1987% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 2048, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn1): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 50.18 KFLOPS = 0.0003% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv2): Conv2d(2.36 M = 0.4471% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "          (bn2): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 50.18 KFLOPS = 0.0003% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv3): Conv2d(1.05 M = 0.1987% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 512, 2048, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn3): BatchNorm2d(4.1 K = 0.0008% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 2048, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 150.53 KFLOPS = 0.0009% FLOPs, inplace=True)\n",
      "        )\n",
      "        (2): Bottleneck(\n",
      "          4.46 M = 0.8456% Params, 218.37 MMACs = 2.5141% MACs, 437.18 MFLOPS = 2.5072% FLOPs\n",
      "          (conv1): Conv2d(1.05 M = 0.1987% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 2048, 512, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn1): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 50.18 KFLOPS = 0.0003% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv2): Conv2d(2.36 M = 0.4471% Params, 115.61 MMACs = 1.331% MACs, 231.21 MFLOPS = 1.326% FLOPs, 512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
      "          (bn2): BatchNorm2d(1.02 K = 0.0002% Params, 0 MACs = 0% MACs, 50.18 KFLOPS = 0.0003% FLOPs, 512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (conv3): Conv2d(1.05 M = 0.1987% Params, 51.38 MMACs = 0.5916% MACs, 102.76 MFLOPS = 0.5893% FLOPs, 512, 2048, kernel_size=(1, 1), stride=(1, 1), bias=False)\n",
      "          (bn3): BatchNorm2d(4.1 K = 0.0008% Params, 0 MACs = 0% MACs, 200.7 KFLOPS = 0.0012% FLOPs, 2048, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
      "          (relu): ReLU(0 = 0% Params, 0 MACs = 0% MACs, 150.53 KFLOPS = 0.0009% FLOPs, inplace=True)\n",
      "        )\n",
      "      )\n",
      "      (avgpool): AdaptiveAvgPool2d(0 = 0% Params, 0 MACs = 0% MACs, 100.35 KFLOPS = 0.0006% FLOPs, output_size=(1, 1))\n",
      "      (fc): Identity(0 = 0% Params, 0 MACs = 0% MACs, 0 FLOPS = 0% FLOPs)\n",
      "    )\n",
      "  )\n",
      "  (mu_concepts): Linear(1.43 M = 0.2718% Params, 1.43 MMACs = 0.0165% MACs, 2.87 MFLOPS = 0.0164% FLOPs, in_features=2048, out_features=700, bias=True)\n",
      "  (sigma_concepts): Linear(502.72 M = 95.2604% Params, 502.48 MMACs = 5.7851% MACs, 1 GFLOPS = 5.7634% FLOPs, in_features=2048, out_features=245350, bias=True)\n",
      "  (act_c): Sigmoid(0 = 0% Params, 0 MACs = 0% MACs, 0 FLOPS = 0% FLOPs)\n",
      "  (head): Sequential(\n",
      "    70.1 K = 0.0133% Params, 7 MMACs = 0.0806% MACs, 14 MFLOPS = 0.0803% FLOPs\n",
      "    (0): Linear(70.1 K = 0.0133% Params, 7 MMACs = 0.0806% MACs, 14 MFLOPS = 0.0803% FLOPs, in_features=700, out_features=100, bias=True)\n",
      "  )\n",
      ")\n",
      "---------------------------------------------------------------------------------------------------\n",
      "FoCA-CBM FLOPs:17.4368 GFLOPS   MACs:8.6857 GMACs   Params:527.735 M \n",
      "\n"
     ]
    }
   ],
   "source": [
    "batch_size = 1\n",
    "input_shape = (batch_size, 3, 224, 224)\n",
    "flops, macs, params = calculate_flops(model=model, \n",
    "                                      input_shape=input_shape,\n",
    "                                      output_as_string=True,\n",
    "                                      output_precision=4)\n",
    "\n",
    "print(\"FoCA-CBM FLOPs:%s   MACs:%s   Params:%s \\n\" %(flops, macs, params))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8197a636",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "baselines",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.14"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
