{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Compressing a VGG-16 trained on CIFAR-10\n",
    "\n",
    "#### To replicate results with pretrained models please download the following models from CUP repository\n",
    "\n",
    "1. vgg16_cifar10.pth\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The autoreload extension is already loaded. To reload it, use:\n",
      "  %reload_ext autoreload\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<Figure size 640x480 with 0 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "import sys; sys.argv=['']; del sys\n",
    "%load_ext autoreload\n",
    "%autoreload 2\n",
    "import matplotlib.pyplot as plt\n",
    "%matplotlib inline\n",
    "plt.tight_layout()\n",
    "\n",
    "import argparse\n",
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n",
    "import torch.optim as optim\n",
    "from torchvision import datasets, transforms\n",
    "from tensorboardX import SummaryWriter\n",
    "\n",
    "import numpy as np\n",
    "import random\n",
    "import os\n",
    "import time\n",
    "import copy\n",
    "\n",
    "os.environ[\"CUDA_VISIBLE_DEVICES\"] = '0'\n",
    "\n",
    "from src.utils import plot_tsne,fancy_dendrogram,save_obj,load_obj\n",
    "from src.model import VGG,load_model\n",
    "from src.prune_model import prune_model\n",
    "from src.cluster_model import cluster_model, fuse_model\n",
    "from src.train_test import train,test,adjust_learning_rate_nips,adjust_learning_rate_iccv"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "True\n"
     ]
    }
   ],
   "source": [
    "print(torch.cuda.is_available())"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Train baseline VGG-16 model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Files already downloaded and verified\n"
     ]
    }
   ],
   "source": [
    "parser = argparse.ArgumentParser(description='PyTorch MNIST Example')\n",
    "parser.add_argument('--batch-size', type=int, default=64, metavar='N',\n",
    "                    help='input batch size for training (default: 128)')\n",
    "parser.add_argument('-j', '--workers', default=4, type=int, metavar='N',\n",
    "                    help='number of data loading workers (default: 4)')\n",
    "parser.add_argument('--epochs', default=160, type=int, metavar='N',\n",
    "                    help='number of total epochs to run')\n",
    "parser.add_argument('--lr', '--learning-rate', default=0.1, type=float,\n",
    "                    metavar='LR', help='initial learning rate')\n",
    "parser.add_argument('--momentum', default=0.9, type=float, metavar='M',\n",
    "                    help='momentum')\n",
    "parser.add_argument('--weight-decay', '--wd', default=1e-4, type=float,\n",
    "                    metavar='W', help='weight decay (default: 1e-4)')\n",
    "parser.add_argument('--no-cuda', action='store_true', default=False,\n",
    "                    help='disables CUDA training')\n",
    "parser.add_argument('--seed', type=int, default=12346, metavar='S',\n",
    "                    help='random seed (default: 12346)')\n",
    "parser.add_argument('--num_output', type=int, default=10, metavar='S',\n",
    "                    help='number of classes(default: 10)')\n",
    "parser.add_argument('--log-interval', type=int, default=100, metavar='N',\n",
    "                    help='how many batches to wait before logging training status')\n",
    "parser.add_argument('--checkpoint_path', type=str, default='./checkpoints/vgg16_cifar10.pth', metavar='S',\n",
    "                    help='path to store model training checkpoints')\n",
    "parser.add_argument('--gpu', type=int, default=[5], nargs='+', help='used gpu')\n",
    "\n",
    "args = parser.parse_args()\n",
    "\n",
    "\n",
    "#set device to CPU or GPU\n",
    "args = parser.parse_args()\n",
    "\n",
    "use_cuda = not args.no_cuda and torch.cuda.is_available()\n",
    "device = torch.device(\"cuda\" if use_cuda else \"cpu\")\n",
    "\n",
    "writer = SummaryWriter('logs/vgg_16_cifar10/base_iccv_param/')\n",
    "\n",
    "#set all seeds for reproducability\n",
    "def set_random_seed(seed):    \n",
    "    random.seed(seed)\n",
    "    torch.manual_seed(seed)\n",
    "    torch.cuda.manual_seed_all(seed)\n",
    "    np.random.seed(args.seed)\n",
    "    os.environ['PYTHONHASHSEED'] = str(seed)\n",
    "    torch.backends.cudnn.deterministic = True\n",
    "\n",
    "set_random_seed(args.seed)\n",
    "\n",
    "\n",
    "kwargs = {'num_workers': 1, 'pin_memory': True} if use_cuda else {}\n",
    "\n",
    "normalize = transforms.Normalize(mean=[0.485, 0.456, 0.406],\n",
    "                                     std=[0.229, 0.224, 0.225])\n",
    "\n",
    "train_loader = torch.utils.data.DataLoader(\n",
    "        datasets.CIFAR10(root='data/', train=True, transform=transforms.Compose([\n",
    "            transforms.RandomHorizontalFlip(),\n",
    "            transforms.RandomCrop(32, 4),\n",
    "            transforms.ToTensor(),\n",
    "            normalize,\n",
    "        ]), download=True),\n",
    "        batch_size=args.batch_size, shuffle=True,\n",
    "        num_workers=args.workers, pin_memory=True)\n",
    "\n",
    "val_loader = torch.utils.data.DataLoader(\n",
    "        datasets.CIFAR10(root='data/', train=False, transform=transforms.Compose([\n",
    "            transforms.ToTensor(),\n",
    "            normalize,\n",
    "        ])),\n",
    "        batch_size=args.batch_size, shuffle=False,\n",
    "        num_workers=args.workers, pin_memory=True)\n",
    "\n",
    "vgg16_bn = VGG('VGG16',num_output=args.num_output)\n",
    "vgg16_bn = vgg16_bn.to(device)\n",
    "        \n",
    "optimizer = optim.SGD(vgg16_bn.parameters(),lr=args.lr,momentum=args.momentum,weight_decay=args.weight_decay,nesterov=False)\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "loading state from epoch 152 and test loss 0.3201139727592468\n",
      "original model accuracy is 93.64\n"
     ]
    }
   ],
   "source": [
    "test_loss = 0\n",
    "best_val_acc = 0\n",
    "\n",
    "if not os.path.isfile(args.checkpoint_path):\n",
    "    for epoch in range(1, args.epochs + 1):\n",
    "        start = time.time()\n",
    "        args.lr = adjust_learning_rate_iccv(args,optimizer,epoch)\n",
    "        train_loss,train_acc = train(args,vgg16_bn,device,train_loader,optimizer,epoch)\n",
    "        val_loss,val_acc = test(args,vgg16_bn,device,val_loader)\n",
    "\n",
    "        writer.add_scalars('base_model/loss',{'train_loss': train_loss,\n",
    "                                        'val_loss' : val_loss}, epoch)\n",
    "        writer.add_scalars('base_model/accuracy',{'train_acc': train_acc,\n",
    "                                            'val_acc' : val_acc}, epoch)    \n",
    "\n",
    "        print('Time taken for epoch : {}\\n'.format(time.time()-start))\n",
    "\n",
    "        if val_acc > best_val_acc: \n",
    "            best_val_acc = val_acc\n",
    "\n",
    "            torch.save({\n",
    "                        'epoch': epoch,\n",
    "                        'model_state_dict': vgg16_bn.state_dict(),\n",
    "                        'optimizer_state_dict': optimizer.state_dict(),\n",
    "                        'loss': val_loss,\n",
    "                        }, args.checkpoint_path, pickle_protocol=4)\n",
    "else:\n",
    "    vgg16_bn,optimizer = load_model('vgg16_bn','sgd',args)\n",
    "    orig_loss, orig_acc = test(args, vgg16_bn, device, val_loader,verbose=False)\n",
    "    best_val_acc = orig_acc\n",
    "    \n",
    "print('original model accuracy is {}'.format(best_val_acc))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "\n",
    "\n",
    "### Compress using CUP (T = 0.15), no retrain"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Load pre-trained model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "loading state from epoch 152 and test loss 0.3201139727592468\n",
      "\n",
      "Test set: Average loss: 0.3201, Accuracy: 9364/10000 (94%)\n",
      "\n"
     ]
    }
   ],
   "source": [
    "set_random_seed(args.seed)\n",
    "vgg16_bn,optimizer = load_model('vgg16_bn','sgd',args)\n",
    "orig_loss, orig_acc = test(args, vgg16_bn, device, val_loader)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Prune using T=0.15"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['cnn_layers', '0']\n",
      "['cnn_layers', '3']\n",
      "['cnn_layers', '7']\n",
      "['cnn_layers', '10']\n",
      "['cnn_layers', '14']\n",
      "['cnn_layers', '17']\n",
      "['cnn_layers', '20']\n",
      "['cnn_layers', '24']\n",
      "['cnn_layers', '27']\n",
      "['cnn_layers', '30']\n",
      "['cnn_layers', '34']\n",
      "['cnn_layers', '37']\n",
      "\n",
      "Test set: Average loss: 0.2885, Accuracy: 9241/10000 (92%)\n",
      "\n",
      "Original accuracy 93.64, compressed model accuracy 92.41, accuracy drop 1.230000000000004\n"
     ]
    }
   ],
   "source": [
    "cluster_args = {\n",
    "    'cluster_layers' : {0:0,3:0,7:0,10:0,14:0,17:0,20:0,24:0,27:0,30:0,34:0,37:0,40:0},\n",
    "    'conv_feature_size' : 1,\n",
    "    'reshape_exists' : True,\n",
    "    'features' : 'both',\n",
    "    'channel_reduction' : 'fro',\n",
    "    'use_bias' : False,\n",
    "    'linkage_method' : 'ward',\n",
    "    'distance_metric' : 'euclidean',\n",
    "    'cluster_criterion' : 'hierarchical',\n",
    "    'distance_threshold' : 0.15,\n",
    "    'merge_criterion' : 'max_l2_norm',   \n",
    "    'tropnnc_features_and_threshold' : False, \n",
    "    'variant' : False,\n",
    "    'verbose' : False\n",
    "}\n",
    "\n",
    "model_modifier = cluster_model(vgg16_bn,cluster_args)\n",
    "vgg16_bn_clustered = model_modifier.cluster_model()#[int(nodes*drop_percentage) for nodes in [500,300]])\n",
    "vgg16_bn_clustered.cuda()\n",
    "\n",
    "val_loss_no_retrain, val_accuracy_no_retrain = test(args, vgg16_bn_clustered, device, val_loader)\n",
    "\n",
    "print('Original accuracy {}, compressed model accuracy {}, accuracy drop {}'.format(orig_acc,val_accuracy_no_retrain,orig_acc-val_accuracy_no_retrain))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### calculate #params and #flops"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "--- stats for original model ---\n",
      "  + Number of params: 14.73M\n",
      "  + Number of FLOPs: 0.63G\n",
      "--- stats for compressed model ---\n",
      "  + Number of params: 6.24M\n",
      "  + Number of FLOPs: 0.46G\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "458313962.0"
      ]
     },
     "execution_count": 32,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from src.compute_flops import print_model_param_nums,print_model_param_flops\n",
    "\n",
    "print('--- stats for original model ---')\n",
    "print_model_param_nums(vgg16_bn)\n",
    "print_model_param_flops(vgg16_bn.cpu(),input_res=32)\n",
    "\n",
    "print('--- stats for compressed model ---')\n",
    "print_model_param_nums(vgg16_bn_clustered)\n",
    "print_model_param_flops(vgg16_bn_clustered.cpu(),input_res=32)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Compress using CUP (T = 0.2), no retrain"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Load pre-trained model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "loading state from epoch 152 and test loss 0.3201139727592468\n",
      "\n",
      "Test set: Average loss: 0.3201, Accuracy: 9364/10000 (94%)\n",
      "\n"
     ]
    }
   ],
   "source": [
    "set_random_seed(args.seed)\n",
    "vgg16_bn,optimizer = load_model('vgg16_bn','sgd',args)\n",
    "orig_loss, orig_acc = test(args, vgg16_bn, device, val_loader)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Prune using T=0.2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['cnn_layers', '0']\n",
      "['cnn_layers', '3']\n",
      "['cnn_layers', '7']\n",
      "['cnn_layers', '10']\n",
      "['cnn_layers', '14']\n",
      "['cnn_layers', '17']\n",
      "['cnn_layers', '20']\n",
      "['cnn_layers', '24']\n",
      "['cnn_layers', '27']\n",
      "['cnn_layers', '30']\n",
      "['cnn_layers', '34']\n",
      "['cnn_layers', '37']\n",
      "\n",
      "Test set: Average loss: 0.9766, Accuracy: 6791/10000 (68%)\n",
      "\n",
      "Original accuracy 93.64, compressed model accuracy 67.91, accuracy drop 25.730000000000004\n"
     ]
    }
   ],
   "source": [
    "cluster_args = {\n",
    "    'cluster_layers' : {0:0,3:0,7:0,10:0,14:0,17:0,20:0,24:0,27:0,30:0,34:0,37:0,40:0},\n",
    "    'conv_feature_size' : 1,\n",
    "    'reshape_exists' : True,\n",
    "    'features' : 'both',\n",
    "    'channel_reduction' : 'fro',\n",
    "    'use_bias' : False,\n",
    "    'linkage_method' : 'ward',\n",
    "    'distance_metric' : 'euclidean',\n",
    "    'cluster_criterion' : 'hierarchical',\n",
    "    'distance_threshold' : 0.2,\n",
    "    'merge_criterion' : 'max_l2_norm',   \n",
    "    'tropnnc_features_and_threshold' : False, \n",
    "    'variant' : False,\n",
    "    'verbose' : False\n",
    "}\n",
    "\n",
    "model_modifier = cluster_model(vgg16_bn,cluster_args)\n",
    "vgg16_bn_clustered = model_modifier.cluster_model()#[int(nodes*drop_percentage) for nodes in [500,300]])\n",
    "vgg16_bn_clustered.cuda()\n",
    "\n",
    "val_loss_no_retrain, val_accuracy_no_retrain = test(args, vgg16_bn_clustered, device, val_loader)\n",
    "\n",
    "print('Original accuracy {}, compressed model accuracy {}, accuracy drop {}'.format(orig_acc,val_accuracy_no_retrain,orig_acc-val_accuracy_no_retrain))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### calculate #params and #flops"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "--- stats for original model ---\n",
      "  + Number of params: 14.73M\n",
      "  + Number of FLOPs: 0.63G\n",
      "--- stats for compressed model ---\n",
      "  + Number of params: 4.62M\n",
      "  + Number of FLOPs: 0.42G\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "419362650.0"
      ]
     },
     "execution_count": 35,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from src.compute_flops import print_model_param_nums,print_model_param_flops\n",
    "\n",
    "print('--- stats for original model ---')\n",
    "print_model_param_nums(vgg16_bn)\n",
    "print_model_param_flops(vgg16_bn.cpu(),input_res=32)\n",
    "\n",
    "print('--- stats for compressed model ---')\n",
    "print_model_param_nums(vgg16_bn_clustered)\n",
    "print_model_param_flops(vgg16_bn_clustered.cpu(),input_res=32)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Compress using CUP (T = 0.25), no retrain"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Load pre-trained model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "loading state from epoch 152 and test loss 0.3201139727592468\n",
      "\n",
      "Test set: Average loss: 0.3201, Accuracy: 9364/10000 (94%)\n",
      "\n"
     ]
    }
   ],
   "source": [
    "set_random_seed(args.seed)\n",
    "vgg16_bn,optimizer = load_model('vgg16_bn','sgd',args)\n",
    "orig_loss, orig_acc = test(args, vgg16_bn, device, val_loader)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Prune using T=0.25"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['cnn_layers', '0']\n",
      "['cnn_layers', '3']\n",
      "['cnn_layers', '7']\n",
      "['cnn_layers', '10']\n",
      "['cnn_layers', '14']\n",
      "['cnn_layers', '17']\n",
      "['cnn_layers', '20']\n",
      "['cnn_layers', '24']\n",
      "['cnn_layers', '27']\n",
      "['cnn_layers', '30']\n",
      "['cnn_layers', '34']\n",
      "['cnn_layers', '37']\n",
      "\n",
      "Test set: Average loss: 2.1928, Accuracy: 1602/10000 (16%)\n",
      "\n",
      "Original accuracy 93.64, compressed model accuracy 16.02, accuracy drop 77.62\n"
     ]
    }
   ],
   "source": [
    "cluster_args = {\n",
    "    'cluster_layers' : {0:0,3:0,7:0,10:0,14:0,17:0,20:0,24:0,27:0,30:0,34:0,37:0,40:0},\n",
    "    'conv_feature_size' : 1,\n",
    "    'reshape_exists' : True,\n",
    "    'features' : 'both',\n",
    "    'channel_reduction' : 'fro',\n",
    "    'use_bias' : False,\n",
    "    'linkage_method' : 'ward',\n",
    "    'distance_metric' : 'euclidean',\n",
    "    'cluster_criterion' : 'hierarchical',\n",
    "    'distance_threshold' : 0.25,\n",
    "    'merge_criterion' : 'max_l2_norm',   \n",
    "    'tropnnc_features_and_threshold' : False, \n",
    "    'variant' : False, \n",
    "    'verbose' : False\n",
    "}\n",
    "\n",
    "model_modifier = cluster_model(vgg16_bn,cluster_args)\n",
    "vgg16_bn_clustered = model_modifier.cluster_model()#[int(nodes*drop_percentage) for nodes in [500,300]])\n",
    "vgg16_bn_clustered.cuda()\n",
    "\n",
    "val_loss_no_retrain, val_accuracy_no_retrain = test(args, vgg16_bn_clustered, device, val_loader)\n",
    "\n",
    "print('Original accuracy {}, compressed model accuracy {}, accuracy drop {}'.format(orig_acc,val_accuracy_no_retrain,orig_acc-val_accuracy_no_retrain))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### calculate #params and #flops"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "--- stats for original model ---\n",
      "  + Number of params: 14.73M\n",
      "  + Number of FLOPs: 0.63G\n",
      "--- stats for compressed model ---\n",
      "  + Number of params: 3.61M\n",
      "  + Number of FLOPs: 0.39G\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "389613298.0"
      ]
     },
     "execution_count": 38,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from src.compute_flops import print_model_param_nums,print_model_param_flops\n",
    "\n",
    "print('--- stats for original model ---')\n",
    "print_model_param_nums(vgg16_bn)\n",
    "print_model_param_flops(vgg16_bn.cpu(),input_res=32)\n",
    "\n",
    "print('--- stats for compressed model ---')\n",
    "print_model_param_nums(vgg16_bn_clustered)\n",
    "print_model_param_flops(vgg16_bn_clustered.cpu(),input_res=32)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Compress using iterative TropNNC, variant 1 (T = 0.014), no retrain"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Load pre-trained model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "loading state from epoch 152 and test loss 0.3201139727592468\n",
      "\n",
      "Test set: Average loss: 0.3201, Accuracy: 9364/10000 (94%)\n",
      "\n"
     ]
    }
   ],
   "source": [
    "set_random_seed(args.seed)\n",
    "vgg16_bn,optimizer = load_model('vgg16_bn','sgd',args)\n",
    "orig_loss, orig_acc = test(args, vgg16_bn, device, val_loader)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Prune using T=0.014"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 62,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['cnn_layers', '0']\n",
      "['cnn_layers', '3']\n",
      "['cnn_layers', '7']\n",
      "['cnn_layers', '10']\n",
      "['cnn_layers', '14']\n",
      "['cnn_layers', '17']\n",
      "['cnn_layers', '20']\n",
      "['cnn_layers', '24']\n",
      "['cnn_layers', '27']\n",
      "['cnn_layers', '30']\n",
      "['cnn_layers', '34']\n",
      "['cnn_layers', '37']\n",
      "\n",
      "Test set: Average loss: 0.2679, Accuracy: 9358/10000 (94%)\n",
      "\n",
      "Original accuracy 93.64, compressed model accuracy 93.58, accuracy drop 0.060000000000002274\n"
     ]
    }
   ],
   "source": [
    "cluster_args = {\n",
    "    'cluster_layers' : {0:0,3:0,7:0,10:0,14:0,17:0,20:0,24:0,27:0,30:0,34:0,37:0,40:0},\n",
    "    'conv_feature_size' : 1,\n",
    "    'reshape_exists' : True,\n",
    "    'features' : 'both',\n",
    "    'channel_reduction' : 'fro',\n",
    "    'use_bias' : False,\n",
    "    'linkage_method' : 'ward',\n",
    "    'distance_metric' : 'euclidean',\n",
    "    'cluster_criterion' : 'hierarchical',\n",
    "    'distance_threshold' : 0.014,\n",
    "    'merge_criterion' : 'tropnnc3iters',   \n",
    "    'tropnnc_features_and_threshold' : True, \n",
    "    'variant' : False,\n",
    "    'verbose' : False\n",
    "}\n",
    "\n",
    "model_modifier = cluster_model(vgg16_bn,cluster_args)\n",
    "vgg16_bn_clustered = model_modifier.cluster_model()#[int(nodes*drop_percentage) for nodes in [500,300]])\n",
    "vgg16_bn_clustered.cuda()\n",
    "\n",
    "val_loss_no_retrain, val_accuracy_no_retrain = test(args, vgg16_bn_clustered, device, val_loader)\n",
    "\n",
    "print('Original accuracy {}, compressed model accuracy {}, accuracy drop {}'.format(orig_acc,val_accuracy_no_retrain,orig_acc-val_accuracy_no_retrain))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Calculate #params and #flops"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 49,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "--- stats for original model ---\n",
      "  + Number of params: 14.73M\n",
      "  + Number of FLOPs: 0.63G\n",
      "--- stats for compressed model ---\n",
      "  + Number of params: 5.22M\n",
      "  + Number of FLOPs: 0.46G\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "455349114.0"
      ]
     },
     "execution_count": 49,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from src.compute_flops import print_model_param_nums,print_model_param_flops\n",
    "\n",
    "print('--- stats for original model ---')\n",
    "print_model_param_nums(vgg16_bn)\n",
    "print_model_param_flops(vgg16_bn.cpu(),input_res=32)\n",
    "\n",
    "print('--- stats for compressed model ---')\n",
    "print_model_param_nums(vgg16_bn_clustered)\n",
    "print_model_param_flops(vgg16_bn_clustered.cpu(),input_res=32)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Compress using TropNNC, variant 1 (T = 0.017), no retrain"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Load pre-trained model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 50,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "loading state from epoch 152 and test loss 0.3201139727592468\n",
      "\n",
      "Test set: Average loss: 0.3201, Accuracy: 9364/10000 (94%)\n",
      "\n"
     ]
    }
   ],
   "source": [
    "set_random_seed(args.seed)\n",
    "vgg16_bn,optimizer = load_model('vgg16_bn','sgd',args)\n",
    "orig_loss, orig_acc = test(args, vgg16_bn, device, val_loader)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Prune using T=0.017"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 61,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['cnn_layers', '0']\n",
      "['cnn_layers', '3']\n",
      "['cnn_layers', '7']\n",
      "['cnn_layers', '10']\n",
      "['cnn_layers', '14']\n",
      "['cnn_layers', '17']\n",
      "['cnn_layers', '20']\n",
      "['cnn_layers', '24']\n",
      "['cnn_layers', '27']\n",
      "['cnn_layers', '30']\n",
      "['cnn_layers', '34']\n",
      "['cnn_layers', '37']\n",
      "\n",
      "Test set: Average loss: 0.2556, Accuracy: 9302/10000 (93%)\n",
      "\n",
      "Original accuracy 93.64, compressed model accuracy 93.02, accuracy drop 0.6200000000000045\n"
     ]
    }
   ],
   "source": [
    "cluster_args = {\n",
    "    'cluster_layers' : {0:0,3:0,7:0,10:0,14:0,17:0,20:0,24:0,27:0,30:0,34:0,37:0,40:0},\n",
    "    'conv_feature_size' : 1,\n",
    "    'reshape_exists' : True,\n",
    "    'features' : 'both',\n",
    "    'channel_reduction' : 'fro',\n",
    "    'use_bias' : False,\n",
    "    'linkage_method' : 'ward',\n",
    "    'distance_metric' : 'euclidean',\n",
    "    'cluster_criterion' : 'hierarchical',\n",
    "    'distance_threshold' : 0.017,\n",
    "    'merge_criterion' : 'tropnnc3iters',   \n",
    "    'tropnnc_features_and_threshold' : True, \n",
    "    'variant' : False,\n",
    "    'verbose' : False\n",
    "}\n",
    "\n",
    "model_modifier = cluster_model(vgg16_bn,cluster_args)\n",
    "vgg16_bn_clustered = model_modifier.cluster_model()#[int(nodes*drop_percentage) for nodes in [500,300]])\n",
    "vgg16_bn_clustered.cuda()\n",
    "\n",
    "val_loss_no_retrain, val_accuracy_no_retrain = test(args, vgg16_bn_clustered, device, val_loader)\n",
    "\n",
    "print('Original accuracy {}, compressed model accuracy {}, accuracy drop {}'.format(orig_acc,val_accuracy_no_retrain,orig_acc-val_accuracy_no_retrain))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Calculate #params and #flops"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 56,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "--- stats for original model ---\n",
      "  + Number of params: 14.73M\n",
      "  + Number of FLOPs: 0.63G\n",
      "--- stats for compressed model ---\n",
      "  + Number of params: 3.61M\n",
      "  + Number of FLOPs: 0.42G\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "416316162.0"
      ]
     },
     "execution_count": 56,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from src.compute_flops import print_model_param_nums,print_model_param_flops\n",
    "\n",
    "print('--- stats for original model ---')\n",
    "print_model_param_nums(vgg16_bn)\n",
    "print_model_param_flops(vgg16_bn.cpu(),input_res=32)\n",
    "\n",
    "print('--- stats for compressed model ---')\n",
    "print_model_param_nums(vgg16_bn_clustered)\n",
    "print_model_param_flops(vgg16_bn_clustered.cpu(),input_res=32)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Compress using TropNNC, variant 1 (T = 0.02), no retrain"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Load pre-trained model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 57,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "loading state from epoch 152 and test loss 0.3201139727592468\n",
      "\n",
      "Test set: Average loss: 0.3201, Accuracy: 9364/10000 (94%)\n",
      "\n"
     ]
    }
   ],
   "source": [
    "set_random_seed(args.seed)\n",
    "vgg16_bn,optimizer = load_model('vgg16_bn','sgd',args)\n",
    "orig_loss, orig_acc = test(args, vgg16_bn, device, val_loader)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Prune using T=0.02"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 60,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['cnn_layers', '0']\n",
      "['cnn_layers', '3']\n",
      "['cnn_layers', '7']\n",
      "['cnn_layers', '10']\n",
      "['cnn_layers', '14']\n",
      "['cnn_layers', '17']\n",
      "['cnn_layers', '20']\n",
      "['cnn_layers', '24']\n",
      "['cnn_layers', '27']\n",
      "['cnn_layers', '30']\n",
      "['cnn_layers', '34']\n",
      "['cnn_layers', '37']\n",
      "\n",
      "Test set: Average loss: 0.2807, Accuracy: 9171/10000 (92%)\n",
      "\n",
      "Original accuracy 93.64, compressed model accuracy 91.71, accuracy drop 1.9300000000000068\n"
     ]
    }
   ],
   "source": [
    "cluster_args = {\n",
    "    'cluster_layers' : {0:0,3:0,7:0,10:0,14:0,17:0,20:0,24:0,27:0,30:0,34:0,37:0,40:0},\n",
    "    'conv_feature_size' : 1,\n",
    "    'reshape_exists' : True,\n",
    "    'features' : 'both',\n",
    "    'channel_reduction' : 'fro',\n",
    "    'use_bias' : False,\n",
    "    'linkage_method' : 'ward',\n",
    "    'distance_metric' : 'euclidean',\n",
    "    'cluster_criterion' : 'hierarchical',\n",
    "    'distance_threshold' : 0.02,\n",
    "    'merge_criterion' : 'tropnnc3iters',   \n",
    "    'tropnnc_features_and_threshold' : True, \n",
    "    'variant' : False, \n",
    "    'verbose' : False\n",
    "}\n",
    "\n",
    "model_modifier = cluster_model(vgg16_bn,cluster_args)\n",
    "vgg16_bn_clustered = model_modifier.cluster_model()#[int(nodes*drop_percentage) for nodes in [500,300]])\n",
    "vgg16_bn_clustered.cuda()\n",
    "\n",
    "val_loss_no_retrain, val_accuracy_no_retrain = test(args, vgg16_bn_clustered, device, val_loader)\n",
    "\n",
    "print('Original accuracy {}, compressed model accuracy {}, accuracy drop {}'.format(orig_acc,val_accuracy_no_retrain,orig_acc-val_accuracy_no_retrain))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Calculate #params and #flops"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 59,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "--- stats for original model ---\n",
      "  + Number of params: 14.73M\n",
      "  + Number of FLOPs: 0.63G\n",
      "--- stats for compressed model ---\n",
      "  + Number of params: 2.75M\n",
      "  + Number of FLOPs: 0.39G\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "389956402.0"
      ]
     },
     "execution_count": 59,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from src.compute_flops import print_model_param_nums,print_model_param_flops\n",
    "\n",
    "print('--- stats for original model ---')\n",
    "print_model_param_nums(vgg16_bn)\n",
    "print_model_param_flops(vgg16_bn.cpu(),input_res=32)\n",
    "\n",
    "print('--- stats for compressed model ---')\n",
    "print_model_param_nums(vgg16_bn_clustered)\n",
    "print_model_param_flops(vgg16_bn_clustered.cpu(),input_res=32)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "myenv",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.18"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
