{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "4ea497ac",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import scipy.sparse as sp\n",
    "import sklearn\n",
    "import sklearn.metrics\n",
    "import torch\n",
    "import pandas as pd\n",
    "import random\n",
    "\n",
    "def boolean_string(s):\n",
    "    if s not in {'False', 'True'}:\n",
    "        raise ValueError('Not a valid boolean string')\n",
    "    return s == 'True'\n",
    "\n",
    "def encode_onehot(labels):\n",
    "    classes = set(labels)\n",
    "    classes_dict = {c: np.identity(len(classes))[i, :] for i, c in\n",
    "                    enumerate(classes)}\n",
    "    labels_onehot = np.array(list(map(classes_dict.get, labels)),\n",
    "                             dtype=np.int32)\n",
    "    return labels_onehot\n",
    "\n",
    "\n",
    "def loaddata(filename):\n",
    "    df = pd.read_csv(filename, header=None, delimiter=\",\")\n",
    "    a = np.array(df.as_matrix())\n",
    "    return a\n",
    "\n",
    "\n",
    "def load_raw_ts(path, dataset, tensor_format=True):\n",
    "    path = path + \"raw/\" + dataset + \"/\"\n",
    "    x_train = np.load(path + 'X_train.npy')\n",
    "    y_train = np.load(path + 'y_train.npy')\n",
    "    x_test = np.load(path + 'X_test.npy')\n",
    "    y_test = np.load(path + 'y_test.npy')\n",
    "    ts = np.concatenate((x_train, x_test), axis=0)\n",
    "    ts = np.transpose(ts, axes=(0, 2, 1))\n",
    "    labels = np.concatenate((y_train, y_test), axis=0)\n",
    "    nclass = int(np.amax(labels)) + 1\n",
    "\n",
    "\n",
    "    train_size = y_train.shape[0]\n",
    "\n",
    "    total_size = labels.shape[0]\n",
    "    idx_train = range(train_size)\n",
    "    idx_val = range(train_size, total_size)\n",
    "    idx_test = range(train_size, total_size)\n",
    "\n",
    "    if tensor_format:\n",
    "        # features = torch.FloatTensor(np.array(features))\n",
    "        ts = torch.FloatTensor(np.array(ts))\n",
    "        labels = torch.LongTensor(labels)\n",
    "\n",
    "        idx_train = torch.LongTensor(idx_train)\n",
    "        idx_val = torch.LongTensor(idx_val)\n",
    "        idx_test = torch.LongTensor(idx_test)\n",
    "\n",
    "    return ts, labels, idx_train, idx_val, idx_test, nclass\n",
    "\n",
    "\n",
    "def normalize(mx):\n",
    "    \"\"\"Row-normalize sparse matrix\"\"\"\n",
    "    row_sums = mx.sum(axis=1)\n",
    "    mx = mx.astype('float32')\n",
    "    row_sums_inverse = 1 / row_sums\n",
    "    f = mx.multiply(row_sums_inverse)\n",
    "    return sp.csr_matrix(f).astype('float32')\n",
    "\n",
    "\n",
    "def accuracy(output, labels):\n",
    "    preds = output.max(1)[1].cpu().numpy()\n",
    "    labels = labels.cpu().numpy()\n",
    "    accuracy_score = (sklearn.metrics.accuracy_score(labels, preds))\n",
    "\n",
    "    return accuracy_score\n",
    "\n",
    "\n",
    "\n",
    "def euclidean_dist(x, y):\n",
    "    # x: N x D\n",
    "    # y: M x D\n",
    "    n = x.size(0)\n",
    "    m = y.size(0)\n",
    "    d = x.size(1)\n",
    "    assert d == y.size(1)\n",
    "\n",
    "    x = x.unsqueeze(1).expand(n, m, d)\n",
    "    y = y.unsqueeze(0).expand(n, m, d)\n",
    "\n",
    "    return torch.pow(x - y, 2).sum(2)\n",
    "\n",
    "\n",
    "def output_conv_size(in_size, kernel_size, stride, padding):\n",
    "\n",
    "    output = int((in_size - kernel_size + 2 * padding) / stride) + 1\n",
    "\n",
    "    return output\n",
    "\n",
    "def dump_embedding(proto_embed, sample_embed, labels, dump_file='./plot/embeddings.txt'):\n",
    "    proto_embed = proto_embed.cpu().detach().numpy()\n",
    "    sample_embed = sample_embed.cpu().detach().numpy()\n",
    "    embed = np.concatenate((proto_embed, sample_embed), axis=0)\n",
    "\n",
    "    nclass = proto_embed.shape[0]\n",
    "    labels = np.concatenate((np.asarray([i for i in range(nclass)]),\n",
    "                             labels.squeeze().cpu().detach().numpy()), axis=0)\n",
    "\n",
    "    with open(dump_file, 'w') as f:\n",
    "        for i in range(len(embed)):\n",
    "            label = str(labels[i])\n",
    "            line = label + \",\" + \",\".join([\"%.4f\" % j for j in embed[i].tolist()])\n",
    "            f.write(line + '\\n')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "db2521bd",
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n",
    "import numpy as np\n",
    "\n",
    "class TapNet(nn.Module):\n",
    "\n",
    "    def __init__(self, nfeat, len_ts, nclass, dropout, filters, kernels, dilation, layers, use_rp, rp_params,\n",
    "                 use_att=True, use_metric=False, use_lstm=False, use_cnn=True, lstm_dim=128):\n",
    "        super(TapNet, self).__init__()\n",
    "        self.nclass = nclass\n",
    "        self.dropout = dropout\n",
    "        self.use_metric = use_metric\n",
    "        self.use_lstm = use_lstm\n",
    "        self.use_cnn = use_cnn\n",
    "\n",
    "        # parameters for random projection\n",
    "        self.use_rp = use_rp\n",
    "        self.rp_group, self.rp_dim = rp_params\n",
    "\n",
    "        if True:\n",
    "            # LSTM\n",
    "            self.channel = nfeat\n",
    "            self.ts_length = len_ts\n",
    "\n",
    "            self.lstm_dim = lstm_dim\n",
    "            self.lstm = nn.LSTM(self.ts_length, self.lstm_dim)\n",
    "\n",
    "            paddings = [0, 0, 0]\n",
    "            if self.use_rp:\n",
    "                self.conv_1_models = nn.ModuleList()\n",
    "                self.idx = []\n",
    "                for i in range(self.rp_group):\n",
    "                    self.conv_1_models.append(nn.Conv1d(self.rp_dim, filters[0], kernel_size=kernels[0], dilation=dilation, stride=1, padding=paddings[0]))\n",
    "                    self.idx.append(np.random.permutation(nfeat)[0: self.rp_dim])\n",
    "            else:\n",
    "                self.conv_1 = nn.Conv1d(self.channel, filters[0], kernel_size=kernels[0], dilation=dilation, stride=1, padding=paddings[0])\n",
    "\n",
    "            self.conv_bn_1 = nn.BatchNorm1d(filters[0])\n",
    "\n",
    "            self.conv_2 = nn.Conv1d(filters[0], filters[1], kernel_size=kernels[1], stride=1, padding=paddings[1])\n",
    "\n",
    "            self.conv_bn_2 = nn.BatchNorm1d(filters[1])\n",
    "\n",
    "            self.conv_3 = nn.Conv1d(filters[1], filters[2], kernel_size=kernels[2], stride=1, padding=paddings[2])\n",
    "\n",
    "            self.conv_bn_3 = nn.BatchNorm1d(filters[2])\n",
    "\n",
    "            # compute the size of input for fully connected layers\n",
    "            fc_input = 0\n",
    "            if self.use_cnn:\n",
    "                conv_size = len_ts\n",
    "                for i in range(len(filters)):\n",
    "                    conv_size = output_conv_size(conv_size, kernels[i], 1, paddings[i])\n",
    "                fc_input += conv_size \n",
    "                #* filters[-1]\n",
    "            if self.use_lstm:\n",
    "                fc_input += conv_size * self.lstm_dim\n",
    "            \n",
    "            if self.use_rp:\n",
    "                fc_input = self.rp_group * filters[2] + self.lstm_dim\n",
    "\n",
    "\n",
    "        # Representation mapping function\n",
    "        layers = [fc_input] + layers\n",
    "        print(\"Layers\", layers)\n",
    "        self.mapping = nn.Sequential()\n",
    "        for i in range(len(layers) - 2):\n",
    "            self.mapping.add_module(\"fc_\" + str(i), nn.Linear(layers[i], layers[i + 1]))\n",
    "            self.mapping.add_module(\"bn_\" + str(i), nn.BatchNorm1d(layers[i + 1]))\n",
    "            self.mapping.add_module(\"relu_\" + str(i), nn.LeakyReLU())\n",
    "\n",
    "        # add last layer\n",
    "        self.mapping.add_module(\"fc_\" + str(len(layers) - 2), nn.Linear(layers[-2], layers[-1]))\n",
    "        if len(layers) == 2:  # if only one layer, add batch normalization\n",
    "            self.mapping.add_module(\"bn_\" + str(len(layers) - 2), nn.BatchNorm1d(layers[-1]))\n",
    "\n",
    "        # Attention\n",
    "        att_dim, semi_att_dim = 128, 128\n",
    "        self.use_att = use_att\n",
    "        if self.use_att:\n",
    "            self.att_models = nn.ModuleList()\n",
    "            for _ in range(nclass):\n",
    "\n",
    "                att_model = nn.Sequential(\n",
    "                    nn.Linear(layers[-1], att_dim),\n",
    "                    nn.Tanh(),\n",
    "                    nn.Linear(att_dim, 1)\n",
    "                )\n",
    "                self.att_models.append(att_model)\n",
    "\n",
    "        \n",
    "    def forward(self, input):\n",
    "        x, labels, idx_train, idx_val, idx_test = input  # x is N * L, where L is the time-series feature dimension\n",
    "\n",
    "        if True:\n",
    "            N = x.size(0)\n",
    "\n",
    "            # LSTM\n",
    "            if self.use_lstm:\n",
    "                x_lstm = self.lstm(x)[0]\n",
    "                x_lstm = x_lstm.mean(1)\n",
    "                x_lstm = x_lstm.view(N, -1)\n",
    "\n",
    "            if self.use_cnn:\n",
    "                # Covolutional Network\n",
    "                # input ts: # N * C * L\n",
    "                if self.use_rp:\n",
    "                    for i in range(len(self.conv_1_models)):\n",
    "                        #x_conv = x\n",
    "                        x_conv = self.conv_1_models[i](x[:, self.idx[i], :])\n",
    "                        x_conv = self.conv_bn_1(x_conv)\n",
    "                        x_conv = F.leaky_relu(x_conv)\n",
    "\n",
    "                        x_conv = self.conv_2(x_conv)\n",
    "                        x_conv = self.conv_bn_2(x_conv)\n",
    "                        x_conv = F.leaky_relu(x_conv)\n",
    "\n",
    "                        x_conv = self.conv_3(x_conv)\n",
    "                        x_conv = self.conv_bn_3(x_conv)\n",
    "                        x_conv = F.leaky_relu(x_conv)\n",
    "\n",
    "                        x_conv = torch.mean(x_conv, 2)\n",
    "\n",
    "                        if i == 0:\n",
    "                            x_conv_sum = x_conv\n",
    "                        else:\n",
    "                            x_conv_sum = torch.cat([x_conv_sum, x_conv], dim=1)\n",
    "\n",
    "                    x_conv = x_conv_sum\n",
    "                else:\n",
    "                    x_conv = x\n",
    "                    x_conv = self.conv_1(x_conv)  # N * C * L\n",
    "                    x_conv = self.conv_bn_1(x_conv)\n",
    "                    x_conv = F.leaky_relu(x_conv)\n",
    "\n",
    "                    x_conv = self.conv_2(x_conv)\n",
    "                    x_conv = self.conv_bn_2(x_conv)\n",
    "                    x_conv = F.leaky_relu(x_conv)\n",
    "\n",
    "                    x_conv = self.conv_3(x_conv)\n",
    "                    x_conv = self.conv_bn_3(x_conv)\n",
    "                    x_conv = F.leaky_relu(x_conv)\n",
    "\n",
    "                    x_conv = x_conv.view(N, -1)\n",
    "\n",
    "            if self.use_lstm and self.use_cnn:\n",
    "                x = torch.cat([x_conv, x_lstm], dim=1)\n",
    "            elif self.use_lstm:\n",
    "                x = x_lstm\n",
    "            elif self.use_cnn:\n",
    "                x = x_conv\n",
    "            #\n",
    "\n",
    "        # linear mapping to low-dimensional space\n",
    "        x = self.mapping(x)\n",
    "\n",
    "        # generate the class protocal with dimension C * D (nclass * dim)\n",
    "        proto_list = []\n",
    "        for i in range(self.nclass):\n",
    "            idx = (labels[idx_train].squeeze() == i).nonzero().squeeze(1)\n",
    "            if self.use_att:\n",
    "                A = self.att_models[i](x[idx_train][idx])  # N_k * 1\n",
    "                A = torch.transpose(A, 1, 0)  # 1 * N_k\n",
    "                A = F.softmax(A, dim=1)  # softmax over N_k\n",
    "\n",
    "                class_repr = torch.mm(A, x[idx_train][idx]) # 1 * L\n",
    "                class_repr = torch.transpose(class_repr, 1, 0)  # L * 1\n",
    "            else:  # if do not use attention, simply use the mean of training samples with the same labels.\n",
    "                class_repr = x[idx_train][idx].mean(0)  # L * 1\n",
    "            proto_list.append(class_repr.view(1, -1))\n",
    "        x_proto = torch.cat(proto_list, dim=0)\n",
    "\n",
    "        # prototype distance\n",
    "        proto_dists = euclidean_dist(x_proto, x_proto)\n",
    "        proto_dists = torch.exp(-0.5*proto_dists)\n",
    "        num_proto_pairs = int(self.nclass * (self.nclass - 1) / 2)\n",
    "        proto_dist = torch.sum(proto_dists) / num_proto_pairs\n",
    "\n",
    "        dists = euclidean_dist(x, x_proto)\n",
    "\n",
    "        dump_embedding(x_proto, x, labels)\n",
    "        return torch.exp(-0.5*dists), proto_dist"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "2a33ad24",
   "metadata": {},
   "outputs": [
    {
     "ename": "NameError",
     "evalue": "name 'features' is not defined",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mNameError\u001b[0m                                 Traceback (most recent call last)",
      "\u001b[0;32m<ipython-input-5-99db443abfa1>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m model = TapNet(nfeat=features.shape[1],\n\u001b[0m\u001b[1;32m      2\u001b[0m                    \u001b[0mlen_ts\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mfeatures\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mshape\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m2\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      3\u001b[0m                    \u001b[0mlayers\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mlayers\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      4\u001b[0m                    \u001b[0mnclass\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m2\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      5\u001b[0m                    \u001b[0mdropout\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m0.5\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;31mNameError\u001b[0m: name 'features' is not defined"
     ]
    }
   ],
   "source": [
    "model = TapNet(nfeat=5,\n",
    "                   len_ts=2000,\n",
    "                   layers=3,\n",
    "                   nclass=2,\n",
    "                   dropout=0.5,\n",
    "                   use_lstm=True,\n",
    "                   use_cnn=True,\n",
    "                   filters=args.filters,\n",
    "                   dilation=args.dilation,\n",
    "                   kernels=args.kernels,\n",
    "                   use_metric=args.use_metric,\n",
    "                   use_rp=args.use_rp,\n",
    "                   rp_params=args.rp_params,\n",
    "                   lstm_dim=args.lstm_dim\n",
    "                   )\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "0bb623e6",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.10"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
