{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "import os\n",
    "from pprint import pprint"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "# nodes=[4, [7] * 4, [2] * 28]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(555, 304)"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "agg_mat = pd.read_csv('agg_mat.csv')\n",
    "# agg_mat\n",
    "agg_mat_max = agg_mat.values\n",
    "agg_mat_max = agg_mat_max[:,1:]\n",
    "agg_mat_max.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "nbts: 305\n",
      "nts: 555\n",
      "naggts: 250\n"
     ]
    }
   ],
   "source": [
    "nbts = agg_mat.shape[1]\n",
    "nts  = agg_mat.shape[0]\n",
    "naggts = nts - nbts\n",
    "print(\"nbts:\", nbts)\n",
    "print(\"nts:\", nts)\n",
    "print(\"naggts:\", naggts)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "data = pd.read_csv('TourismData_v3.csv')\n",
    "data = data.iloc[:,2:]\n",
    "# data = data.drop([\"Unnamed: 0\"], axis=1)\n",
    "# data_bts = data.iloc[:,-nbts+1:]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>AAAHol</th>\n",
       "      <th>AAAVis</th>\n",
       "      <th>AAABus</th>\n",
       "      <th>AAAOth</th>\n",
       "      <th>AABHol</th>\n",
       "      <th>AABVis</th>\n",
       "      <th>AABBus</th>\n",
       "      <th>AABOth</th>\n",
       "      <th>ABAHol</th>\n",
       "      <th>ABAVis</th>\n",
       "      <th>...</th>\n",
       "      <th>GBBBus</th>\n",
       "      <th>GBBOth</th>\n",
       "      <th>GBCHol</th>\n",
       "      <th>GBCVis</th>\n",
       "      <th>GBCBus</th>\n",
       "      <th>GBCOth</th>\n",
       "      <th>GBDHol</th>\n",
       "      <th>GBDVis</th>\n",
       "      <th>GBDBus</th>\n",
       "      <th>GBDOth</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>2015.444457</td>\n",
       "      <td>1379.273926</td>\n",
       "      <td>230.099578</td>\n",
       "      <td>118.238146</td>\n",
       "      <td>936.208816</td>\n",
       "      <td>297.944688</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>915.526615</td>\n",
       "      <td>361.161122</td>\n",
       "      <td>...</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>7.536223</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>1.628948</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.811856</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>9.478051</td>\n",
       "      <td>0.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>514.337600</td>\n",
       "      <td>645.980857</td>\n",
       "      <td>450.509894</td>\n",
       "      <td>80.836085</td>\n",
       "      <td>139.829461</td>\n",
       "      <td>96.072530</td>\n",
       "      <td>3.800647</td>\n",
       "      <td>5.862538</td>\n",
       "      <td>211.001057</td>\n",
       "      <td>346.151398</td>\n",
       "      <td>...</td>\n",
       "      <td>1.045797</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>5.296459</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.522899</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>532.097470</td>\n",
       "      <td>683.284592</td>\n",
       "      <td>520.458259</td>\n",
       "      <td>138.306554</td>\n",
       "      <td>117.980175</td>\n",
       "      <td>97.113121</td>\n",
       "      <td>28.431680</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>227.458798</td>\n",
       "      <td>185.651451</td>\n",
       "      <td>...</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>2.945006</td>\n",
       "      <td>1.425324</td>\n",
       "      <td>9.924744</td>\n",
       "      <td>3.100121</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>534.059083</td>\n",
       "      <td>819.807646</td>\n",
       "      <td>755.506898</td>\n",
       "      <td>97.089844</td>\n",
       "      <td>202.266724</td>\n",
       "      <td>196.414355</td>\n",
       "      <td>10.812915</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>1273.068333</td>\n",
       "      <td>265.980973</td>\n",
       "      <td>...</td>\n",
       "      <td>11.461824</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>26.419176</td>\n",
       "      <td>13.690603</td>\n",
       "      <td>2.312088</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>10.958005</td>\n",
       "      <td>2.312088</td>\n",
       "      <td>0.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>505.222272</td>\n",
       "      <td>693.531752</td>\n",
       "      <td>880.152314</td>\n",
       "      <td>82.210784</td>\n",
       "      <td>121.775526</td>\n",
       "      <td>73.542768</td>\n",
       "      <td>12.185418</td>\n",
       "      <td>24.524678</td>\n",
       "      <td>259.541675</td>\n",
       "      <td>169.085846</td>\n",
       "      <td>...</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>23.789282</td>\n",
       "      <td>67.846207</td>\n",
       "      <td>1.282767</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>223</th>\n",
       "      <td>383.526216</td>\n",
       "      <td>838.269610</td>\n",
       "      <td>455.637579</td>\n",
       "      <td>458.064241</td>\n",
       "      <td>86.281072</td>\n",
       "      <td>83.870793</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>228.048826</td>\n",
       "      <td>243.160300</td>\n",
       "      <td>...</td>\n",
       "      <td>7.874448</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>49.899947</td>\n",
       "      <td>8.300225</td>\n",
       "      <td>17.633478</td>\n",
       "      <td>8.218562</td>\n",
       "      <td>4.121631</td>\n",
       "      <td>0.408894</td>\n",
       "      <td>1.625820</td>\n",
       "      <td>0.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>224</th>\n",
       "      <td>484.959998</td>\n",
       "      <td>512.190298</td>\n",
       "      <td>451.742958</td>\n",
       "      <td>194.214472</td>\n",
       "      <td>120.465489</td>\n",
       "      <td>46.129082</td>\n",
       "      <td>251.544316</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>181.893020</td>\n",
       "      <td>333.526684</td>\n",
       "      <td>...</td>\n",
       "      <td>0.421996</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>80.058887</td>\n",
       "      <td>37.306013</td>\n",
       "      <td>109.024164</td>\n",
       "      <td>46.447153</td>\n",
       "      <td>11.661140</td>\n",
       "      <td>3.557735</td>\n",
       "      <td>4.448534</td>\n",
       "      <td>0.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>225</th>\n",
       "      <td>399.867668</td>\n",
       "      <td>907.197296</td>\n",
       "      <td>527.255352</td>\n",
       "      <td>102.575984</td>\n",
       "      <td>201.400342</td>\n",
       "      <td>118.033070</td>\n",
       "      <td>6.457149</td>\n",
       "      <td>4.387921</td>\n",
       "      <td>444.169346</td>\n",
       "      <td>229.721638</td>\n",
       "      <td>...</td>\n",
       "      <td>35.375093</td>\n",
       "      <td>0.273247</td>\n",
       "      <td>52.156131</td>\n",
       "      <td>2.093902</td>\n",
       "      <td>50.283538</td>\n",
       "      <td>3.319366</td>\n",
       "      <td>0.754941</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>226</th>\n",
       "      <td>347.337052</td>\n",
       "      <td>836.958504</td>\n",
       "      <td>978.793782</td>\n",
       "      <td>386.733133</td>\n",
       "      <td>76.961404</td>\n",
       "      <td>139.986929</td>\n",
       "      <td>10.674886</td>\n",
       "      <td>8.834427</td>\n",
       "      <td>324.585224</td>\n",
       "      <td>217.713292</td>\n",
       "      <td>...</td>\n",
       "      <td>10.723090</td>\n",
       "      <td>39.292496</td>\n",
       "      <td>8.344998</td>\n",
       "      <td>7.697995</td>\n",
       "      <td>43.270319</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>5.180648</td>\n",
       "      <td>0.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>227</th>\n",
       "      <td>287.962683</td>\n",
       "      <td>905.432815</td>\n",
       "      <td>851.208690</td>\n",
       "      <td>227.742052</td>\n",
       "      <td>155.903481</td>\n",
       "      <td>221.231957</td>\n",
       "      <td>21.820660</td>\n",
       "      <td>5.157210</td>\n",
       "      <td>330.738835</td>\n",
       "      <td>277.557351</td>\n",
       "      <td>...</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>2.418446</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.762140</td>\n",
       "      <td>1.055685</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>9.966514</td>\n",
       "      <td>0.0</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>228 rows × 304 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "          AAAHol       AAAVis      AAABus      AAAOth      AABHol      AABVis  \\\n",
       "0    2015.444457  1379.273926  230.099578  118.238146  936.208816  297.944688   \n",
       "1     514.337600   645.980857  450.509894   80.836085  139.829461   96.072530   \n",
       "2     532.097470   683.284592  520.458259  138.306554  117.980175   97.113121   \n",
       "3     534.059083   819.807646  755.506898   97.089844  202.266724  196.414355   \n",
       "4     505.222272   693.531752  880.152314   82.210784  121.775526   73.542768   \n",
       "..           ...          ...         ...         ...         ...         ...   \n",
       "223   383.526216   838.269610  455.637579  458.064241   86.281072   83.870793   \n",
       "224   484.959998   512.190298  451.742958  194.214472  120.465489   46.129082   \n",
       "225   399.867668   907.197296  527.255352  102.575984  201.400342  118.033070   \n",
       "226   347.337052   836.958504  978.793782  386.733133   76.961404  139.986929   \n",
       "227   287.962683   905.432815  851.208690  227.742052  155.903481  221.231957   \n",
       "\n",
       "         AABBus     AABOth       ABAHol      ABAVis  ...     GBBBus  \\\n",
       "0      0.000000   0.000000   915.526615  361.161122  ...   0.000000   \n",
       "1      3.800647   5.862538   211.001057  346.151398  ...   1.045797   \n",
       "2     28.431680   0.000000   227.458798  185.651451  ...   0.000000   \n",
       "3     10.812915   0.000000  1273.068333  265.980973  ...  11.461824   \n",
       "4     12.185418  24.524678   259.541675  169.085846  ...   0.000000   \n",
       "..          ...        ...          ...         ...  ...        ...   \n",
       "223    0.000000   0.000000   228.048826  243.160300  ...   7.874448   \n",
       "224  251.544316   0.000000   181.893020  333.526684  ...   0.421996   \n",
       "225    6.457149   4.387921   444.169346  229.721638  ...  35.375093   \n",
       "226   10.674886   8.834427   324.585224  217.713292  ...  10.723090   \n",
       "227   21.820660   5.157210   330.738835  277.557351  ...   0.000000   \n",
       "\n",
       "        GBBOth     GBCHol     GBCVis      GBCBus     GBCOth     GBDHol  \\\n",
       "0     0.000000   7.536223   0.000000    1.628948   0.000000   0.811856   \n",
       "1     0.000000   0.000000   0.000000    5.296459   0.000000   0.522899   \n",
       "2     0.000000   2.945006   1.425324    9.924744   3.100121   0.000000   \n",
       "3     0.000000  26.419176  13.690603    2.312088   0.000000   0.000000   \n",
       "4     0.000000  23.789282  67.846207    1.282767   0.000000   0.000000   \n",
       "..         ...        ...        ...         ...        ...        ...   \n",
       "223   0.000000  49.899947   8.300225   17.633478   8.218562   4.121631   \n",
       "224   0.000000  80.058887  37.306013  109.024164  46.447153  11.661140   \n",
       "225   0.273247  52.156131   2.093902   50.283538   3.319366   0.754941   \n",
       "226  39.292496   8.344998   7.697995   43.270319   0.000000   0.000000   \n",
       "227   0.000000   2.418446   0.000000    0.762140   1.055685   0.000000   \n",
       "\n",
       "        GBDVis    GBDBus  GBDOth  \n",
       "0     0.000000  9.478051     0.0  \n",
       "1     0.000000  0.000000     0.0  \n",
       "2     0.000000  0.000000     0.0  \n",
       "3    10.958005  2.312088     0.0  \n",
       "4     0.000000  0.000000     0.0  \n",
       "..         ...       ...     ...  \n",
       "223   0.408894  1.625820     0.0  \n",
       "224   3.557735  4.448534     0.0  \n",
       "225   0.000000  0.000000     0.0  \n",
       "226   0.000000  5.180648     0.0  \n",
       "227   0.000000  9.966514     0.0  \n",
       "\n",
       "[228 rows x 304 columns]"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "better_names = []\n",
    "for name in list(data.columns):\n",
    "    name_split = [ 'T', name[0], name[1], name[2], name[3:] ]\n",
    "    name_join  = (\"-\").join(name_split)\n",
    "    better_names.append(name_join)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "# better_names"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "tags = []\n",
    "for ts_name in better_names:\n",
    "    path_list = [] \n",
    "    ts_split  = ts_name\n",
    "    ts_split  = ts_split.split(\"-\")\n",
    "#     ts_split.insert(0,'T')\n",
    "    for idx in range(1,len(ts_split)+1):\n",
    "        path_list.append(\"-\".join(ts_split[:idx]))\n",
    "    tags.append(path_list)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [],
   "source": [
    "tags = np.array(tags)\n",
    "np.savetxt(\"tags.csv\", tags, delimiter=\",\", fmt='%s')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([['T', 'T-A', 'T-A-A', 'T-A-A-A', 'T-A-A-A-Hol'],\n",
       "       ['T', 'T-A', 'T-A-A', 'T-A-A-A', 'T-A-A-A-Vis'],\n",
       "       ['T', 'T-A', 'T-A-A', 'T-A-A-A', 'T-A-A-A-Bus'],\n",
       "       ...,\n",
       "       ['T', 'T-G', 'T-G-B', 'T-G-B-D', 'T-G-B-D-Vis'],\n",
       "       ['T', 'T-G', 'T-G-B', 'T-G-B-D', 'T-G-B-D-Bus'],\n",
       "       ['T', 'T-G', 'T-G-B', 'T-G-B-D', 'T-G-B-D-Oth']], dtype='<U11')"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tags"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [],
   "source": [
    "# # improve column names\n",
    "# colnames = []\n",
    "# for name in list(data.columns):\n",
    "# #     name_reverse = eval(name)[::-1]\n",
    "#     name_split = name.split(\"-\")\n",
    "#     if len(name_split) > 1:\n",
    "#         name_split[0],name_split[1] = name_split[1],name_split[0]\n",
    "#     better_name =  (\"-\").join(name_split)\n",
    "# #     name_reverse = name_split[::-1]\n",
    "#     colnames.append(better_name)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [],
   "source": [
    "# # take names of bottom time series\n",
    "# bts_names = colnames[-nbts+1:]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [],
   "source": [
    "# tags = []\n",
    "# for ts_name in bts_names:\n",
    "#     path_list = [] \n",
    "#     ts_split  = ts_name\n",
    "#     ts_split  = 'T-'+ts_name\n",
    "#     ts_split  = ts_split.split(\"-\")\n",
    "# #     ts_split.insert(0,'T')\n",
    "#     for idx in range(1,len(ts_split)+1):\n",
    "#         path_list.append(\"-\".join(ts_split[:idx]))\n",
    "# #     print(path_list)\n",
    "#     tags.append(path_list)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [],
   "source": [
    "# tags = np.array(tags)\n",
    "# np.savetxt(\"tags.csv\", tags, delimiter=\",\", fmt='%s')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [],
   "source": [
    "# tags"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.6"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
