{
 "metadata": {
  "orig_nbformat": 4,
  "kernelspec": {
   "name": "python3",
   "display_name": "Python 3.9.1 64-bit ('jupyter': conda)"
  },
  "language_info": {
   "name": "python",
   "version": "3.9.1",
   "mimetype": "text/x-python",
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "pygments_lexer": "ipython3",
   "nbconvert_exporter": "python",
   "file_extension": ".py"
  },
  "interpreter": {
   "hash": "fa4135110663b2192d0748208073f3a72fe675f4cc13c80dde80de04c19dfefa"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2,
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 11,
   "source": [
    "import json\n",
    "import math\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import pickle as pickle\n",
    "import datetime\n",
    "from datetime import date"
   ],
   "outputs": [],
   "metadata": {}
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "source": [
    "data_name = 'harris'\n",
    "data_root_path = '/data/zhimengj/Human_Mob/Harris/'\n",
    "data_save_path = '/data/zhimengj/dataset/Harris/'\n",
    "Grid_PATH = data_root_path + 'Grid_Map/Harris_010.p'\n",
    "\n",
    "### save nodes features/labels\n",
    "Nodes_PATH = data_root_path + 'Node_Features/Harris_all_labels.csv'\n",
    "OUT_NODE_FEAT = data_save_path + '{}_node.npy'.format(data_name)\n",
    "OUT_NODE_SFEAT = data_save_path + '{}_Snode.p'.format(data_name)\n",
    "OUT_NODE_label = data_save_path + '{}_Ynode.npy'.format(data_name)\n",
    "OUT_NODE_label2 = data_save_path + '{}_Ynode2.npy'.format(data_name)\n",
    "### save temporal links\n",
    "time_duration = 1\n",
    "OUT_DF = data_save_path + '{}_edge_{}.csv'.format(data_name, time_duration)\n",
    "OUT_FEAT = data_save_path + '{}_edge_{}.npy'.format(data_name, time_duration)"
   ],
   "outputs": [],
   "metadata": {}
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "source": [
    "with open(Grid_PATH, \"rb\") as f:\n",
    "    grid = pickle.load(f) ## remove column 0, 5, 9, 10\n",
    "index_name = grid.index.tolist()\n",
    "index_name"
   ],
   "outputs": [
    {
     "output_type": "execute_result",
     "data": {
      "text/plain": [
       "[(1, 64),\n",
       " (1, 65),\n",
       " (2, 62),\n",
       " (2, 63),\n",
       " (2, 64),\n",
       " (3, 59),\n",
       " (3, 60),\n",
       " (3, 61),\n",
       " (3, 62),\n",
       " (3, 63),\n",
       " (3, 64),\n",
       " (4, 56),\n",
       " (4, 57),\n",
       " (4, 58),\n",
       " (4, 59),\n",
       " (4, 60),\n",
       " (4, 61),\n",
       " (4, 62),\n",
       " (4, 63),\n",
       " (5, 53),\n",
       " (5, 54),\n",
       " (5, 55),\n",
       " (5, 56),\n",
       " (5, 57),\n",
       " (5, 58),\n",
       " (5, 59),\n",
       " (5, 60),\n",
       " (5, 61),\n",
       " (5, 62),\n",
       " (5, 63),\n",
       " (6, 50),\n",
       " (6, 51),\n",
       " (6, 52),\n",
       " (6, 53),\n",
       " (6, 54),\n",
       " (6, 55),\n",
       " (6, 56),\n",
       " (6, 57),\n",
       " (6, 58),\n",
       " (6, 59),\n",
       " (6, 60),\n",
       " (6, 61),\n",
       " (6, 62),\n",
       " (7, 48),\n",
       " (7, 49),\n",
       " (7, 50),\n",
       " (7, 51),\n",
       " (7, 52),\n",
       " (7, 53),\n",
       " (7, 54),\n",
       " (7, 55),\n",
       " (7, 56),\n",
       " (7, 57),\n",
       " (7, 58),\n",
       " (7, 59),\n",
       " (7, 60),\n",
       " (7, 61),\n",
       " (7, 62),\n",
       " (8, 45),\n",
       " (8, 46),\n",
       " (8, 47),\n",
       " (8, 48),\n",
       " (8, 49),\n",
       " (8, 50),\n",
       " (8, 51),\n",
       " (8, 52),\n",
       " (8, 53),\n",
       " (8, 54),\n",
       " (8, 55),\n",
       " (8, 56),\n",
       " (8, 57),\n",
       " (8, 58),\n",
       " (8, 59),\n",
       " (8, 60),\n",
       " (8, 61),\n",
       " (8, 62),\n",
       " (9, 42),\n",
       " (9, 43),\n",
       " (9, 44),\n",
       " (9, 45),\n",
       " (9, 46),\n",
       " (9, 47),\n",
       " (9, 48),\n",
       " (9, 49),\n",
       " (9, 50),\n",
       " (9, 51),\n",
       " (9, 52),\n",
       " (9, 53),\n",
       " (9, 54),\n",
       " (9, 55),\n",
       " (9, 56),\n",
       " (9, 57),\n",
       " (9, 58),\n",
       " (9, 59),\n",
       " (9, 60),\n",
       " (9, 61),\n",
       " (9, 62),\n",
       " (10, 39),\n",
       " (10, 40),\n",
       " (10, 41),\n",
       " (10, 42),\n",
       " (10, 43),\n",
       " (10, 44),\n",
       " (10, 45),\n",
       " (10, 46),\n",
       " (10, 47),\n",
       " (10, 48),\n",
       " (10, 49),\n",
       " (10, 50),\n",
       " (10, 51),\n",
       " (10, 52),\n",
       " (10, 53),\n",
       " (10, 54),\n",
       " (10, 55),\n",
       " (10, 56),\n",
       " (10, 57),\n",
       " (10, 58),\n",
       " (10, 59),\n",
       " (10, 60),\n",
       " (11, 37),\n",
       " (11, 38),\n",
       " (11, 39),\n",
       " (11, 40),\n",
       " (11, 41),\n",
       " (11, 42),\n",
       " (11, 43),\n",
       " (11, 44),\n",
       " (11, 45),\n",
       " (11, 46),\n",
       " (11, 47),\n",
       " (11, 48),\n",
       " (11, 49),\n",
       " (11, 50),\n",
       " (11, 51),\n",
       " (11, 52),\n",
       " (11, 53),\n",
       " (11, 54),\n",
       " (11, 55),\n",
       " (11, 56),\n",
       " (11, 57),\n",
       " (11, 58),\n",
       " (11, 59),\n",
       " (11, 60),\n",
       " (12, 34),\n",
       " (12, 35),\n",
       " (12, 36),\n",
       " (12, 37),\n",
       " (12, 38),\n",
       " (12, 39),\n",
       " (12, 40),\n",
       " (12, 41),\n",
       " (12, 42),\n",
       " (12, 43),\n",
       " (12, 44),\n",
       " (12, 45),\n",
       " (12, 46),\n",
       " (12, 47),\n",
       " (12, 48),\n",
       " (12, 49),\n",
       " (12, 50),\n",
       " (12, 51),\n",
       " (12, 52),\n",
       " (12, 53),\n",
       " (12, 54),\n",
       " (12, 55),\n",
       " (12, 56),\n",
       " (12, 57),\n",
       " (12, 58),\n",
       " (13, 31),\n",
       " (13, 32),\n",
       " (13, 33),\n",
       " (13, 34),\n",
       " (13, 35),\n",
       " (13, 36),\n",
       " (13, 37),\n",
       " (13, 38),\n",
       " (13, 39),\n",
       " (13, 40),\n",
       " (13, 41),\n",
       " (13, 42),\n",
       " (13, 43),\n",
       " (13, 44),\n",
       " (13, 45),\n",
       " (13, 46),\n",
       " (13, 47),\n",
       " (13, 48),\n",
       " (13, 49),\n",
       " (13, 50),\n",
       " (13, 51),\n",
       " (13, 52),\n",
       " (13, 53),\n",
       " (13, 54),\n",
       " (13, 55),\n",
       " (13, 56),\n",
       " (13, 57),\n",
       " (13, 58),\n",
       " (14, 29),\n",
       " (14, 30),\n",
       " (14, 31),\n",
       " (14, 32),\n",
       " (14, 33),\n",
       " (14, 34),\n",
       " (14, 35),\n",
       " (14, 36),\n",
       " (14, 37),\n",
       " (14, 38),\n",
       " (14, 39),\n",
       " (14, 40),\n",
       " (14, 41),\n",
       " (14, 42),\n",
       " (14, 43),\n",
       " (14, 44),\n",
       " (14, 45),\n",
       " (14, 46),\n",
       " (14, 47),\n",
       " (14, 48),\n",
       " (14, 49),\n",
       " (14, 50),\n",
       " (14, 51),\n",
       " (14, 52),\n",
       " (14, 53),\n",
       " (14, 54),\n",
       " (14, 55),\n",
       " (14, 56),\n",
       " (14, 57),\n",
       " (14, 58),\n",
       " (15, 29),\n",
       " (15, 30),\n",
       " (15, 31),\n",
       " (15, 32),\n",
       " (15, 33),\n",
       " (15, 34),\n",
       " (15, 35),\n",
       " (15, 36),\n",
       " (15, 37),\n",
       " (15, 38),\n",
       " (15, 39),\n",
       " (15, 40),\n",
       " (15, 41),\n",
       " (15, 42),\n",
       " (15, 43),\n",
       " (15, 44),\n",
       " (15, 45),\n",
       " (15, 46),\n",
       " (15, 47),\n",
       " (15, 48),\n",
       " (15, 49),\n",
       " (15, 50),\n",
       " (15, 51),\n",
       " (15, 52),\n",
       " (15, 53),\n",
       " (15, 54),\n",
       " (15, 55),\n",
       " (15, 56),\n",
       " (15, 57),\n",
       " (15, 58),\n",
       " (16, 28),\n",
       " (16, 29),\n",
       " (16, 30),\n",
       " (16, 31),\n",
       " (16, 32),\n",
       " (16, 33),\n",
       " (16, 34),\n",
       " (16, 35),\n",
       " (16, 36),\n",
       " (16, 37),\n",
       " (16, 38),\n",
       " (16, 39),\n",
       " (16, 40),\n",
       " (16, 41),\n",
       " (16, 42),\n",
       " (16, 43),\n",
       " (16, 44),\n",
       " (16, 45),\n",
       " (16, 46),\n",
       " (16, 47),\n",
       " (16, 48),\n",
       " (16, 49),\n",
       " (16, 50),\n",
       " (16, 51),\n",
       " (16, 52),\n",
       " (16, 53),\n",
       " (16, 54),\n",
       " (16, 55),\n",
       " (16, 56),\n",
       " (16, 57),\n",
       " (16, 58),\n",
       " (16, 59),\n",
       " (17, 28),\n",
       " (17, 29),\n",
       " (17, 30),\n",
       " (17, 31),\n",
       " (17, 32),\n",
       " (17, 33),\n",
       " (17, 34),\n",
       " (17, 35),\n",
       " (17, 36),\n",
       " (17, 37),\n",
       " (17, 38),\n",
       " (17, 39),\n",
       " (17, 40),\n",
       " (17, 41),\n",
       " (17, 42),\n",
       " (17, 43),\n",
       " (17, 44),\n",
       " (17, 45),\n",
       " (17, 46),\n",
       " (17, 47),\n",
       " (17, 48),\n",
       " (17, 49),\n",
       " (17, 50),\n",
       " (17, 51),\n",
       " (17, 52),\n",
       " (17, 53),\n",
       " (17, 54),\n",
       " (17, 55),\n",
       " (17, 56),\n",
       " (17, 57),\n",
       " (17, 58),\n",
       " (17, 59),\n",
       " (18, 27),\n",
       " (18, 28),\n",
       " (18, 29),\n",
       " (18, 30),\n",
       " (18, 31),\n",
       " (18, 32),\n",
       " (18, 33),\n",
       " (18, 34),\n",
       " (18, 35),\n",
       " (18, 36),\n",
       " (18, 37),\n",
       " (18, 38),\n",
       " (18, 39),\n",
       " (18, 40),\n",
       " (18, 41),\n",
       " (18, 42),\n",
       " (18, 43),\n",
       " (18, 44),\n",
       " (18, 45),\n",
       " (18, 46),\n",
       " (18, 47),\n",
       " (18, 48),\n",
       " (18, 49),\n",
       " (18, 50),\n",
       " (18, 51),\n",
       " (18, 52),\n",
       " (18, 53),\n",
       " (18, 54),\n",
       " (18, 55),\n",
       " (18, 56),\n",
       " (18, 57),\n",
       " (18, 58),\n",
       " (18, 59),\n",
       " (19, 27),\n",
       " (19, 28),\n",
       " (19, 29),\n",
       " (19, 30),\n",
       " (19, 31),\n",
       " (19, 32),\n",
       " (19, 33),\n",
       " (19, 34),\n",
       " (19, 35),\n",
       " (19, 36),\n",
       " (19, 37),\n",
       " (19, 38),\n",
       " (19, 39),\n",
       " (19, 40),\n",
       " (19, 41),\n",
       " (19, 42),\n",
       " (19, 43),\n",
       " (19, 44),\n",
       " (19, 45),\n",
       " (19, 46),\n",
       " (19, 47),\n",
       " (19, 48),\n",
       " (19, 49),\n",
       " (19, 50),\n",
       " (19, 51),\n",
       " (19, 52),\n",
       " (19, 53),\n",
       " (19, 54),\n",
       " (19, 55),\n",
       " (19, 56),\n",
       " (19, 57),\n",
       " (19, 58),\n",
       " (19, 59),\n",
       " (20, 26),\n",
       " (20, 27),\n",
       " (20, 28),\n",
       " (20, 29),\n",
       " (20, 30),\n",
       " (20, 31),\n",
       " (20, 32),\n",
       " (20, 33),\n",
       " (20, 34),\n",
       " (20, 35),\n",
       " (20, 36),\n",
       " (20, 37),\n",
       " (20, 38),\n",
       " (20, 39),\n",
       " (20, 40),\n",
       " (20, 41),\n",
       " (20, 42),\n",
       " (20, 43),\n",
       " (20, 44),\n",
       " (20, 45),\n",
       " (20, 46),\n",
       " (20, 47),\n",
       " (20, 48),\n",
       " (20, 49),\n",
       " (20, 50),\n",
       " (20, 51),\n",
       " (20, 52),\n",
       " (20, 53),\n",
       " (20, 54),\n",
       " (20, 55),\n",
       " (20, 56),\n",
       " (20, 57),\n",
       " (20, 58),\n",
       " (20, 59),\n",
       " (21, 25),\n",
       " (21, 26),\n",
       " (21, 27),\n",
       " (21, 28),\n",
       " (21, 29),\n",
       " (21, 30),\n",
       " (21, 31),\n",
       " (21, 32),\n",
       " (21, 33),\n",
       " (21, 34),\n",
       " (21, 35),\n",
       " (21, 36),\n",
       " (21, 37),\n",
       " (21, 38),\n",
       " (21, 39),\n",
       " (21, 40),\n",
       " (21, 41),\n",
       " (21, 42),\n",
       " (21, 43),\n",
       " (21, 44),\n",
       " (21, 45),\n",
       " (21, 46),\n",
       " (21, 47),\n",
       " (21, 48),\n",
       " (21, 49),\n",
       " (21, 50),\n",
       " (21, 51),\n",
       " (21, 52),\n",
       " (21, 53),\n",
       " (21, 54),\n",
       " (21, 55),\n",
       " (21, 56),\n",
       " (21, 57),\n",
       " (21, 58),\n",
       " (21, 59),\n",
       " (22, 25),\n",
       " (22, 26),\n",
       " (22, 27),\n",
       " (22, 28),\n",
       " (22, 29),\n",
       " (22, 30),\n",
       " (22, 31),\n",
       " (22, 32),\n",
       " (22, 33),\n",
       " (22, 34),\n",
       " (22, 35),\n",
       " (22, 36),\n",
       " (22, 37),\n",
       " (22, 38),\n",
       " (22, 39),\n",
       " (22, 40),\n",
       " (22, 41),\n",
       " (22, 42),\n",
       " (22, 43),\n",
       " (22, 44),\n",
       " (22, 45),\n",
       " (22, 46),\n",
       " (22, 47),\n",
       " (22, 48),\n",
       " (22, 49),\n",
       " (22, 50),\n",
       " (22, 51),\n",
       " (22, 52),\n",
       " (22, 53),\n",
       " (22, 54),\n",
       " (22, 55),\n",
       " (22, 56),\n",
       " (22, 57),\n",
       " (22, 58),\n",
       " (22, 59),\n",
       " (23, 24),\n",
       " (23, 25),\n",
       " (23, 26),\n",
       " (23, 27),\n",
       " (23, 28),\n",
       " (23, 29),\n",
       " (23, 30),\n",
       " (23, 31),\n",
       " (23, 32),\n",
       " (23, 33),\n",
       " (23, 34),\n",
       " (23, 35),\n",
       " (23, 36),\n",
       " (23, 37),\n",
       " (23, 38),\n",
       " (23, 39),\n",
       " (23, 40),\n",
       " (23, 41),\n",
       " (23, 42),\n",
       " (23, 43),\n",
       " (23, 44),\n",
       " (23, 45),\n",
       " (23, 46),\n",
       " (23, 47),\n",
       " (23, 48),\n",
       " (23, 49),\n",
       " (23, 50),\n",
       " (23, 51),\n",
       " (23, 52),\n",
       " (23, 53),\n",
       " (23, 54),\n",
       " (23, 55),\n",
       " (23, 56),\n",
       " (23, 57),\n",
       " (23, 58),\n",
       " (23, 59),\n",
       " (24, 24),\n",
       " (24, 25),\n",
       " (24, 26),\n",
       " (24, 27),\n",
       " (24, 28),\n",
       " (24, 29),\n",
       " (24, 30),\n",
       " (24, 31),\n",
       " (24, 32),\n",
       " (24, 33),\n",
       " (24, 34),\n",
       " (24, 35),\n",
       " (24, 36),\n",
       " (24, 37),\n",
       " (24, 38),\n",
       " (24, 39),\n",
       " (24, 40),\n",
       " (24, 41),\n",
       " (24, 42),\n",
       " (24, 43),\n",
       " (24, 44),\n",
       " (24, 45),\n",
       " (24, 46),\n",
       " (24, 47),\n",
       " (24, 48),\n",
       " (24, 49),\n",
       " (24, 50),\n",
       " (24, 51),\n",
       " (24, 52),\n",
       " (24, 53),\n",
       " (24, 54),\n",
       " (24, 55),\n",
       " (24, 56),\n",
       " (24, 57),\n",
       " (24, 58),\n",
       " (24, 59),\n",
       " (24, 60),\n",
       " (25, 23),\n",
       " (25, 24),\n",
       " (25, 25),\n",
       " (25, 26),\n",
       " (25, 27),\n",
       " (25, 28),\n",
       " (25, 29),\n",
       " (25, 30),\n",
       " (25, 31),\n",
       " (25, 32),\n",
       " (25, 33),\n",
       " (25, 34),\n",
       " (25, 35),\n",
       " (25, 36),\n",
       " (25, 37),\n",
       " (25, 38),\n",
       " (25, 39),\n",
       " (25, 40),\n",
       " (25, 41),\n",
       " (25, 42),\n",
       " (25, 43),\n",
       " (25, 44),\n",
       " (25, 45),\n",
       " (25, 46),\n",
       " (25, 47),\n",
       " (25, 48),\n",
       " (25, 49),\n",
       " (25, 50),\n",
       " (25, 51),\n",
       " (25, 52),\n",
       " (25, 53),\n",
       " (25, 54),\n",
       " (25, 55),\n",
       " (25, 56),\n",
       " (25, 57),\n",
       " (25, 58),\n",
       " (25, 59),\n",
       " (25, 60),\n",
       " (26, 23),\n",
       " (26, 24),\n",
       " (26, 25),\n",
       " (26, 26),\n",
       " (26, 27),\n",
       " (26, 28),\n",
       " (26, 29),\n",
       " (26, 30),\n",
       " (26, 31),\n",
       " (26, 32),\n",
       " (26, 33),\n",
       " (26, 34),\n",
       " (26, 35),\n",
       " (26, 36),\n",
       " (26, 37),\n",
       " (26, 38),\n",
       " (26, 39),\n",
       " (26, 40),\n",
       " (26, 41),\n",
       " (26, 42),\n",
       " (26, 43),\n",
       " (26, 44),\n",
       " (26, 45),\n",
       " (26, 46),\n",
       " (26, 47),\n",
       " (26, 48),\n",
       " (26, 49),\n",
       " (26, 50),\n",
       " (26, 51),\n",
       " (26, 52),\n",
       " (26, 53),\n",
       " (26, 54),\n",
       " (26, 55),\n",
       " (26, 56),\n",
       " (26, 57),\n",
       " (26, 58),\n",
       " (26, 59),\n",
       " (26, 60),\n",
       " (27, 22),\n",
       " (27, 23),\n",
       " (27, 24),\n",
       " (27, 25),\n",
       " (27, 26),\n",
       " (27, 27),\n",
       " (27, 28),\n",
       " (27, 29),\n",
       " (27, 30),\n",
       " (27, 31),\n",
       " (27, 32),\n",
       " (27, 33),\n",
       " (27, 34),\n",
       " (27, 35),\n",
       " (27, 36),\n",
       " (27, 37),\n",
       " (27, 38),\n",
       " (27, 39),\n",
       " (27, 40),\n",
       " (27, 41),\n",
       " (27, 42),\n",
       " (27, 43),\n",
       " (27, 44),\n",
       " (27, 45),\n",
       " (27, 46),\n",
       " (27, 47),\n",
       " (27, 48),\n",
       " (27, 49),\n",
       " (27, 50),\n",
       " (27, 51),\n",
       " (27, 52),\n",
       " (27, 53),\n",
       " (27, 54),\n",
       " (27, 55),\n",
       " (27, 56),\n",
       " (27, 57),\n",
       " (27, 58),\n",
       " (27, 59),\n",
       " (27, 60),\n",
       " (28, 21),\n",
       " (28, 22),\n",
       " (28, 23),\n",
       " (28, 24),\n",
       " (28, 25),\n",
       " (28, 26),\n",
       " (28, 27),\n",
       " (28, 28),\n",
       " (28, 29),\n",
       " (28, 30),\n",
       " (28, 31),\n",
       " (28, 32),\n",
       " (28, 33),\n",
       " (28, 34),\n",
       " (28, 35),\n",
       " (28, 36),\n",
       " (28, 37),\n",
       " (28, 38),\n",
       " (28, 39),\n",
       " (28, 40),\n",
       " (28, 41),\n",
       " (28, 42),\n",
       " (28, 43),\n",
       " (28, 44),\n",
       " (28, 45),\n",
       " (28, 46),\n",
       " (28, 47),\n",
       " (28, 48),\n",
       " (28, 49),\n",
       " (28, 50),\n",
       " (28, 51),\n",
       " (28, 52),\n",
       " (28, 53),\n",
       " (28, 54),\n",
       " (28, 55),\n",
       " (28, 56),\n",
       " (28, 57),\n",
       " (28, 58),\n",
       " (28, 59),\n",
       " (28, 60),\n",
       " (29, 21),\n",
       " (29, 22),\n",
       " (29, 23),\n",
       " (29, 24),\n",
       " (29, 25),\n",
       " (29, 26),\n",
       " (29, 27),\n",
       " (29, 28),\n",
       " (29, 29),\n",
       " (29, 30),\n",
       " (29, 31),\n",
       " (29, 32),\n",
       " (29, 33),\n",
       " (29, 34),\n",
       " (29, 35),\n",
       " (29, 36),\n",
       " (29, 37),\n",
       " (29, 38),\n",
       " (29, 39),\n",
       " (29, 40),\n",
       " (29, 41),\n",
       " (29, 42),\n",
       " (29, 43),\n",
       " (29, 44),\n",
       " (29, 45),\n",
       " (29, 46),\n",
       " (29, 47),\n",
       " (29, 48),\n",
       " (29, 49),\n",
       " (29, 50),\n",
       " (29, 51),\n",
       " (29, 52),\n",
       " (29, 53),\n",
       " (29, 54),\n",
       " (29, 55),\n",
       " (29, 56),\n",
       " (29, 57),\n",
       " (29, 58),\n",
       " (29, 59),\n",
       " (29, 60),\n",
       " (30, 20),\n",
       " (30, 21),\n",
       " (30, 22),\n",
       " (30, 23),\n",
       " (30, 24),\n",
       " (30, 25),\n",
       " (30, 26),\n",
       " (30, 27),\n",
       " (30, 28),\n",
       " (30, 29),\n",
       " (30, 30),\n",
       " (30, 31),\n",
       " (30, 32),\n",
       " (30, 33),\n",
       " (30, 34),\n",
       " (30, 35),\n",
       " (30, 36),\n",
       " (30, 37),\n",
       " (30, 38),\n",
       " (30, 39),\n",
       " (30, 40),\n",
       " (30, 41),\n",
       " (30, 42),\n",
       " (30, 43),\n",
       " (30, 44),\n",
       " (30, 45),\n",
       " (30, 46),\n",
       " (30, 47),\n",
       " (30, 48),\n",
       " (30, 49),\n",
       " (30, 50),\n",
       " (30, 51),\n",
       " (30, 52),\n",
       " (30, 53),\n",
       " (30, 54),\n",
       " (30, 55),\n",
       " (30, 56),\n",
       " (30, 57),\n",
       " (30, 58),\n",
       " (30, 59),\n",
       " (30, 60),\n",
       " (31, 20),\n",
       " (31, 21),\n",
       " (31, 22),\n",
       " (31, 23),\n",
       " (31, 24),\n",
       " (31, 25),\n",
       " (31, 26),\n",
       " (31, 27),\n",
       " (31, 28),\n",
       " (31, 29),\n",
       " (31, 30),\n",
       " (31, 31),\n",
       " (31, 32),\n",
       " (31, 33),\n",
       " (31, 34),\n",
       " (31, 35),\n",
       " (31, 36),\n",
       " (31, 37),\n",
       " (31, 38),\n",
       " (31, 39),\n",
       " (31, 40),\n",
       " (31, 41),\n",
       " (31, 42),\n",
       " (31, 43),\n",
       " (31, 44),\n",
       " (31, 45),\n",
       " (31, 46),\n",
       " (31, 47),\n",
       " (31, 48),\n",
       " (31, 49),\n",
       " (31, 50),\n",
       " (31, 51),\n",
       " (31, 52),\n",
       " (31, 53),\n",
       " (31, 54),\n",
       " (31, 55),\n",
       " (31, 56),\n",
       " (31, 57),\n",
       " (31, 58),\n",
       " (31, 59),\n",
       " (31, 60),\n",
       " (31, 61),\n",
       " (32, 19),\n",
       " (32, 20),\n",
       " (32, 21),\n",
       " (32, 22),\n",
       " (32, 23),\n",
       " (32, 24),\n",
       " (32, 25),\n",
       " (32, 26),\n",
       " (32, 27),\n",
       " (32, 28),\n",
       " (32, 29),\n",
       " (32, 30),\n",
       " (32, 31),\n",
       " (32, 32),\n",
       " (32, 33),\n",
       " (32, 34),\n",
       " (32, 35),\n",
       " (32, 36),\n",
       " (32, 37),\n",
       " (32, 38),\n",
       " (32, 39),\n",
       " (32, 40),\n",
       " (32, 41),\n",
       " (32, 42),\n",
       " (32, 43),\n",
       " (32, 44),\n",
       " (32, 45),\n",
       " (32, 46),\n",
       " (32, 47),\n",
       " (32, 48),\n",
       " (32, 49),\n",
       " (32, 50),\n",
       " (32, 51),\n",
       " (32, 52),\n",
       " (32, 53),\n",
       " (32, 54),\n",
       " (32, 55),\n",
       " (32, 56),\n",
       " (32, 57),\n",
       " (32, 58),\n",
       " (32, 59),\n",
       " (32, 60),\n",
       " (32, 61),\n",
       " (32, 62),\n",
       " (33, 19),\n",
       " (33, 20),\n",
       " (33, 21),\n",
       " (33, 22),\n",
       " (33, 23),\n",
       " (33, 24),\n",
       " (33, 25),\n",
       " (33, 26),\n",
       " (33, 27),\n",
       " (33, 28),\n",
       " (33, 29),\n",
       " (33, 30),\n",
       " (33, 31),\n",
       " (33, 32),\n",
       " (33, 33),\n",
       " (33, 34),\n",
       " (33, 35),\n",
       " (33, 36),\n",
       " (33, 37),\n",
       " (33, 38),\n",
       " (33, 39),\n",
       " (33, 40),\n",
       " (33, 41),\n",
       " (33, 42),\n",
       " (33, 43),\n",
       " (33, 44),\n",
       " (33, 45),\n",
       " (33, 46),\n",
       " (33, 47),\n",
       " (33, 48),\n",
       " (33, 49),\n",
       " (33, 50),\n",
       " (33, 51),\n",
       " (33, 52),\n",
       " (33, 53),\n",
       " (33, 54),\n",
       " (33, 55),\n",
       " (33, 56),\n",
       " (33, 57),\n",
       " (33, 58),\n",
       " (33, 59),\n",
       " (33, 60),\n",
       " (33, 61),\n",
       " (33, 62),\n",
       " (34, 18),\n",
       " (34, 19),\n",
       " (34, 20),\n",
       " (34, 21),\n",
       " (34, 22),\n",
       " (34, 23),\n",
       " (34, 24),\n",
       " (34, 25),\n",
       " (34, 26),\n",
       " (34, 27),\n",
       " (34, 28),\n",
       " (34, 29),\n",
       " (34, 30),\n",
       " (34, 31),\n",
       " (34, 32),\n",
       " (34, 33),\n",
       " (34, 34),\n",
       " (34, 35),\n",
       " (34, 36),\n",
       " (34, 37),\n",
       " (34, 38),\n",
       " (34, 39),\n",
       " (34, 40),\n",
       " (34, 41),\n",
       " (34, 42),\n",
       " (34, 43),\n",
       " (34, 44),\n",
       " (34, 45),\n",
       " (34, 46),\n",
       " (34, 47),\n",
       " (34, 48),\n",
       " (34, 49),\n",
       " (34, 50),\n",
       " (34, 51),\n",
       " (34, 52),\n",
       " (34, 53),\n",
       " (34, 54),\n",
       " (34, 55),\n",
       " (34, 56),\n",
       " (34, 57),\n",
       " (34, 58),\n",
       " (34, 59),\n",
       " (34, 60),\n",
       " (34, 61),\n",
       " (34, 62),\n",
       " (34, 63),\n",
       " (35, 18),\n",
       " (35, 19),\n",
       " (35, 20),\n",
       " (35, 21),\n",
       " (35, 22),\n",
       " (35, 23),\n",
       " (35, 24),\n",
       " (35, 25),\n",
       " (35, 26),\n",
       " (35, 27),\n",
       " (35, 28),\n",
       " (35, 29),\n",
       " (35, 30),\n",
       " (35, 31),\n",
       " (35, 32),\n",
       " (35, 33),\n",
       " (35, 34),\n",
       " (35, 35),\n",
       " (35, 36),\n",
       " (35, 37),\n",
       " (35, 38),\n",
       " (35, 39),\n",
       " (35, 40),\n",
       " (35, 41),\n",
       " (35, 42),\n",
       " ...]"
      ]
     },
     "metadata": {},
     "execution_count": 13
    }
   ],
   "metadata": {}
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "source": [
    "Nodes = pd.read_csv(Nodes_PATH)\n",
    "# index_name = Nodes.index.tolist()\n",
    "Nodes = Nodes.drop(columns=['box', 'Aux_Stops', 'Aux_Visits', 'Aux_Time'])\n"
   ],
   "outputs": [],
   "metadata": {}
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "source": [
    "Sens_features = Nodes.loc[:,['% White', '% Black']]\n",
    "Sen_index = np.invert(pd.isna(Sens_features)).to_numpy()\n",
    "Sen_index = Sen_index[:,0] * Sen_index[:,1]\n",
    "# Sens_features2 = Sens_features[Sen_index].to_numpy()\n",
    "Sens_features = Sens_features.to_numpy()\n",
    "print(f'Sen_index={Sen_index.shape}')\n",
    "print(f'Sens_features={Sens_features.shape}')\n",
    "# Sens_features_dict = {\"sfeature\": Sens_features, \"index\": Sen_index}\n",
    "Sens_features_filter = Sens_features[Sen_index, 0] / 100 ### white people ratio\n",
    "pickle.dump(Sens_features_filter, open(OUT_NODE_SFEAT, \"wb\") )\n",
    "Sen_index"
   ],
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "Sen_index=(4287,)\n",
      "Sens_features=(4287, 2)\n"
     ]
    },
    {
     "output_type": "execute_result",
     "data": {
      "text/plain": [
       "array([ True, False,  True, ..., False, False, False])"
      ]
     },
     "metadata": {},
     "execution_count": 15
    }
   ],
   "metadata": {}
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "source": [
    "index_name_filter = []\n",
    "for i in range(len(Sen_index)):\n",
    "    if Sen_index[i]:\n",
    "        index_name_filter.append(index_name[i])\n",
    "len(index_name_filter)"
   ],
   "outputs": [
    {
     "output_type": "execute_result",
     "data": {
      "text/plain": [
       "4204"
      ]
     },
     "metadata": {},
     "execution_count": 16
    }
   ],
   "metadata": {}
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "source": [
    "### save Nodes features\n",
    "Nodes_features_filter = Nodes.iloc[Sen_index,0:36].to_numpy()\n",
    "np.save(OUT_NODE_FEAT, Nodes_features_filter)\n",
    "Nodes_features_filter.shape"
   ],
   "outputs": [
    {
     "output_type": "execute_result",
     "data": {
      "text/plain": [
       "(4204, 36)"
      ]
     },
     "metadata": {},
     "execution_count": 17
    }
   ],
   "metadata": {}
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "source": [
    "### save Nodes labels\n",
    "Nodes_labels = Nodes['Per capita income'].to_numpy()\n",
    "Label_index = np.invert(pd.isna(Nodes_labels))\n",
    "Nodes_labels = (Nodes_labels > np.median(Nodes_labels[Label_index])).astype(int)\n",
    "Nodes_labels_filter = Nodes_labels[Sen_index]\n",
    "np.save(OUT_NODE_label, Nodes_labels_filter)\n",
    "Nodes_labels_filter"
   ],
   "outputs": [
    {
     "output_type": "execute_result",
     "data": {
      "text/plain": [
       "array([0, 0, 0, ..., 1, 1, 1])"
      ]
     },
     "metadata": {},
     "execution_count": 18
    }
   ],
   "metadata": {}
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "source": [
    "### save Nodes labels 2\n",
    "Nodes_labels = Nodes['Per capita income'].to_numpy()\n",
    "Label_index = np.invert(pd.isna(Nodes_labels))\n",
    "# Nodes_labels = (Nodes_labels > np.median(Nodes_labels[Label_index])).astype(int)\n",
    "Nodes_labels_filter2 = Nodes_labels[Sen_index]\n",
    "Nodes_labels_filter2 = Nodes_labels_filter2 / np.max(Nodes_labels_filter2)\n",
    "np.save(OUT_NODE_label2, Nodes_labels_filter2)\n",
    "Nodes_labels_filter2"
   ],
   "outputs": [
    {
     "output_type": "execute_result",
     "data": {
      "text/plain": [
       "array([0.16591755, 0.16591755, 0.16591755, ..., 0.20307876, 0.19884808,\n",
       "       0.20307876])"
      ]
     },
     "metadata": {},
     "execution_count": 19
    }
   ],
   "metadata": {}
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "source": [
    "start_date = '2017-09-01'\n",
    "date_1 = datetime.datetime.strptime(start_date, \"%Y-%m-%d\")\n",
    "\n",
    "count = 0 \n",
    "sum = 0\n",
    "ratio = 0.1\n",
    "for time_index in range(time_duration):\n",
    "    end_date = date_1 + datetime.timedelta(days=time_index)\n",
    "    end_date = end_date.strftime(\"%Y-%m-%d\")\n",
    "    Links_PATH = data_root_path + 'Links/{}.csv'.format(end_date)\n",
    "    Links = pd.read_csv(Links_PATH)\n",
    "    count += Links.shape[0]\n",
    "    num_link = math.floor(ratio*Links.shape[0])\n",
    "    sum += np.sum(Links.iloc[:num_link, 5])\n",
    "\n",
    "count_th = sum / count\n",
    "Links"
   ],
   "outputs": [
    {
     "output_type": "execute_result",
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>Origin_ID</th>\n",
       "      <th>Destination_ID</th>\n",
       "      <th>Date</th>\n",
       "      <th>Time</th>\n",
       "      <th>Count</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>(46, 64)</td>\n",
       "      <td>(46, 64)</td>\n",
       "      <td>2017-09-01</td>\n",
       "      <td>12</td>\n",
       "      <td>38</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>(44, 39)</td>\n",
       "      <td>(44, 39)</td>\n",
       "      <td>2017-09-01</td>\n",
       "      <td>20</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>(26, 47)</td>\n",
       "      <td>(51, 23)</td>\n",
       "      <td>2017-09-01</td>\n",
       "      <td>8</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>(51, 23)</td>\n",
       "      <td>(51, 23)</td>\n",
       "      <td>2017-09-01</td>\n",
       "      <td>12</td>\n",
       "      <td>35</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>(51, 23)</td>\n",
       "      <td>(34, 44)</td>\n",
       "      <td>2017-09-01</td>\n",
       "      <td>20</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>355497</th>\n",
       "      <td>355497</td>\n",
       "      <td>(42, 37)</td>\n",
       "      <td>(39, 45)</td>\n",
       "      <td>2017-09-01</td>\n",
       "      <td>8</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>355498</th>\n",
       "      <td>355498</td>\n",
       "      <td>(38, 55)</td>\n",
       "      <td>(36, 51)</td>\n",
       "      <td>2017-09-01</td>\n",
       "      <td>8</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>355499</th>\n",
       "      <td>355499</td>\n",
       "      <td>(36, 51)</td>\n",
       "      <td>(37, 54)</td>\n",
       "      <td>2017-09-01</td>\n",
       "      <td>8</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>355500</th>\n",
       "      <td>355500</td>\n",
       "      <td>(17, 27)</td>\n",
       "      <td>(18, 26)</td>\n",
       "      <td>2017-09-01</td>\n",
       "      <td>8</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>355501</th>\n",
       "      <td>355501</td>\n",
       "      <td>(53, 18)</td>\n",
       "      <td>(43, 7)</td>\n",
       "      <td>2017-09-01</td>\n",
       "      <td>8</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>355502 rows × 6 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "        Unnamed: 0 Origin_ID Destination_ID        Date  Time  Count\n",
       "0                0  (46, 64)       (46, 64)  2017-09-01    12     38\n",
       "1                1  (44, 39)       (44, 39)  2017-09-01    20      8\n",
       "2                2  (26, 47)       (51, 23)  2017-09-01     8      1\n",
       "3                3  (51, 23)       (51, 23)  2017-09-01    12     35\n",
       "4                4  (51, 23)       (34, 44)  2017-09-01    20      1\n",
       "...            ...       ...            ...         ...   ...    ...\n",
       "355497      355497  (42, 37)       (39, 45)  2017-09-01     8      1\n",
       "355498      355498  (38, 55)       (36, 51)  2017-09-01     8      1\n",
       "355499      355499  (36, 51)       (37, 54)  2017-09-01     8      1\n",
       "355500      355500  (17, 27)       (18, 26)  2017-09-01     8      1\n",
       "355501      355501  (53, 18)        (43, 7)  2017-09-01     8      1\n",
       "\n",
       "[355502 rows x 6 columns]"
      ]
     },
     "metadata": {},
     "execution_count": 20
    }
   ],
   "metadata": {}
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "source": [
    "u_list, i_list, ts_list, label_list = [], [], [], []\n",
    "idx_list = []\n",
    "idx = 0\n",
    "for time_index in range(time_duration):\n",
    "    end_date = date_1 + datetime.timedelta(days=time_index)\n",
    "    end_date = end_date.strftime(\"%Y-%m-%d\")\n",
    "    Links_PATH = data_root_path + 'Links/{}.csv'.format(end_date)\n",
    "    Links = pd.read_csv(Links_PATH)\n",
    "    num_link = math.floor(ratio*Links.shape[0])\n",
    "    for index in range(num_link):\n",
    "        src = eval(Links.iloc[index, 1])\n",
    "        des = eval(Links.iloc[index, 2])\n",
    "        if src in index_name_filter and des in index_name_filter and src != des:\n",
    "            u = index_name_filter.index(src)\n",
    "            i = index_name_filter.index(des)\n",
    "            if Sen_index[u] and Sen_index[i]:\n",
    "                ts = (time_index * 24 + Links.iloc[index, 4]) / 4\n",
    "                label = int(Links.iloc[index, 5] > count_th)\n",
    "                idx += 1\n",
    "\n",
    "                u_list.append(u)\n",
    "                i_list.append(i)\n",
    "                ts_list.append(ts)\n",
    "                label_list.append(label)\n",
    "                idx_list.append(idx)\n",
    "\n",
    "E_feat = pd.DataFrame({'u': u_list, \n",
    "                    'i':i_list, \n",
    "                    'ts':ts_list, \n",
    "                    'label':label_list, \n",
    "                    'idx':idx_list})\n",
    "E_feat.to_csv(OUT_DF)\n",
    "E_feat"
   ],
   "outputs": [
    {
     "output_type": "execute_result",
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>u</th>\n",
       "      <th>i</th>\n",
       "      <th>ts</th>\n",
       "      <th>label</th>\n",
       "      <th>idx</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>610</td>\n",
       "      <td>1774</td>\n",
       "      <td>2.0</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1774</td>\n",
       "      <td>939</td>\n",
       "      <td>5.0</td>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>939</td>\n",
       "      <td>683</td>\n",
       "      <td>5.0</td>\n",
       "      <td>1</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>1232</td>\n",
       "      <td>1281</td>\n",
       "      <td>5.0</td>\n",
       "      <td>1</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1281</td>\n",
       "      <td>1495</td>\n",
       "      <td>5.0</td>\n",
       "      <td>1</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19941</th>\n",
       "      <td>134</td>\n",
       "      <td>309</td>\n",
       "      <td>3.0</td>\n",
       "      <td>1</td>\n",
       "      <td>19942</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19942</th>\n",
       "      <td>309</td>\n",
       "      <td>134</td>\n",
       "      <td>4.0</td>\n",
       "      <td>1</td>\n",
       "      <td>19943</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19943</th>\n",
       "      <td>2865</td>\n",
       "      <td>3060</td>\n",
       "      <td>4.0</td>\n",
       "      <td>1</td>\n",
       "      <td>19944</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19944</th>\n",
       "      <td>1267</td>\n",
       "      <td>1117</td>\n",
       "      <td>4.0</td>\n",
       "      <td>1</td>\n",
       "      <td>19945</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19945</th>\n",
       "      <td>1117</td>\n",
       "      <td>1320</td>\n",
       "      <td>4.0</td>\n",
       "      <td>1</td>\n",
       "      <td>19946</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>19946 rows × 5 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "          u     i   ts  label    idx\n",
       "0       610  1774  2.0      1      1\n",
       "1      1774   939  5.0      1      2\n",
       "2       939   683  5.0      1      3\n",
       "3      1232  1281  5.0      1      4\n",
       "4      1281  1495  5.0      1      5\n",
       "...     ...   ...  ...    ...    ...\n",
       "19941   134   309  3.0      1  19942\n",
       "19942   309   134  4.0      1  19943\n",
       "19943  2865  3060  4.0      1  19944\n",
       "19944  1267  1117  4.0      1  19945\n",
       "19945  1117  1320  4.0      1  19946\n",
       "\n",
       "[19946 rows x 5 columns]"
      ]
     },
     "metadata": {},
     "execution_count": 21
    }
   ],
   "metadata": {}
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "source": [
    "feat = np.random.uniform(0, 1, size=(E_feat.shape[0], 36))\n",
    "np.save(OUT_FEAT, feat)"
   ],
   "outputs": [],
   "metadata": {}
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "source": [
    "feat = np.load(OUT_FEAT)\n",
    "feat.shape"
   ],
   "outputs": [
    {
     "output_type": "execute_result",
     "data": {
      "text/plain": [
       "(19946, 36)"
      ]
     },
     "metadata": {},
     "execution_count": 23
    }
   ],
   "metadata": {}
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "source": [
    "np.mean(E_feat['label'])"
   ],
   "outputs": [
    {
     "output_type": "execute_result",
     "data": {
      "text/plain": [
       "1.0"
      ]
     },
     "metadata": {},
     "execution_count": 24
    }
   ],
   "metadata": {}
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "source": [],
   "outputs": [],
   "metadata": {}
  }
 ]
}