{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Content-based Filtering Model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "# For data manipulation and analysis\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "\n",
    "# For text preprocessing\n",
    "import re\n",
    "import nltk\n",
    "from nltk.corpus import stopwords\n",
    "from nltk.stem import WordNetLemmatizer\n",
    "from sklearn.feature_extraction.text import TfidfVectorizer\n",
    "import datetime\n",
    "import string\n",
    "\n",
    "# For multilabel classification\n",
    "from sklearn.preprocessing import MultiLabelBinarizer\n",
    "from sklearn.model_selection import train_test_split\n",
    "from sklearn.linear_model import LogisticRegression\n",
    "from sklearn.multiclass import OneVsRestClassifier\n",
    "from sklearn.ensemble import RandomForestClassifier\n",
    "from sklearn.naive_bayes import MultinomialNB\n",
    "from ast import literal_eval\n",
    "\n",
    "\n",
    "# For model evaluation\n",
    "from sklearn.metrics import accuracy_score, f1_score, precision_score, recall_score, classification_report, confusion_matrix"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Reading in the same user subset/df that is used in the CF model\n",
    "- Use this because we will combine the output of the CF model with this one\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "tags = pd.read_csv(\"../dataset/tags_contentbased.csv\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0.2</th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>Unnamed: 0.1</th>\n",
       "      <th>userId</th>\n",
       "      <th>movieId</th>\n",
       "      <th>tag</th>\n",
       "      <th>timestamp</th>\n",
       "      <th>un-lemmatised</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>has_glove_vec</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>7</td>\n",
       "      <td>266</td>\n",
       "      <td>318</td>\n",
       "      <td>260</td>\n",
       "      <td>s</td>\n",
       "      <td>2015-02-20 22:42:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[ 0.18209    0.88297   -0.49805    0.53137   -...</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>8</td>\n",
       "      <td>267</td>\n",
       "      <td>318</td>\n",
       "      <td>115149</td>\n",
       "      <td>action</td>\n",
       "      <td>2015-02-21 15:58:30</td>\n",
       "      <td>action</td>\n",
       "      <td>[ 2.0240e-02  8.4992e-01 -7.8150e-01 -8.2769e-...</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>15</td>\n",
       "      <td>274</td>\n",
       "      <td>320</td>\n",
       "      <td>2762</td>\n",
       "      <td>twist</td>\n",
       "      <td>2006-04-25 11:33:52</td>\n",
       "      <td>twist</td>\n",
       "      <td>[-9.5859e-02 -1.7472e-01 -3.4692e-02 -3.7307e-...</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>16</td>\n",
       "      <td>275</td>\n",
       "      <td>320</td>\n",
       "      <td>2959</td>\n",
       "      <td>twist</td>\n",
       "      <td>2006-04-25 11:30:58</td>\n",
       "      <td>twist</td>\n",
       "      <td>[-9.5859e-02 -1.7472e-01 -3.4692e-02 -3.7307e-...</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>17</td>\n",
       "      <td>276</td>\n",
       "      <td>320</td>\n",
       "      <td>3996</td>\n",
       "      <td>overrate</td>\n",
       "      <td>2006-04-25 11:32:28</td>\n",
       "      <td>overrated</td>\n",
       "      <td>[ 2.8151e-01 -4.2171e-01 -3.8275e-01  1.5364e-...</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50186</th>\n",
       "      <td>50186</td>\n",
       "      <td>109306</td>\n",
       "      <td>390955</td>\n",
       "      <td>138280</td>\n",
       "      <td>116797</td>\n",
       "      <td>history</td>\n",
       "      <td>2015-01-30 23:07:25</td>\n",
       "      <td>history</td>\n",
       "      <td>[ 4.5847e-02  7.4334e-02  1.5092e-02 -2.6392e-...</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50187</th>\n",
       "      <td>50187</td>\n",
       "      <td>109307</td>\n",
       "      <td>390956</td>\n",
       "      <td>138280</td>\n",
       "      <td>116797</td>\n",
       "      <td>informatics</td>\n",
       "      <td>2015-01-30 23:07:35</td>\n",
       "      <td>informatics</td>\n",
       "      <td>[ 1.7728e-01  1.5395e-01  7.7811e-01  1.6527e-...</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50188</th>\n",
       "      <td>50188</td>\n",
       "      <td>109308</td>\n",
       "      <td>390957</td>\n",
       "      <td>138280</td>\n",
       "      <td>116797</td>\n",
       "      <td>mathematics</td>\n",
       "      <td>2015-01-30 23:07:17</td>\n",
       "      <td>mathematics</td>\n",
       "      <td>[ 1.0033e+00  3.8874e-01  6.4312e-01 -6.8630e-...</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50189</th>\n",
       "      <td>50189</td>\n",
       "      <td>109310</td>\n",
       "      <td>390959</td>\n",
       "      <td>138280</td>\n",
       "      <td>117871</td>\n",
       "      <td>image</td>\n",
       "      <td>2015-01-30 23:09:16</td>\n",
       "      <td>image</td>\n",
       "      <td>[ 1.1091e-02  4.8461e-01  1.9142e-02  8.3725e-...</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50190</th>\n",
       "      <td>50190</td>\n",
       "      <td>109311</td>\n",
       "      <td>390960</td>\n",
       "      <td>138280</td>\n",
       "      <td>117871</td>\n",
       "      <td>story</td>\n",
       "      <td>2015-01-30 23:09:25</td>\n",
       "      <td>story</td>\n",
       "      <td>[-0.35058    0.58245   -0.065584  -0.41768    ...</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>50191 rows × 10 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "       Unnamed: 0.2  Unnamed: 0  Unnamed: 0.1  userId  movieId          tag  \\\n",
       "0                 0           7           266     318      260            s   \n",
       "1                 1           8           267     318   115149       action   \n",
       "2                 2          15           274     320     2762        twist   \n",
       "3                 3          16           275     320     2959        twist   \n",
       "4                 4          17           276     320     3996     overrate   \n",
       "...             ...         ...           ...     ...      ...          ...   \n",
       "50186         50186      109306        390955  138280   116797      history   \n",
       "50187         50187      109307        390956  138280   116797  informatics   \n",
       "50188         50188      109308        390957  138280   116797  mathematics   \n",
       "50189         50189      109310        390959  138280   117871        image   \n",
       "50190         50190      109311        390960  138280   117871        story   \n",
       "\n",
       "                 timestamp un-lemmatised  \\\n",
       "0      2015-02-20 22:42:49           NaN   \n",
       "1      2015-02-21 15:58:30        action   \n",
       "2      2006-04-25 11:33:52         twist   \n",
       "3      2006-04-25 11:30:58         twist   \n",
       "4      2006-04-25 11:32:28     overrated   \n",
       "...                    ...           ...   \n",
       "50186  2015-01-30 23:07:25       history   \n",
       "50187  2015-01-30 23:07:35   informatics   \n",
       "50188  2015-01-30 23:07:17   mathematics   \n",
       "50189  2015-01-30 23:09:16         image   \n",
       "50190  2015-01-30 23:09:25         story   \n",
       "\n",
       "                                               glove_vec  has_glove_vec  \n",
       "0      [ 0.18209    0.88297   -0.49805    0.53137   -...           True  \n",
       "1      [ 2.0240e-02  8.4992e-01 -7.8150e-01 -8.2769e-...           True  \n",
       "2      [-9.5859e-02 -1.7472e-01 -3.4692e-02 -3.7307e-...           True  \n",
       "3      [-9.5859e-02 -1.7472e-01 -3.4692e-02 -3.7307e-...           True  \n",
       "4      [ 2.8151e-01 -4.2171e-01 -3.8275e-01  1.5364e-...           True  \n",
       "...                                                  ...            ...  \n",
       "50186  [ 4.5847e-02  7.4334e-02  1.5092e-02 -2.6392e-...           True  \n",
       "50187  [ 1.7728e-01  1.5395e-01  7.7811e-01  1.6527e-...           True  \n",
       "50188  [ 1.0033e+00  3.8874e-01  6.4312e-01 -6.8630e-...           True  \n",
       "50189  [ 1.1091e-02  4.8461e-01  1.9142e-02  8.3725e-...           True  \n",
       "50190  [-0.35058    0.58245   -0.065584  -0.41768    ...           True  \n",
       "\n",
       "[50191 rows x 10 columns]"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tags"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "# filtering here - the movie dataframe to only include the movies in the subset: "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "movies = pd.read_csv(\"../dataset/ml-20m/movies.csv\")\n",
    "# Inner join on 'movieId'\n",
    "filtered_movies_df = pd.merge(movies, tags[['movieId']].drop_duplicates(), on='movieId', how='inner')\n",
    "\n",
    "# Now, filtered_movies_df will only contain the movies that are also present in tags['movieId']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "filtered_movies_df.to_csv(\"../dataset/ml-20m/filtered_movies.csv\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Content based analysis\n",
    "- remove duplicates\n",
    "- Semantic\n",
    "    - GloVe vectors - same gloVe vectors from previous\n",
    "    - POS tagging\n",
    "    - NER - entities\n",
    "    - Tag Frequency \n",
    "  "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "# removal of duplicates\n",
    "words = tags[[\"tag\", \"glove_vec\"]]\n",
    "words = words.drop_duplicates()\n",
    "\n",
    "words_ul = tags[[\"tag\", \"un-lemmatised\", \"glove_vec\"]] # unlemmatised words\n",
    "words_ul = words_ul.drop_duplicates()\n",
    "\n",
    "def custom_parser(vec_str):\n",
    "    # Remove the square brackets and split the string by spaces\n",
    "    numbers = vec_str[1:-1].split()\n",
    "    \n",
    "    # Convert strings to floats and create a numpy array\n",
    "    return np.array([float(num) for num in numbers])\n",
    "\n",
    "\n",
    "words['glove_vec'] = words['glove_vec'].apply(custom_parser)\n",
    "words_ul['glove_vec'] = words_ul['glove_vec'].apply(custom_parser)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "# words['ner_label'] = \"\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tag</th>\n",
       "      <th>glove_vec</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>s</td>\n",
       "      <td>[0.18209, 0.88297, -0.49805, 0.53137, -0.36084...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>action</td>\n",
       "      <td>[0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>twist</td>\n",
       "      <td>[-0.095859, -0.17472, -0.034692, -0.37307, 0.3...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>overrate</td>\n",
       "      <td>[0.28151, -0.42171, -0.38275, 0.15364, -0.7648...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>violent</td>\n",
       "      <td>[0.13693, 0.1856, -0.65335, -0.50922, -0.18431...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>142</th>\n",
       "      <td>suicide</td>\n",
       "      <td>[-0.31681, 0.34677, -0.5601, -0.06169, 0.11104...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>143</th>\n",
       "      <td>depress</td>\n",
       "      <td>[0.34005, 0.62285, 0.0054628, 0.76742, 0.5336,...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>144</th>\n",
       "      <td>psychodrama</td>\n",
       "      <td>[-0.20147, 0.14485, 0.36897, 0.51262, 0.4073, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>146</th>\n",
       "      <td>melancholy</td>\n",
       "      <td>[0.056755, -0.31458, 0.62357, -0.42678, 0.4501...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>149</th>\n",
       "      <td>weird</td>\n",
       "      <td>[0.30121, -0.20263, -0.084793, -0.5863, 0.1901...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>80 rows × 2 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "             tag                                          glove_vec\n",
       "0              s  [0.18209, 0.88297, -0.49805, 0.53137, -0.36084...\n",
       "1         action  [0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...\n",
       "2          twist  [-0.095859, -0.17472, -0.034692, -0.37307, 0.3...\n",
       "4       overrate  [0.28151, -0.42171, -0.38275, 0.15364, -0.7648...\n",
       "5        violent  [0.13693, 0.1856, -0.65335, -0.50922, -0.18431...\n",
       "..           ...                                                ...\n",
       "142      suicide  [-0.31681, 0.34677, -0.5601, -0.06169, 0.11104...\n",
       "143      depress  [0.34005, 0.62285, 0.0054628, 0.76742, 0.5336,...\n",
       "144  psychodrama  [-0.20147, 0.14485, 0.36897, 0.51262, 0.4073, ...\n",
       "146   melancholy  [0.056755, -0.31458, 0.62357, -0.42678, 0.4501...\n",
       "149        weird  [0.30121, -0.20263, -0.084793, -0.5863, 0.1901...\n",
       "\n",
       "[80 rows x 2 columns]"
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "words.head(80)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tag</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>ner_label</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>s</td>\n",
       "      <td>[0.18209, 0.88297, -0.49805, 0.53137, -0.36084...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>action</td>\n",
       "      <td>[0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>twist</td>\n",
       "      <td>[-0.095859, -0.17472, -0.034692, -0.37307, 0.3...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>overrate</td>\n",
       "      <td>[0.28151, -0.42171, -0.38275, 0.15364, -0.7648...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>violent</td>\n",
       "      <td>[0.13693, 0.1856, -0.65335, -0.50922, -0.18431...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50062</th>\n",
       "      <td>newspaper</td>\n",
       "      <td>[-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50110</th>\n",
       "      <td>static</td>\n",
       "      <td>[0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50139</th>\n",
       "      <td>repeat</td>\n",
       "      <td>[0.48671, 0.93464, -0.015418, -0.46056, -0.152...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50142</th>\n",
       "      <td>seal</td>\n",
       "      <td>[-0.35434, 0.51161, -0.086652, -0.23459, 0.435...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50176</th>\n",
       "      <td>counterespionage</td>\n",
       "      <td>[0.11309, -0.8528, -0.25529, 0.02635, -0.30105...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>2899 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                    tag                                          glove_vec  \\\n",
       "0                     s  [0.18209, 0.88297, -0.49805, 0.53137, -0.36084...   \n",
       "1                action  [0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...   \n",
       "2                 twist  [-0.095859, -0.17472, -0.034692, -0.37307, 0.3...   \n",
       "4              overrate  [0.28151, -0.42171, -0.38275, 0.15364, -0.7648...   \n",
       "5               violent  [0.13693, 0.1856, -0.65335, -0.50922, -0.18431...   \n",
       "...                 ...                                                ...   \n",
       "50062         newspaper  [-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...   \n",
       "50110            static  [0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...   \n",
       "50139            repeat  [0.48671, 0.93464, -0.015418, -0.46056, -0.152...   \n",
       "50142              seal  [-0.35434, 0.51161, -0.086652, -0.23459, 0.435...   \n",
       "50176  counterespionage  [0.11309, -0.8528, -0.25529, 0.02635, -0.30105...   \n",
       "\n",
       "      ner_label  \n",
       "0           NaN  \n",
       "1           NaN  \n",
       "2           NaN  \n",
       "4           NaN  \n",
       "5           NaN  \n",
       "...         ...  \n",
       "50062       NaN  \n",
       "50110       NaN  \n",
       "50139       NaN  \n",
       "50142       NaN  \n",
       "50176       NaN  \n",
       "\n",
       "[2899 rows x 3 columns]"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# manually labelling some of the words\n",
    "\n",
    "# Dictionary for NER labels\n",
    "ner_labels = {\n",
    "    'childish': 'O',\n",
    "    'location': 'O',\n",
    "    'sibling': 'O',\n",
    "    'musical': 'PROD',\n",
    "    'corporation': 'O',\n",
    "    'rape': 'O',\n",
    "    'romance': 'PROD',\n",
    "    'heartwarming': 'O',\n",
    "    'character': 'O',\n",
    "    'animation': 'PROD',\n",
    "    'feminist': 'O',\n",
    "    'cave': 'LOC',\n",
    "    'time': 'O',\n",
    "    'india': 'LOC',\n",
    "    'friend': 'PER',\n",
    "    'thailand': 'LOC',\n",
    "    'cooking': 'O',\n",
    "    'twitter': 'CORP',\n",
    "    'photography': 'CW',\n",
    "    'drum' : 'PROD',\n",
    "    'prince' : 'PER',\n",
    "    'lion' : 'O',\n",
    "    'favourite' : 'O',\n",
    "    'groundbreaking' : 'O',\n",
    "    'burlesque' : 'CW'\n",
    "    }\n",
    "\n",
    "\n",
    "words['ner_label'] = words['tag'].map(ner_labels)\n",
    "words"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Separate the labelled and unlabelled data"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "##### Named Entity Recognition\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**Active Learner Model from MoDAL**\n",
    "0. Set aside some of the labelled dataset as a validation set. \n",
    "    - This validation set is used to evaluate the model at each iteration.\n",
    "    - Provides insights into whether training should stop.\n",
    "1. Split 'words' into an initial labeled set and a larger unlabeled set.\n",
    "2. Train a model on the labeled set.\n",
    "3. Use the model to rank the unlabeled data based on uncertainty or informativeness.\n",
    "4. Manually label the top-N most uncertain/informative samples.\n",
    "5. Add these newly labeled samples to the labeled set.\n",
    "6. Repeat steps 2-5 until you meet one of the stopping criteria.\n",
    "\n",
    "\n",
    "MoDAL code: https://modal-python.readthedocs.io/en/latest/content/examples/query_by_committee.html"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Active Learning Loop:\n",
    "- Query the most informative samples.\n",
    "- Label the queried samples.\n",
    "- Train the model on the labeled data.\n",
    "- Evaluate the model on the validation set.\n",
    "- Record the performance (e.g., accuracy, F1-score).\n",
    "- If the performance plateaus or starts degrading, consider stopping the active learning process."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Assuming 'words' is a pandas DataFrame\n",
    "split_index = int(0.8 * len(words))  # Split at 80% for training, 20% for validation\n",
    "\n",
    "# Splitting the dataframe deterministically\n",
    "train_df = words.iloc[:split_index]\n",
    "valid_df = words.iloc[split_index:]\n",
    "\n",
    "valid_df.to_csv(\"../dataset/to_label_ner/validation_df.csv\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [],
   "source": [
    "valid_df = pd.read_csv(\"../dataset/to_label_ner/validation_df_done.csv\")\n",
    "valid_df['glove_vec'] = valid_df['glove_vec'].apply(custom_parser)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>tag</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>ner_label</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>26472</td>\n",
       "      <td>ontario</td>\n",
       "      <td>[-0.32533, -0.18209, -0.021454, 0.16194, -0.07...</td>\n",
       "      <td>LOC</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>26484</td>\n",
       "      <td>underworld</td>\n",
       "      <td>[-0.045434, 0.27666, -0.21188, 0.36246, -0.237...</td>\n",
       "      <td>CW</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>26486</td>\n",
       "      <td>mechanic</td>\n",
       "      <td>[0.20201, 0.031268, 0.18269, -0.28702, 0.3244,...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>26488</td>\n",
       "      <td>scientist</td>\n",
       "      <td>[-0.55698, -0.16186, 0.31294, -0.85187, 0.8522...</td>\n",
       "      <td>PER</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>26495</td>\n",
       "      <td>training</td>\n",
       "      <td>[0.11191, -0.51417, 0.17269, -0.56873, 0.09914...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>575</th>\n",
       "      <td>50062</td>\n",
       "      <td>newspaper</td>\n",
       "      <td>[-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>576</th>\n",
       "      <td>50110</td>\n",
       "      <td>static</td>\n",
       "      <td>[0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>577</th>\n",
       "      <td>50139</td>\n",
       "      <td>repeat</td>\n",
       "      <td>[0.48671, 0.93464, -0.015418, -0.46056, -0.152...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>578</th>\n",
       "      <td>50142</td>\n",
       "      <td>seal</td>\n",
       "      <td>[-0.35434, 0.51161, -0.086652, -0.23459, 0.435...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>579</th>\n",
       "      <td>50176</td>\n",
       "      <td>counterespionage</td>\n",
       "      <td>[0.11309, -0.8528, -0.25529, 0.02635, -0.30105...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>580 rows × 4 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     Unnamed: 0               tag  \\\n",
       "0         26472           ontario   \n",
       "1         26484        underworld   \n",
       "2         26486          mechanic   \n",
       "3         26488         scientist   \n",
       "4         26495          training   \n",
       "..          ...               ...   \n",
       "575       50062         newspaper   \n",
       "576       50110            static   \n",
       "577       50139            repeat   \n",
       "578       50142              seal   \n",
       "579       50176  counterespionage   \n",
       "\n",
       "                                             glove_vec ner_label  \n",
       "0    [-0.32533, -0.18209, -0.021454, 0.16194, -0.07...       LOC  \n",
       "1    [-0.045434, 0.27666, -0.21188, 0.36246, -0.237...        CW  \n",
       "2    [0.20201, 0.031268, 0.18269, -0.28702, 0.3244,...         O  \n",
       "3    [-0.55698, -0.16186, 0.31294, -0.85187, 0.8522...       PER  \n",
       "4    [0.11191, -0.51417, 0.17269, -0.56873, 0.09914...         O  \n",
       "..                                                 ...       ...  \n",
       "575  [-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...         O  \n",
       "576  [0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...         O  \n",
       "577  [0.48671, 0.93464, -0.015418, -0.46056, -0.152...         O  \n",
       "578  [-0.35434, 0.51161, -0.086652, -0.23459, 0.435...         O  \n",
       "579  [0.11309, -0.8528, -0.25529, 0.02635, -0.30105...         O  \n",
       "\n",
       "[580 rows x 4 columns]"
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "valid_df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tag</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>ner_label</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>s</td>\n",
       "      <td>[0.18209, 0.88297, -0.49805, 0.53137, -0.36084...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>action</td>\n",
       "      <td>[0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>twist</td>\n",
       "      <td>[-0.095859, -0.17472, -0.034692, -0.37307, 0.3...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>overrate</td>\n",
       "      <td>[0.28151, -0.42171, -0.38275, 0.15364, -0.7648...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>violent</td>\n",
       "      <td>[0.13693, 0.1856, -0.65335, -0.50922, -0.18431...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50062</th>\n",
       "      <td>newspaper</td>\n",
       "      <td>[-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50110</th>\n",
       "      <td>static</td>\n",
       "      <td>[0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50139</th>\n",
       "      <td>repeat</td>\n",
       "      <td>[0.48671, 0.93464, -0.015418, -0.46056, -0.152...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50142</th>\n",
       "      <td>seal</td>\n",
       "      <td>[-0.35434, 0.51161, -0.086652, -0.23459, 0.435...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50176</th>\n",
       "      <td>counterespionage</td>\n",
       "      <td>[0.11309, -0.8528, -0.25529, 0.02635, -0.30105...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>2899 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                    tag                                          glove_vec  \\\n",
       "0                     s  [0.18209, 0.88297, -0.49805, 0.53137, -0.36084...   \n",
       "1                action  [0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...   \n",
       "2                 twist  [-0.095859, -0.17472, -0.034692, -0.37307, 0.3...   \n",
       "4              overrate  [0.28151, -0.42171, -0.38275, 0.15364, -0.7648...   \n",
       "5               violent  [0.13693, 0.1856, -0.65335, -0.50922, -0.18431...   \n",
       "...                 ...                                                ...   \n",
       "50062         newspaper  [-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...   \n",
       "50110            static  [0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...   \n",
       "50139            repeat  [0.48671, 0.93464, -0.015418, -0.46056, -0.152...   \n",
       "50142              seal  [-0.35434, 0.51161, -0.086652, -0.23459, 0.435...   \n",
       "50176  counterespionage  [0.11309, -0.8528, -0.25529, 0.02635, -0.30105...   \n",
       "\n",
       "      ner_label  \n",
       "0           NaN  \n",
       "1           NaN  \n",
       "2           NaN  \n",
       "4           NaN  \n",
       "5           NaN  \n",
       "...         ...  \n",
       "50062       NaN  \n",
       "50110       NaN  \n",
       "50139       NaN  \n",
       "50142       NaN  \n",
       "50176       NaN  \n",
       "\n",
       "[2899 rows x 3 columns]"
      ]
     },
     "execution_count": 14,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "words"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [],
   "source": [
    "X_valid = pd.DataFrame(valid_df['glove_vec'].tolist()).to_numpy()\n",
    "y_valid = valid_df['ner_label'].to_numpy()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "22"
      ]
     },
     "execution_count": 20,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# train_df['ner_label'] = train_df['ner_label'].replace(\" \", np.nan)\n",
    "sum(train_df['ner_label'].notna())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "### ITERATION 1 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_1.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 1: 0.7913793103448276\n",
      "### ITERATION 2 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_2.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 2: 0.8137931034482758\n",
      "### ITERATION 3 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_3.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 3: 0.8068965517241379\n",
      "### ITERATION 4 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_4.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 4: 0.8120689655172414\n",
      "### ITERATION 5 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_5.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 5: 0.8051724137931034\n",
      "### ITERATION 6 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_6.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 6: 0.8017241379310345\n",
      "### ITERATION 7 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_7.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 7: 0.8051724137931034\n",
      "### ITERATION 8 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_8.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 8: 0.7982758620689655\n",
      "### ITERATION 9 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_9.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 9: 0.8068965517241379\n",
      "### ITERATION 10 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_10.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 10: 0.8155172413793104\n",
      "### ITERATION 11 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_11.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 11: 0.8017241379310345\n",
      "### ITERATION 12 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_12.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 12: 0.8051724137931034\n",
      "### ITERATION 13 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_13.csv\n",
      "Type 'done' when you've finished labeling: sonw\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 13: 0.8068965517241379\n",
      "### ITERATION 14 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_14.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 14: 0.8068965517241379\n",
      "### ITERATION 15 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_15.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 15: 0.8189655172413793\n",
      "### ITERATION 16 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_16.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 16: 0.8189655172413793\n",
      "### ITERATION 17 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_17.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 17: 0.8206896551724138\n",
      "### ITERATION 18 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_18.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 18: 0.8241379310344827\n",
      "### ITERATION 19 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_19.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 19: 0.8362068965517241\n",
      "### ITERATION 20 ###\n",
      "Label samples in: ../dataset/to_label_ner/samples_to_label_20.csv\n",
      "Type 'done' when you've finished labeling: done\n",
      "Validation Accuracy after iteration 20: 0.8258620689655173\n"
     ]
    }
   ],
   "source": [
    "from modAL.models import ActiveLearner\n",
    "from modAL.uncertainty import uncertainty_sampling\n",
    "from sklearn.ensemble import RandomForestClassifier\n",
    "from sklearn.metrics import accuracy_score\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "\n",
    "\n",
    "labels_sub = train_df\n",
    "labeled_df = labels_sub[labels_sub['ner_label'].notna()]\n",
    "unlabeled_df = labels_sub[labels_sub['ner_label'].isna()]\n",
    "unlabeled_df = unlabeled_df.dropna(subset=['glove_vec'])\n",
    "\n",
    "X_train = pd.DataFrame(labeled_df['glove_vec'].tolist()).to_numpy()\n",
    "y_train = labeled_df['ner_label'].to_numpy()\n",
    "\n",
    "learner = ActiveLearner(\n",
    "    estimator=RandomForestClassifier(),\n",
    "    query_strategy=uncertainty_sampling,\n",
    "    X_training=X_train,\n",
    "    y_training=y_train\n",
    ")\n",
    "\n",
    "X_unlabeled = pd.DataFrame(unlabeled_df['glove_vec'].tolist()).to_numpy()\n",
    "X_unlabeled = X_unlabeled[~np.isnan(X_unlabeled).any(axis=1)]\n",
    "\n",
    "for iteration in range(1, 21):  # This loop will run for 3 iterations. Adjust as needed.\n",
    "    if len(X_unlabeled)==0:\n",
    "        print(f\"All tokens are labelled\")\n",
    "        break\n",
    "    print(f\"### ITERATION {iteration} ###\")\n",
    "\n",
    "    query_idx, query_sample = learner.query(X_unlabeled, n_instances=10)\n",
    "    sample_to_label = unlabeled_df.iloc[query_idx]\n",
    "    sample_to_label.to_csv(f\"../dataset/to_label_ner/samples_to_label_{iteration}.csv\")\n",
    "    \n",
    "    print(f\"Label samples in: ../dataset/to_label_ner/samples_to_label_{iteration}.csv\")\n",
    "    done = \"\"\n",
    "    while done.lower() != \"done\":\n",
    "        done = input(\"Type 'done' when you've finished labeling: \")\n",
    "\n",
    "    annotated_samples = pd.read_csv(f\"../dataset/to_label_ner/samples_to_label_{iteration}_done.csv\")\n",
    "    new = annotated_samples['ner_label'].values\n",
    "    learner.teach(query_sample, new)\n",
    "\n",
    "    y_pred = learner.predict(X_valid)\n",
    "    accuracy = accuracy_score(y_valid, y_pred)\n",
    "    print(f\"Validation Accuracy after iteration {iteration}:\", accuracy)\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Combining the labelled datasets, join to tags dataframe\n",
    "- First reading in the labelled datasets then merging them together\n",
    "- Then join to words dataframe"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>tag</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>ner_label</th>\n",
       "      <th>Unnamed: 4</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>12756</td>\n",
       "      <td>random</td>\n",
       "      <td>[ 3.7813e-01  9.2614e-01  3.7270e-01 -6.1136e-...</td>\n",
       "      <td>O</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>23934</td>\n",
       "      <td>concert</td>\n",
       "      <td>[ 0.029852  -0.20522   -0.71844   -0.48894   -...</td>\n",
       "      <td>CW</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>12624</td>\n",
       "      <td>song</td>\n",
       "      <td>[-3.5170e-01 -2.8911e-01  1.9884e-01 -4.7476e-...</td>\n",
       "      <td>CW</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>10081</td>\n",
       "      <td>czech</td>\n",
       "      <td>[-1.8492e-01  1.5381e-01  1.2601e+00 -2.1114e-...</td>\n",
       "      <td>LOC</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1858</td>\n",
       "      <td>wedding</td>\n",
       "      <td>[ 0.67658    0.11038    0.17131   -0.75275   -...</td>\n",
       "      <td>O</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>195</th>\n",
       "      <td>9014</td>\n",
       "      <td>jerusalem</td>\n",
       "      <td>[ 4.3531e-01  1.2321e+00  1.0205e+00  1.3986e-...</td>\n",
       "      <td>LOC</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>196</th>\n",
       "      <td>25342</td>\n",
       "      <td>pierce</td>\n",
       "      <td>[ 0.16362   -0.50971   -0.78109   -0.37825   -...</td>\n",
       "      <td>O</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>197</th>\n",
       "      <td>7068</td>\n",
       "      <td>trash</td>\n",
       "      <td>[ 0.29287   -0.017886  -0.16534   -0.11473   -...</td>\n",
       "      <td>O</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>198</th>\n",
       "      <td>25629</td>\n",
       "      <td>penthouse</td>\n",
       "      <td>[-3.3067e-02 -4.4267e-01 -3.6066e-01 -1.4896e-...</td>\n",
       "      <td>O</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>199</th>\n",
       "      <td>25100</td>\n",
       "      <td>bath</td>\n",
       "      <td>[ 2.9690e-01 -2.5744e-02 -1.4287e-01  3.1498e-...</td>\n",
       "      <td>O</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>200 rows × 5 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     Unnamed: 0        tag                                          glove_vec  \\\n",
       "0         12756     random  [ 3.7813e-01  9.2614e-01  3.7270e-01 -6.1136e-...   \n",
       "1         23934    concert  [ 0.029852  -0.20522   -0.71844   -0.48894   -...   \n",
       "2         12624       song  [-3.5170e-01 -2.8911e-01  1.9884e-01 -4.7476e-...   \n",
       "3         10081      czech  [-1.8492e-01  1.5381e-01  1.2601e+00 -2.1114e-...   \n",
       "4          1858    wedding  [ 0.67658    0.11038    0.17131   -0.75275   -...   \n",
       "..          ...        ...                                                ...   \n",
       "195        9014  jerusalem  [ 4.3531e-01  1.2321e+00  1.0205e+00  1.3986e-...   \n",
       "196       25342     pierce  [ 0.16362   -0.50971   -0.78109   -0.37825   -...   \n",
       "197        7068      trash  [ 0.29287   -0.017886  -0.16534   -0.11473   -...   \n",
       "198       25629  penthouse  [-3.3067e-02 -4.4267e-01 -3.6066e-01 -1.4896e-...   \n",
       "199       25100       bath  [ 2.9690e-01 -2.5744e-02 -1.4287e-01  3.1498e-...   \n",
       "\n",
       "    ner_label  Unnamed: 4  \n",
       "0           O         NaN  \n",
       "1          CW         NaN  \n",
       "2          CW         NaN  \n",
       "3         LOC         NaN  \n",
       "4           O         NaN  \n",
       "..        ...         ...  \n",
       "195       LOC         NaN  \n",
       "196         O         NaN  \n",
       "197         O         NaN  \n",
       "198         O         NaN  \n",
       "199         O         NaN  \n",
       "\n",
       "[200 rows x 5 columns]"
      ]
     },
     "execution_count": 22,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "base_path = \"../dataset/to_label_ner/\"\n",
    "file_prefix = \"samples_to_label_\"\n",
    "file_suffix = \"_done.csv\"\n",
    "\n",
    "dfs = []\n",
    "\n",
    "# Loop to read files 1 through 20\n",
    "for i in range(1, 21):\n",
    "    file_path = f\"{base_path}{file_prefix}{i}{file_suffix}\"\n",
    "    df = pd.read_csv(file_path)\n",
    "    dfs.append(df)\n",
    "\n",
    "# Concatenate all dataframes together\n",
    "df_merged = pd.concat(dfs, axis=0, ignore_index=True)\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>tag</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>ner_label</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>12756</td>\n",
       "      <td>random</td>\n",
       "      <td>[ 3.7813e-01  9.2614e-01  3.7270e-01 -6.1136e-...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>23934</td>\n",
       "      <td>concert</td>\n",
       "      <td>[ 0.029852  -0.20522   -0.71844   -0.48894   -...</td>\n",
       "      <td>CW</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>12624</td>\n",
       "      <td>song</td>\n",
       "      <td>[-3.5170e-01 -2.8911e-01  1.9884e-01 -4.7476e-...</td>\n",
       "      <td>CW</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>10081</td>\n",
       "      <td>czech</td>\n",
       "      <td>[-1.8492e-01  1.5381e-01  1.2601e+00 -2.1114e-...</td>\n",
       "      <td>LOC</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1858</td>\n",
       "      <td>wedding</td>\n",
       "      <td>[ 0.67658    0.11038    0.17131   -0.75275   -...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>195</th>\n",
       "      <td>9014</td>\n",
       "      <td>jerusalem</td>\n",
       "      <td>[ 4.3531e-01  1.2321e+00  1.0205e+00  1.3986e-...</td>\n",
       "      <td>LOC</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>196</th>\n",
       "      <td>25342</td>\n",
       "      <td>pierce</td>\n",
       "      <td>[ 0.16362   -0.50971   -0.78109   -0.37825   -...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>197</th>\n",
       "      <td>7068</td>\n",
       "      <td>trash</td>\n",
       "      <td>[ 0.29287   -0.017886  -0.16534   -0.11473   -...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>198</th>\n",
       "      <td>25629</td>\n",
       "      <td>penthouse</td>\n",
       "      <td>[-3.3067e-02 -4.4267e-01 -3.6066e-01 -1.4896e-...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>199</th>\n",
       "      <td>25100</td>\n",
       "      <td>bath</td>\n",
       "      <td>[ 2.9690e-01 -2.5744e-02 -1.4287e-01  3.1498e-...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>200 rows × 4 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     Unnamed: 0        tag                                          glove_vec  \\\n",
       "0         12756     random  [ 3.7813e-01  9.2614e-01  3.7270e-01 -6.1136e-...   \n",
       "1         23934    concert  [ 0.029852  -0.20522   -0.71844   -0.48894   -...   \n",
       "2         12624       song  [-3.5170e-01 -2.8911e-01  1.9884e-01 -4.7476e-...   \n",
       "3         10081      czech  [-1.8492e-01  1.5381e-01  1.2601e+00 -2.1114e-...   \n",
       "4          1858    wedding  [ 0.67658    0.11038    0.17131   -0.75275   -...   \n",
       "..          ...        ...                                                ...   \n",
       "195        9014  jerusalem  [ 4.3531e-01  1.2321e+00  1.0205e+00  1.3986e-...   \n",
       "196       25342     pierce  [ 0.16362   -0.50971   -0.78109   -0.37825   -...   \n",
       "197        7068      trash  [ 0.29287   -0.017886  -0.16534   -0.11473   -...   \n",
       "198       25629  penthouse  [-3.3067e-02 -4.4267e-01 -3.6066e-01 -1.4896e-...   \n",
       "199       25100       bath  [ 2.9690e-01 -2.5744e-02 -1.4287e-01  3.1498e-...   \n",
       "\n",
       "    ner_label  \n",
       "0           O  \n",
       "1          CW  \n",
       "2          CW  \n",
       "3         LOC  \n",
       "4           O  \n",
       "..        ...  \n",
       "195       LOC  \n",
       "196         O  \n",
       "197         O  \n",
       "198         O  \n",
       "199         O  \n",
       "\n",
       "[200 rows x 4 columns]"
      ]
     },
     "execution_count": 26,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_merged = df_merged.drop(['Unnamed: 4'], axis=1)\n",
    "df_merged"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {},
   "outputs": [],
   "source": [
    "words = words.drop(columns=['ner_label'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tag</th>\n",
       "      <th>glove_vec</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>s</td>\n",
       "      <td>[0.18209, 0.88297, -0.49805, 0.53137, -0.36084...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>action</td>\n",
       "      <td>[0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>twist</td>\n",
       "      <td>[-0.095859, -0.17472, -0.034692, -0.37307, 0.3...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>overrate</td>\n",
       "      <td>[0.28151, -0.42171, -0.38275, 0.15364, -0.7648...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>violent</td>\n",
       "      <td>[0.13693, 0.1856, -0.65335, -0.50922, -0.18431...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50062</th>\n",
       "      <td>newspaper</td>\n",
       "      <td>[-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50110</th>\n",
       "      <td>static</td>\n",
       "      <td>[0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50139</th>\n",
       "      <td>repeat</td>\n",
       "      <td>[0.48671, 0.93464, -0.015418, -0.46056, -0.152...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50142</th>\n",
       "      <td>seal</td>\n",
       "      <td>[-0.35434, 0.51161, -0.086652, -0.23459, 0.435...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50176</th>\n",
       "      <td>counterespionage</td>\n",
       "      <td>[0.11309, -0.8528, -0.25529, 0.02635, -0.30105...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>2899 rows × 2 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                    tag                                          glove_vec\n",
       "0                     s  [0.18209, 0.88297, -0.49805, 0.53137, -0.36084...\n",
       "1                action  [0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...\n",
       "2                 twist  [-0.095859, -0.17472, -0.034692, -0.37307, 0.3...\n",
       "4              overrate  [0.28151, -0.42171, -0.38275, 0.15364, -0.7648...\n",
       "5               violent  [0.13693, 0.1856, -0.65335, -0.50922, -0.18431...\n",
       "...                 ...                                                ...\n",
       "50062         newspaper  [-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...\n",
       "50110            static  [0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...\n",
       "50139            repeat  [0.48671, 0.93464, -0.015418, -0.46056, -0.152...\n",
       "50142              seal  [-0.35434, 0.51161, -0.086652, -0.23459, 0.435...\n",
       "50176  counterespionage  [0.11309, -0.8528, -0.25529, 0.02635, -0.30105...\n",
       "\n",
       "[2899 rows x 2 columns]"
      ]
     },
     "execution_count": 29,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "words"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "metadata": {},
   "outputs": [],
   "source": [
    "df_lab = df_merged[[\"tag\", \"ner_label\"]]\n",
    "words = words.merge(df_lab, on=['tag'], how=\"left\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "metadata": {},
   "outputs": [],
   "source": [
    "words.to_csv(\"../dataset/to_label_ner/words.csv\",index=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0       NaN\n",
       "6        CW\n",
       "23        O\n",
       "60      LOC\n",
       "102     PER\n",
       "452    PROD\n",
       "Name: ner_label, dtype: object"
      ]
     },
     "execution_count": 35,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "words['ner_label'].drop_duplicates() # need to rename for consistency"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "metadata": {},
   "outputs": [],
   "source": [
    "words['ner_label'] = words['ner_label'].replace('Person', 'PER')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0       NaN\n",
       "6        CW\n",
       "23        O\n",
       "60      LOC\n",
       "102     PER\n",
       "452    PROD\n",
       "Name: ner_label, dtype: object"
      ]
     },
     "execution_count": 37,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "words['ner_label'].drop_duplicates()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Testing the join:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tag</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>ner_label</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>535</th>\n",
       "      <td>poker</td>\n",
       "      <td>[0.42254, 0.24923, -0.15362, -0.73099, 0.19908...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "       tag                                          glove_vec ner_label\n",
       "535  poker  [0.42254, 0.24923, -0.15362, -0.73099, 0.19908...       NaN"
      ]
     },
     "execution_count": 38,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "words[words['tag'] == 'poker']"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Converting the training data to a readable type by SpaCy model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "200"
      ]
     },
     "execution_count": 39,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "t = words[words['ner_label'].isna() == False]\n",
    "len(t)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "metadata": {},
   "outputs": [],
   "source": [
    "t[[\"tag\", \"ner_label\"]].to_csv(\"here.csv\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Merging t and valid_df to increase the size of the training dataset\n",
    "taking 50% of valid_df for training"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 41,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Sample 70% of valid_df for training\n",
    "sampled_valid_df_train = valid_df.sample(frac=0.7)\n",
    "\n",
    "# The other 30% for testing\n",
    "sampled_valid_df_test = valid_df.drop(sampled_valid_df_train.index)\n",
    "\n",
    "# Merge or concatenate 't' dataframe with the training half of 'valid_df'\n",
    "combined_df_train = pd.concat([t, sampled_valid_df_train], ignore_index=True)\n",
    "\n",
    "t = combined_df_train"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**Train spaCy NER model on manual labels - Custom NER model**\n",
    "\n",
    "ref = https://towardsdatascience.com/train-ner-with-custom-training-data-using-spacy-525ce748fab7"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Define the variables required for the training model to be processed.\n",
    "\n",
    "- Model is a pre-trained one and is fine-tuned on my labels\n",
    "    - Add new entity labels to NER component"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 44,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Collecting en-core-web-md==3.7.1\n",
      "  Downloading https://github.com/explosion/spacy-models/releases/download/en_core_web_md-3.7.1/en_core_web_md-3.7.1-py3-none-any.whl (42.8 MB)\n",
      "\u001B[2K     \u001B[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m \u001B[32m42.8/42.8 MB\u001B[0m \u001B[31m6.7 MB/s\u001B[0m eta \u001B[36m0:00:00\u001B[0m00:01\u001B[0m00:01\u001B[0m\n",
      "\u001B[?25hRequirement already satisfied: spacy<3.8.0,>=3.7.2 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from en-core-web-md==3.7.1) (3.7.6)\n",
      "Requirement already satisfied: spacy-legacy<3.1.0,>=3.0.11 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (3.0.12)\n",
      "Requirement already satisfied: spacy-loggers<2.0.0,>=1.0.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (1.0.5)\n",
      "Requirement already satisfied: murmurhash<1.1.0,>=0.28.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (1.0.10)\n",
      "Requirement already satisfied: cymem<2.1.0,>=2.0.2 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (2.0.8)\n",
      "Requirement already satisfied: preshed<3.1.0,>=3.0.2 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (3.0.9)\n",
      "Requirement already satisfied: thinc<8.3.0,>=8.2.2 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (8.2.5)\n",
      "Requirement already satisfied: wasabi<1.2.0,>=0.9.1 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (1.1.3)\n",
      "Requirement already satisfied: srsly<3.0.0,>=2.4.3 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (2.4.8)\n",
      "Requirement already satisfied: catalogue<2.1.0,>=2.0.6 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (2.0.10)\n",
      "Requirement already satisfied: weasel<0.5.0,>=0.1.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (0.4.1)\n",
      "Requirement already satisfied: typer<1.0.0,>=0.3.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (0.12.4)\n",
      "Requirement already satisfied: tqdm<5.0.0,>=4.38.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (4.65.0)\n",
      "Requirement already satisfied: requests<3.0.0,>=2.13.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (2.31.0)\n",
      "Requirement already satisfied: pydantic!=1.8,!=1.8.1,<3.0.0,>=1.7.4 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (1.10.8)\n",
      "Requirement already satisfied: jinja2 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (3.1.2)\n",
      "Requirement already satisfied: setuptools in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (68.0.0)\n",
      "Requirement already satisfied: packaging>=20.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (23.1)\n",
      "Requirement already satisfied: langcodes<4.0.0,>=3.2.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (3.4.0)\n",
      "Requirement already satisfied: numpy>=1.19.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (1.24.3)\n",
      "Requirement already satisfied: language-data>=1.2 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from langcodes<4.0.0,>=3.2.0->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (1.2.0)\n",
      "Requirement already satisfied: typing-extensions>=4.2.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from pydantic!=1.8,!=1.8.1,<3.0.0,>=1.7.4->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (4.12.2)\n",
      "Requirement already satisfied: charset-normalizer<4,>=2 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from requests<3.0.0,>=2.13.0->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (2.0.4)\n",
      "Requirement already satisfied: idna<4,>=2.5 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from requests<3.0.0,>=2.13.0->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (3.4)\n",
      "Requirement already satisfied: urllib3<3,>=1.21.1 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from requests<3.0.0,>=2.13.0->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (1.26.16)\n",
      "Requirement already satisfied: certifi>=2017.4.17 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from requests<3.0.0,>=2.13.0->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (2024.2.2)\n",
      "Requirement already satisfied: blis<0.8.0,>=0.7.8 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from thinc<8.3.0,>=8.2.2->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (0.7.11)\n",
      "Requirement already satisfied: confection<1.0.0,>=0.0.1 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from thinc<8.3.0,>=8.2.2->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (0.1.5)\n",
      "Requirement already satisfied: click>=8.0.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from typer<1.0.0,>=0.3.0->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (8.1.7)\n",
      "Requirement already satisfied: shellingham>=1.3.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from typer<1.0.0,>=0.3.0->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (1.5.4)\n",
      "Requirement already satisfied: rich>=10.11.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from typer<1.0.0,>=0.3.0->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (13.7.1)\n",
      "Requirement already satisfied: cloudpathlib<1.0.0,>=0.7.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from weasel<0.5.0,>=0.1.0->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (0.18.1)\n",
      "Requirement already satisfied: smart-open<8.0.0,>=5.2.1 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from weasel<0.5.0,>=0.1.0->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (5.2.1)\n",
      "Requirement already satisfied: MarkupSafe>=2.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from jinja2->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (2.1.1)\n",
      "Requirement already satisfied: marisa-trie>=0.7.7 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from language-data>=1.2->langcodes<4.0.0,>=3.2.0->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (1.2.0)\n",
      "Requirement already satisfied: markdown-it-py>=2.2.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from rich>=10.11.0->typer<1.0.0,>=0.3.0->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (2.2.0)\n",
      "Requirement already satisfied: pygments<3.0.0,>=2.13.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from rich>=10.11.0->typer<1.0.0,>=0.3.0->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (2.15.1)\n",
      "Requirement already satisfied: mdurl~=0.1 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from markdown-it-py>=2.2.0->rich>=10.11.0->typer<1.0.0,>=0.3.0->spacy<3.8.0,>=3.7.2->en-core-web-md==3.7.1) (0.1.0)\n",
      "Installing collected packages: en-core-web-md\n",
      "Successfully installed en-core-web-md-3.7.1\n",
      "\u001B[38;5;2m✔ Download and installation successful\u001B[0m\n",
      "You can now load the package via spacy.load('en_core_web_md')\n"
     ]
    }
   ],
   "source": [
    "!python -m spacy download en_core_web_md\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 42,
   "metadata": {},
   "outputs": [],
   "source": [
    "from __future__ import unicode_literals, print_function\n",
    "\n",
    "import random\n",
    "from pathlib import Path\n",
    "import spacy\n",
    "from tqdm import tqdm\n",
    "\n",
    "\n",
    "input_data = list(zip(t['tag'], t['ner_label']))\n",
    "\n",
    "TRAIN_DATA = [(word, {\"entities\": [(0, len(word), label)]}) for word, label in input_data]\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 45,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Loaded model 'en_core_web_md'\n",
      "Iteration 1, Losses {'ner': 422.6617907359614}\n",
      "Iteration 2, Losses {'ner': 247.4135676920996}\n",
      "Iteration 3, Losses {'ner': 233.9982915611472}\n",
      "Iteration 4, Losses {'ner': 209.21005214694014}\n",
      "Iteration 5, Losses {'ner': 209.36362706686486}\n",
      "Iteration 6, Losses {'ner': 183.26999039935254}\n",
      "Iteration 7, Losses {'ner': 176.7985747557163}\n",
      "Iteration 8, Losses {'ner': 167.07425810366433}\n",
      "Iteration 9, Losses {'ner': 163.42062955976098}\n",
      "Iteration 10, Losses {'ner': 135.64236977750815}\n",
      "Iteration 11, Losses {'ner': 128.86931058430733}\n",
      "Iteration 12, Losses {'ner': 120.83931449085503}\n",
      "Iteration 13, Losses {'ner': 113.51734835874157}\n",
      "Iteration 14, Losses {'ner': 108.52877322344843}\n",
      "Iteration 15, Losses {'ner': 107.63247987134598}\n",
      "Iteration 16, Losses {'ner': 82.8958250792876}\n",
      "Iteration 17, Losses {'ner': 85.04189038934966}\n",
      "Iteration 18, Losses {'ner': 80.44434362227304}\n",
      "Iteration 19, Losses {'ner': 62.68704302356356}\n",
      "Iteration 20, Losses {'ner': 49.37958782281637}\n",
      "Iteration 21, Losses {'ner': 61.556898714803474}\n",
      "Iteration 22, Losses {'ner': 62.41234308603369}\n",
      "Iteration 23, Losses {'ner': 56.883526780680675}\n",
      "Iteration 24, Losses {'ner': 51.776533231383986}\n",
      "Iteration 25, Losses {'ner': 41.969433271408086}\n",
      "Iteration 26, Losses {'ner': 50.22159749284181}\n",
      "Iteration 27, Losses {'ner': 52.20117461486553}\n",
      "Iteration 28, Losses {'ner': 21.041922356486076}\n",
      "Iteration 29, Losses {'ner': 32.710640038816145}\n",
      "Iteration 30, Losses {'ner': 38.484637047807105}\n",
      "Iteration 31, Losses {'ner': 32.70339189469239}\n",
      "Iteration 32, Losses {'ner': 18.138543766142604}\n",
      "Iteration 33, Losses {'ner': 35.20201102239631}\n",
      "Iteration 34, Losses {'ner': 17.655179664240826}\n",
      "Iteration 35, Losses {'ner': 23.10356077445856}\n",
      "Iteration 36, Losses {'ner': 28.742394890868706}\n",
      "Iteration 37, Losses {'ner': 26.964449873936218}\n",
      "Iteration 38, Losses {'ner': 25.2010890280019}\n",
      "Iteration 39, Losses {'ner': 21.138997314661342}\n",
      "Iteration 40, Losses {'ner': 20.748290893322192}\n",
      "Iteration 41, Losses {'ner': 23.210311804289816}\n",
      "Iteration 42, Losses {'ner': 21.09696901198159}\n",
      "Iteration 43, Losses {'ner': 16.748639048435066}\n",
      "Iteration 44, Losses {'ner': 19.553263273825905}\n",
      "Iteration 45, Losses {'ner': 21.988974931367736}\n",
      "Iteration 46, Losses {'ner': 18.858876722946466}\n",
      "Iteration 47, Losses {'ner': 12.500464522369038}\n",
      "Iteration 48, Losses {'ner': 15.8141701806719}\n",
      "Iteration 49, Losses {'ner': 28.957901817648427}\n",
      "Iteration 50, Losses {'ner': 15.293988795989073}\n",
      "Iteration 51, Losses {'ner': 9.052524711331163}\n",
      "Iteration 52, Losses {'ner': 17.95808060920012}\n",
      "Iteration 53, Losses {'ner': 10.348478267340724}\n",
      "Iteration 54, Losses {'ner': 18.549233314092742}\n",
      "Iteration 55, Losses {'ner': 20.539523187674735}\n",
      "Iteration 56, Losses {'ner': 31.432147984662883}\n",
      "Iteration 57, Losses {'ner': 20.823523362624112}\n",
      "Iteration 58, Losses {'ner': 17.99894391215919}\n",
      "Iteration 59, Losses {'ner': 16.59873915580375}\n",
      "Iteration 60, Losses {'ner': 13.925211716937397}\n",
      "Iteration 61, Losses {'ner': 20.507162855628142}\n",
      "Iteration 62, Losses {'ner': 12.951482193063535}\n",
      "Iteration 63, Losses {'ner': 13.706259036568907}\n",
      "Iteration 64, Losses {'ner': 18.937040549872933}\n",
      "Iteration 65, Losses {'ner': 6.7451768876422165}\n",
      "Iteration 66, Losses {'ner': 0.2634336030979442}\n",
      "Iteration 67, Losses {'ner': 10.49979152425093}\n",
      "Iteration 68, Losses {'ner': 11.200380788830513}\n",
      "Iteration 69, Losses {'ner': 19.146001676971967}\n",
      "Iteration 70, Losses {'ner': 11.768651516807529}\n",
      "Iteration 71, Losses {'ner': 12.770083443718235}\n",
      "Iteration 72, Losses {'ner': 21.699160390107256}\n",
      "Iteration 73, Losses {'ner': 7.562512016531679}\n",
      "Iteration 74, Losses {'ner': 12.074429266918642}\n",
      "Iteration 75, Losses {'ner': 9.068845397458013}\n",
      "Iteration 76, Losses {'ner': 5.77072254201232}\n",
      "Iteration 77, Losses {'ner': 7.240381700558949}\n",
      "Iteration 78, Losses {'ner': 6.529770657846003}\n",
      "Iteration 79, Losses {'ner': 12.874568626020293}\n",
      "Iteration 80, Losses {'ner': 8.974766121843633}\n",
      "Iteration 81, Losses {'ner': 8.47182850818935}\n",
      "Iteration 82, Losses {'ner': 12.050470430838564}\n",
      "Iteration 83, Losses {'ner': 6.874989821942043}\n",
      "Iteration 84, Losses {'ner': 11.399770812226995}\n",
      "Iteration 85, Losses {'ner': 10.223938391949948}\n",
      "Iteration 86, Losses {'ner': 11.15393743966346}\n",
      "Iteration 87, Losses {'ner': 3.863301331390279}\n",
      "Iteration 88, Losses {'ner': 8.151195251793661}\n",
      "Iteration 89, Losses {'ner': 16.184101034030384}\n",
      "Iteration 90, Losses {'ner': 8.476963047650958}\n",
      "Iteration 91, Losses {'ner': 7.091983999578414}\n",
      "Iteration 92, Losses {'ner': 9.35446571315087}\n",
      "Iteration 93, Losses {'ner': 18.907853375738398}\n",
      "Iteration 94, Losses {'ner': 4.089007331338109}\n",
      "Iteration 95, Losses {'ner': 3.010512058176018}\n",
      "Iteration 96, Losses {'ner': 9.473065866205289}\n",
      "Iteration 97, Losses {'ner': 7.334730114775097}\n",
      "Iteration 98, Losses {'ner': 9.552484310611634}\n",
      "Iteration 99, Losses {'ner': 12.48493270605909}\n",
      "Iteration 100, Losses {'ner': 6.884364797819385}\n",
      "Saved model to ../dataset/ner_output\n"
     ]
    }
   ],
   "source": [
    "import spacy\n",
    "from spacy.training import Example\n",
    "from spacy.util import minibatch, compounding\n",
    "from pathlib import Path\n",
    "import random\n",
    "from tqdm import tqdm\n",
    "import spacy_lookups_data\n",
    "\n",
    "model = \"en_core_web_md\"\n",
    "\n",
    "output_dir=Path(\"../dataset/ner_output\")\n",
    "n_iter = 100\n",
    "\n",
    "\n",
    "# Load the model\n",
    "if model is not None:\n",
    "    nlp = spacy.load(model)\n",
    "    print(\"Loaded model '%s'\" % model)\n",
    "else:\n",
    "    nlp = spacy.blank('en')\n",
    "    print(\"Created blank 'en' model\")\n",
    "\n",
    "# Check for NER pipe\n",
    "if 'ner' not in nlp.pipe_names:\n",
    "    ner = nlp.create_pipe('ner')\n",
    "    nlp.add_pipe(ner, last=True)\n",
    "else:\n",
    "    ner = nlp.get_pipe('ner')\n",
    "\n",
    "# Add new entity labels to entity recognizer\n",
    "for _, annotations in TRAIN_DATA:\n",
    "    for ent in annotations.get('entities'):\n",
    "        ner.add_label(ent[2])\n",
    "\n",
    "# Get names of other pipes to disable them during training\n",
    "other_pipes = [pipe for pipe in nlp.pipe_names if pipe != 'ner']\n",
    "with nlp.disable_pipes(*other_pipes):  # only train NER\n",
    "    optimizer = nlp.create_optimizer()  # continue training on existing model\n",
    "    \n",
    "    for itn in range(n_iter):\n",
    "        random.shuffle(TRAIN_DATA)\n",
    "        losses = {}\n",
    "        \n",
    "        # Data partitioning with minibatch\n",
    "        batches = minibatch(TRAIN_DATA, size=compounding(4.0, 32.0, 1.001))\n",
    "        \n",
    "        for batch in batches:\n",
    "            texts, annotations = zip(*batch)\n",
    "\n",
    "            examples = []\n",
    "            for i in range(len(texts)):\n",
    "                doc = nlp.make_doc(texts[i])\n",
    "                examples.append(Example.from_dict(doc, annotations[i]))\n",
    "\n",
    "            nlp.update(examples, drop=0.5, sgd=optimizer, losses=losses)\n",
    "        print(\"Iteration {}, Losses {}\".format(itn + 1, losses))\n",
    "\n",
    "if output_dir is not None:\n",
    "    output_dir = Path(output_dir)\n",
    "    if not output_dir.exists():\n",
    "        output_dir.mkdir()\n",
    "    nlp.to_disk(output_dir)\n",
    "    print(\"Saved model to\", output_dir)\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**Hyperparameter tuning for the NER model**\n",
    "1. Dropout Rate\n",
    "2. Minibatch size\n",
    "3. Learning Rate\n",
    "4. Number of Iterations\n",
    "5. Initial model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 46,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "[I 2024-09-03 00:31:32,745] A new study created in memory with name: no-name-3a573ce2-a58f-42f4-93d9-876b315ba492\n",
      "[I 2024-09-03 00:36:24,316] Trial 0 finished with value: 0.764367816091954 and parameters: {'dropout': 0.5739694415334561, 'compounding_start': 2.0841332606731973, 'compounding_end': 28.884537649220285, 'n_iter': 108}. Best is trial 0 with value: 0.764367816091954.\n",
      "[I 2024-09-03 00:38:20,993] Trial 1 finished with value: 0.7988505747126436 and parameters: {'dropout': 0.5562659598253016, 'compounding_start': 3.1614213290371147, 'compounding_end': 26.7719345870495, 'n_iter': 60}. Best is trial 1 with value: 0.7988505747126436.\n",
      "[I 2024-09-03 00:42:30,867] Trial 2 finished with value: 0.7816091954022989 and parameters: {'dropout': 0.727955302185287, 'compounding_start': 3.68977165516909, 'compounding_end': 21.110094861565415, 'n_iter': 146}. Best is trial 1 with value: 0.7988505747126436.\n",
      "[I 2024-09-03 00:49:08,927] Trial 3 finished with value: 0.7183908045977011 and parameters: {'dropout': 0.5650688903446928, 'compounding_start': 2.2682059216643973, 'compounding_end': 27.646537743884963, 'n_iter': 148}. Best is trial 1 with value: 0.7988505747126436.\n",
      "[I 2024-09-03 00:52:30,775] Trial 4 finished with value: 0.8160919540229885 and parameters: {'dropout': 0.5069418893315567, 'compounding_start': 3.5465715134131166, 'compounding_end': 16.57240868898037, 'n_iter': 114}. Best is trial 4 with value: 0.8160919540229885.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Best trial:\n",
      "Value: 0.8160919540229885\n",
      "Params: \n",
      "dropout: 0.5069418893315567\n",
      "compounding_start: 3.5465715134131166\n",
      "compounding_end: 16.57240868898037\n",
      "n_iter: 114\n"
     ]
    }
   ],
   "source": [
    "import optuna\n",
    "\n",
    "def objective(trial):\n",
    "    # Define hyperparameter search space\n",
    "    dropout = trial.suggest_float(\"dropout\", 0.2, 0.8)\n",
    "    compounding_start = trial.suggest_float(\"compounding_start\", 2.0, 4.0)\n",
    "    compounding_end = trial.suggest_float(\"compounding_end\", 16.0, 32.0)\n",
    "    n_iter = trial.suggest_int(\"n_iter\", 50, 150)\n",
    "    \n",
    "    nlp = spacy.load(model) if model else spacy.blank('en')\n",
    "\n",
    "    if 'ner' not in nlp.pipe_names:\n",
    "        ner = nlp.create_pipe('ner')\n",
    "        nlp.add_pipe(ner, last=True)\n",
    "    else:\n",
    "        ner = nlp.get_pipe('ner')\n",
    "\n",
    "    for _, annotations in TRAIN_DATA:\n",
    "        for ent in annotations.get('entities'):\n",
    "            ner.add_label(ent[2])\n",
    "\n",
    "    other_pipes = [pipe for pipe in nlp.pipe_names if pipe != 'ner']\n",
    "    with nlp.disable_pipes(*other_pipes):\n",
    "        optimizer = nlp.create_optimizer()\n",
    "        for itn in range(n_iter):\n",
    "            random.shuffle(TRAIN_DATA)\n",
    "            losses = {}\n",
    "            batches = minibatch(TRAIN_DATA, size=compounding(compounding_start, compounding_end, 1.001))\n",
    "            for batch in batches:\n",
    "                texts, annotations = zip(*batch)\n",
    "                examples = [Example.from_dict(nlp.make_doc(text), ann) for text, ann in zip(texts, annotations)]\n",
    "                nlp.update(examples, drop=dropout, sgd=optimizer, losses=losses)\n",
    "\n",
    "    # Evaluation method\n",
    "    train_tags = {item[0] for item in TRAIN_DATA}\n",
    "    validation_data = valid_df[~valid_df['tag'].isin(train_tags)]\n",
    "    total_predictions = 0\n",
    "    correct_predictions = 0\n",
    "    for _, row in validation_data.iterrows():\n",
    "        doc = nlp(row['tag'])\n",
    "        if doc.ents:\n",
    "            predicted_label = doc.ents[0].label_\n",
    "            if predicted_label == row['ner_label']:\n",
    "                correct_predictions += 1\n",
    "        else:\n",
    "            if row['ner_label'] == 'O':\n",
    "                correct_predictions += 1\n",
    "        total_predictions += 1\n",
    "    accuracy = correct_predictions / total_predictions\n",
    "\n",
    "    return accuracy\n",
    "\n",
    "study = optuna.create_study(direction=\"maximize\")\n",
    "study.optimize(objective, n_trials=5)\n",
    "\n",
    "print(\"Best trial:\")\n",
    "trial = study.best_trial\n",
    "print(f\"Value: {trial.value}\")\n",
    "print(\"Params: \")\n",
    "for key, value in trial.params.items():\n",
    "    print(f\"{key}: {value}\")\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Best trial:\n",
    "Value: 0.8113207547169812\n",
    "Params: \n",
    "dropout: 0.7481416541082628\n",
    "compounding_start: 2.5633153390206718\n",
    "compounding_end: 18.15885091048632\n",
    "n_iter: 69"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Results of pretrain\n",
    "\n",
    "ner loss = 2 from initial ner loss of 265\n",
    "\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Checking if the model saved in the directory"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 47,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "../dataset/ner_output/lemmatizer\n",
      "../dataset/ner_output/ner\n",
      "../dataset/ner_output/tokenizer\n",
      "../dataset/ner_output/attribute_ruler\n",
      "../dataset/ner_output/parser\n",
      "../dataset/ner_output/vocab\n",
      "../dataset/ner_output/config.cfg\n",
      "../dataset/ner_output/tok2vec\n",
      "../dataset/ner_output/tagger\n",
      "../dataset/ner_output/meta.json\n",
      "../dataset/ner_output/senter\n"
     ]
    }
   ],
   "source": [
    "files_in_directory = list(output_dir.iterdir())\n",
    "for file in files_in_directory:\n",
    "    print(file)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**testing the trained model on validation set**\n",
    "- Check that the same words aren't in the TRAIN_DATA \n",
    "- Then, record the accuracy "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 48,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>tag</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>ner_label</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>26472</td>\n",
       "      <td>ontario</td>\n",
       "      <td>[-0.32533, -0.18209, -0.021454, 0.16194, -0.07...</td>\n",
       "      <td>LOC</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>26484</td>\n",
       "      <td>underworld</td>\n",
       "      <td>[-0.045434, 0.27666, -0.21188, 0.36246, -0.237...</td>\n",
       "      <td>CW</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>26486</td>\n",
       "      <td>mechanic</td>\n",
       "      <td>[0.20201, 0.031268, 0.18269, -0.28702, 0.3244,...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>26488</td>\n",
       "      <td>scientist</td>\n",
       "      <td>[-0.55698, -0.16186, 0.31294, -0.85187, 0.8522...</td>\n",
       "      <td>PER</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>26495</td>\n",
       "      <td>training</td>\n",
       "      <td>[0.11191, -0.51417, 0.17269, -0.56873, 0.09914...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>575</th>\n",
       "      <td>50062</td>\n",
       "      <td>newspaper</td>\n",
       "      <td>[-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>576</th>\n",
       "      <td>50110</td>\n",
       "      <td>static</td>\n",
       "      <td>[0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>577</th>\n",
       "      <td>50139</td>\n",
       "      <td>repeat</td>\n",
       "      <td>[0.48671, 0.93464, -0.015418, -0.46056, -0.152...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>578</th>\n",
       "      <td>50142</td>\n",
       "      <td>seal</td>\n",
       "      <td>[-0.35434, 0.51161, -0.086652, -0.23459, 0.435...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>579</th>\n",
       "      <td>50176</td>\n",
       "      <td>counterespionage</td>\n",
       "      <td>[0.11309, -0.8528, -0.25529, 0.02635, -0.30105...</td>\n",
       "      <td>O</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>580 rows × 4 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     Unnamed: 0               tag  \\\n",
       "0         26472           ontario   \n",
       "1         26484        underworld   \n",
       "2         26486          mechanic   \n",
       "3         26488         scientist   \n",
       "4         26495          training   \n",
       "..          ...               ...   \n",
       "575       50062         newspaper   \n",
       "576       50110            static   \n",
       "577       50139            repeat   \n",
       "578       50142              seal   \n",
       "579       50176  counterespionage   \n",
       "\n",
       "                                             glove_vec ner_label  \n",
       "0    [-0.32533, -0.18209, -0.021454, 0.16194, -0.07...       LOC  \n",
       "1    [-0.045434, 0.27666, -0.21188, 0.36246, -0.237...        CW  \n",
       "2    [0.20201, 0.031268, 0.18269, -0.28702, 0.3244,...         O  \n",
       "3    [-0.55698, -0.16186, 0.31294, -0.85187, 0.8522...       PER  \n",
       "4    [0.11191, -0.51417, 0.17269, -0.56873, 0.09914...         O  \n",
       "..                                                 ...       ...  \n",
       "575  [-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...         O  \n",
       "576  [0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...         O  \n",
       "577  [0.48671, 0.93464, -0.015418, -0.46056, -0.152...         O  \n",
       "578  [-0.35434, 0.51161, -0.086652, -0.23459, 0.435...         O  \n",
       "579  [0.11309, -0.8528, -0.25529, 0.02635, -0.30105...         O  \n",
       "\n",
       "[580 rows x 4 columns]"
      ]
     },
     "execution_count": 48,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "valid_df "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 49,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Entities [('lottery', 'O')]\n",
      "Entities [('engineer', 'PER')]\n",
      "Entities [('narrator', 'O')]\n",
      "Entities [('special', 'O')]\n",
      "Entities [('protection', 'O')]\n",
      "Entities [('unorthodox', 'O')]\n",
      "Entities [('score', 'O')]\n",
      "Entities [('brooch', 'O')]\n",
      "Entities [('tightrope', 'O')]\n",
      "Entities [('con', 'O')]\n",
      "Entities [('hbomb', 'O')]\n",
      "Entities [('erotism', 'O')]\n",
      "Entities [('medieval', 'O')]\n",
      "Entities [('cowboy', 'PER')]\n",
      "Entities [('deaf', 'O')]\n",
      "Entities [('stylish', 'O')]\n",
      "Entities [('vatican', 'O')]\n",
      "Entities [('literary', 'O')]\n",
      "Entities [('doubledealing', 'O')]\n",
      "Entities [('senseless', 'O')]\n",
      "Entities [('tomb', 'O')]\n",
      "Entities [('panoramic', 'O')]\n",
      "Entities [('counterespionage', 'O')]\n",
      "Entities [('piano', 'PROD')]\n",
      "Entities [('unfinished', 'O')]\n",
      "Entities [('grace', 'O')]\n",
      "Entities [('avant-garde', 'CW')]\n",
      "Entities [('cosmic', 'O')]\n",
      "Entities [('respect', 'O')]\n",
      "Entities [('democracy', 'O')]\n",
      "Entities [('alienation', 'O')]\n",
      "Entities [('wander', 'O')]\n",
      "Entities [('misunderstood', 'O')]\n",
      "Entities [('repeat', 'O')]\n",
      "Entities [('trouble', 'O')]\n",
      "Entities [('aba', 'CORP')]\n",
      "Entities [('underdeveloped', 'PROD')]\n",
      "Entities [('caravan', 'O')]\n",
      "Entities [('fragment', 'O')]\n",
      "Entities [('kubrick', 'PER')]\n",
      "Entities [('tennessee', 'LOC')]\n",
      "Entities [('voyage', 'O')]\n",
      "Entities [('restaurant', 'LOC')]\n",
      "Entities [('tire', 'O')]\n",
      "Entities [('panama', 'LOC')]\n",
      "Entities [('bali', 'LOC')]\n",
      "Entities [('concert', 'CW')]\n",
      "Entities [('versailles', 'LOC')]\n",
      "Entities [('cult', 'O')]\n",
      "Entities [('song', 'CW')]\n",
      "Entities [('perception', 'O')]\n",
      "Entities [('stereotypical', 'O')]\n",
      "Entities [('bordering', 'O')]\n",
      "Entities [('sitcom', 'CW')]\n",
      "Entities [('different', 'O')]\n",
      "Entities [('artist', 'PER')]\n",
      "Entities [('hoax', 'O')]\n",
      "Entities [('inception', 'O')]\n",
      "Entities [('clean', 'O')]\n",
      "Entities [('allegorical', 'O')]\n",
      "Entities [('atrocity', 'O')]\n",
      "Entities [('church', 'O')]\n",
      "Entities [('virginia', 'LOC')]\n",
      "Entities [('islamabad', 'LOC')]\n",
      "Entities [('rocco', 'PER')]\n",
      "Entities [('accomplice', 'PER')]\n",
      "Entities [('mob', 'O')]\n",
      "Entities [('clown', 'O')]\n",
      "Entities [('theater', 'LOC')]\n",
      "Entities [('olde', 'O')]\n",
      "Entities [('brawl', 'O')]\n",
      "Entities [('yosemite', 'LOC')]\n",
      "Entities [('wisconsin', 'LOC')]\n",
      "Entities [('violin', 'O')]\n",
      "Entities [('accurate', 'O')]\n",
      "Entities [('simulation', 'O')]\n",
      "Entities [('tranquilizer', 'O')]\n",
      "Entities [('nepal', 'LOC')]\n",
      "Entities [('sa', 'LOC')]\n",
      "Entities [('scientist', 'PER')]\n",
      "Entities [('emperor', 'PER')]\n",
      "Entities [('jingle', 'O')]\n",
      "Entities [('wildlife', 'O')]\n",
      "Entities [('terminator', 'CW')]\n",
      "Entities [('bollywood', 'PROD')]\n",
      "Entities [('genealogical', 'O')]\n",
      "Entities [('whitney', 'PER')]\n",
      "Entities [('kingdom', 'O')]\n",
      "Entities [('lynch', 'PER')]\n",
      "Entities [('nondiscrimination', 'O')]\n",
      "Entities [('hospitalization', 'O')]\n",
      "Entities [('referee', 'PER')]\n",
      "Entities [('ahem', 'O')]\n",
      "Entities [('art', 'CW')]\n",
      "Entities [('solidarity', 'O')]\n",
      "Entities [('dickens', 'PER')]\n",
      "Entities [('teamwork', 'O')]\n",
      "Entities [('sydney', 'LOC')]\n",
      "Entities [('rabies', 'O')]\n",
      "Entities [('playboy', 'O')]\n",
      "Entities [('pentecostal', 'O')]\n",
      "Entities [('corrupt', 'O')]\n",
      "Entities [('bitch', 'O')]\n",
      "Entities [('patriotism', 'O')]\n",
      "Entities [('chile', 'LOC')]\n",
      "Entities [('white', 'O')]\n",
      "Entities [('netherlands', 'LOC')]\n",
      "Entities [('saturate', 'O')]\n",
      "Entities [('anarchist', 'O')]\n",
      "Entities [('memoir', 'O')]\n",
      "Entities [('wrestling', 'O')]\n",
      "Entities [('omaha', 'LOC')]\n",
      "Entities [('weightlessness', 'O')]\n",
      "Entities [('ptsd', 'O')]\n",
      "Entities [('imperfect', 'O')]\n",
      "Entities [('dream', 'O')]\n",
      "Entities [('jail', 'O')]\n",
      "Entities [('playful', 'O')]\n",
      "Entities [('entrepreneur', 'PER')]\n",
      "Entities [('morocco', 'PER')]\n",
      "Entities [('girl', 'O')]\n",
      "Entities [('unintelligent', 'O')]\n",
      "Entities [('fastpaced', 'O')]\n",
      "Entities [('palestine', 'LOC')]\n",
      "Entities [('mcg', 'CORP')]\n",
      "Entities [('modernism', 'O')]\n",
      "Entities [('scheme', 'O')]\n",
      "Entities [('mistress', 'O')]\n",
      "Entities [('circus', 'CW')]\n",
      "Entities [('rave', 'O')]\n",
      "Entities [('salvation', 'O')]\n",
      "Entities [('focus', 'O')]\n",
      "Entities [('cohen', 'PER')]\n",
      "Entities [('gershwin', 'PER')]\n",
      "Entities [('nashville', 'LOC')]\n",
      "Entities [('purity', 'O')]\n",
      "Entities [('arrogance', 'O')]\n",
      "Entities [('playwright', 'PER')]\n",
      "Entities [('geese', 'O')]\n",
      "Entities [('email', 'O')]\n",
      "Entities [('cryptic', 'O')]\n",
      "Entities [('vampire', 'PER')]\n",
      "Entities [('brave', 'O')]\n",
      "Entities [('skull', 'O')]\n",
      "Entities [('mechanize', 'O')]\n",
      "Entities [('minion', 'O')]\n",
      "Entities [('sushi', 'CW')]\n",
      "Entities [('importer', 'O')]\n",
      "Entities [('wholesome', 'O')]\n",
      "Entities [('forget', 'O')]\n",
      "Entities [('childishness', 'O')]\n",
      "Entities [('stepbrother', 'PER')]\n",
      "Entities [('patriarchy', 'O')]\n",
      "Entities [('static', 'O')]\n",
      "Entities [('magnificent', 'O')]\n",
      "Entities [('music', 'CW')]\n",
      "Entities [('inform', 'O')]\n",
      "Entities [('grain', 'O')]\n",
      "Entities [('butterfly', 'O')]\n",
      "Entities [('germany', 'LOC')]\n",
      "Entities [('wy', 'O')]\n",
      "Entities [('sicily', 'LOC')]\n",
      "Entities [('rocker', 'O')]\n",
      "Entities [('cricket', 'PROD')]\n",
      "Entities [('sith', 'O')]\n",
      "Entities [('cock', 'O')]\n",
      "Entities [('proust', 'PER')]\n",
      "Entities [('prague', 'LOC')]\n",
      "Entities [('spaghetti', 'CW')]\n",
      "Entities [('birth', 'O')]\n",
      "Entities [('vega', 'LOC')]\n",
      "Entities [('sisterhood', 'O')]\n",
      "Entities [('shakespearean', 'O')]\n",
      "Entities [('fantasy', 'O')]\n",
      "Entities [('edinburgh', 'LOC')]\n",
      "Entities [('joint', 'O')]\n",
      "Entities [('penis', 'O')]\n",
      "Entities [('amnesia', 'O')]\n",
      "Entities [('river', 'O')]\n",
      "Entities [('jodhpur', 'LOC')]\n",
      "Entities [('seedy', 'O')]\n",
      "Entities [('narcissistic', 'O')]\n",
      "Entities [('tombstone', 'CW')]\n",
      "Entities [('jean', 'CW')]\n",
      "Entities [('meditation', 'O')]\n",
      "Entities [('chomsky', 'PER')]\n",
      "Entities [('mt', 'LOC')]\n",
      "Entities [('scatter', 'O')]\n",
      "Entities [('dictatorship', 'O')]\n",
      "Entities [('classroom', 'O')]\n",
      "Entities [('lyricist', 'PER')]\n",
      "Entities [('sens', 'O')]\n",
      "Entities [('televangelist', 'O')]\n",
      "Entities [('poetry', 'CW')]\n",
      "Entities [('tribal', 'O')]\n",
      "Entities [('alpinism', 'O')]\n",
      "Entities [('happy', 'O')]\n",
      "Entities [('paris', 'LOC')]\n",
      "Entities [('cairo', 'LOC')]\n",
      "Entities [('aggressive', 'O')]\n",
      "Entities [('cliffhanger', 'O')]\n",
      "Entities [('latin', 'O')]\n",
      "Entities [('production', 'O')]\n",
      "Entities [('jungle', 'LOC')]\n",
      "Entities [('composer', 'PER')]\n",
      "Entities [('pierce', 'O')]\n",
      "Entities [('recession', 'O')]\n",
      "Entities [('pauli', 'PER')]\n",
      "Entities [('bakery', 'O')]\n",
      "Entities [('heroic', 'O')]\n",
      "Entities [('poet', 'PER')]\n",
      "Entities [('normality', 'O')]\n",
      "Entities [('land', 'O')]\n",
      "Entities [('polish', 'O')]\n",
      "Entities [('bosnia', 'LOC')]\n",
      "Entities [('ambulance', 'O')]\n",
      "Entities [('pink', 'O')]\n",
      "Entities [('thriller', 'CW')]\n",
      "Entities [('dazzle', 'O')]\n",
      "Entities [('king', 'PER')]\n",
      "Entities [('okinawa', 'LOC')]\n",
      "Entities [('film', 'CW')]\n",
      "Entities [('foreign', 'O')]\n",
      "Entities [('collaborator', 'O')]\n",
      "Entities [('unnerve', 'O')]\n",
      "Entities [('zoo', 'LOC')]\n",
      "Entities [('sing', 'O')]\n",
      "Entities [('technicolor', 'O')]\n",
      "Entities [('naturalist', 'O')]\n",
      "Entities [('oscar', 'PER')]\n",
      "Entities [('typography', 'O')]\n",
      "Entities [('warrior', 'O')]\n",
      "Entities [('script', 'O')]\n",
      "Entities [('robotics', 'CW')]\n",
      "Entities [('deceptive', 'O')]\n",
      "Entities [('secretary', 'PER')]\n",
      "Entities [('moose', 'O')]\n",
      "Entities [('alchemy', 'O')]\n",
      "Entities [('grumpy', 'O')]\n",
      "Entities [('newspaper', 'O')]\n",
      "Entities [('snuff', 'O')]\n",
      "Entities [('jeff', 'PER')]\n",
      "Entities [('utah', 'LOC')]\n",
      "Entities [('scent', 'O')]\n",
      "Entities [('postwar', 'O')]\n",
      "Entities [('treason', 'O')]\n",
      "Entities [('banana', 'O')]\n",
      "Entities [('pizza', 'CW')]\n",
      "Entities [('lapland', 'LOC')]\n",
      "Entities [('rock', 'PROD')]\n",
      "Entities [('endear', 'O')]\n",
      "Entities [('schmaltz', 'O')]\n",
      "Entities [('work', 'O')]\n",
      "Entities [('disobedience', 'O')]\n",
      "Entities [('bewitch', 'O')]\n",
      "Entities [('daredevil', 'O')]\n",
      "Entities [('docudrama', 'CW')]\n",
      "Entities [('unchallenging', 'O')]\n",
      "Entities [('captain', 'PER')]\n",
      "Entities [('firefly', 'O')]\n",
      "Entities [('automatic', 'O')]\n",
      "Entities [('astound', 'O')]\n",
      "Entities [('hooliganism', 'O')]\n",
      "Entities [('planning', 'O')]\n",
      "Entities [('ontario', 'LOC')]\n",
      "Entities [('sculpture', 'O')]\n",
      "Entities [('scrabble', 'O')]\n",
      "Entities [('conservatism', 'O')]\n",
      "Entities [('czech', 'LOC')]\n",
      "Entities [('lemur', 'O')]\n",
      "Entities [('rebellious', 'O')]\n",
      "Entities [('criticism', 'O')]\n",
      "Entities [('usn', 'CORP')]\n",
      "Entities [('vandalism', 'O')]\n",
      "Entities [('camera', 'O')]\n",
      "Entities [('mole', 'O')]\n",
      "Entities [('base', 'O')]\n",
      "Entities [('serbia', 'LOC')]\n",
      "Entities [('straightforward', 'O')]\n",
      "Entities [('repulsive', 'O')]\n",
      "Entities [('realtime', 'O')]\n",
      "Entities [('informative', 'O')]\n",
      "Entities [('yoga', 'O')]\n",
      "Entities [('observant', 'O')]\n",
      "Entities [('taxidermied', 'O')]\n",
      "Entities [('mormon', 'CORP')]\n",
      "Entities [('tobacco', 'O')]\n",
      "Entities [('jazz', 'O')]\n",
      "Entities [('technophobic', 'O')]\n",
      "Entities [('cyberman', 'O')]\n",
      "Entities [('blockade', 'O')]\n",
      "Entities [('speech', 'O')]\n",
      "Entities [('nonsense', 'O')]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Entities [('feel', 'O')]\n",
      "Entities [('dick', 'PER')]\n",
      "Entities [('organ', 'PROD')]\n",
      "Entities [('toon', 'O')]\n",
      "Entities [('malik', 'PER')]\n",
      "Entities [('rabbi', 'O')]\n",
      "Entities [('scout', 'O')]\n",
      "Entities [('pygmalion', 'PER')]\n",
      "Entities [('symbolic', 'O')]\n",
      "Entities [('beauty', 'CW')]\n",
      "Entities [('himalaya', 'LOC')]\n",
      "Entities [('giza', 'LOC')]\n",
      "Entities [('humanism', 'O')]\n",
      "Entities [('underground', 'LOC')]\n",
      "Entities [('travelogue', 'CW')]\n",
      "Entities [('originality', 'O')]\n",
      "Entities [('dull', 'O')]\n",
      "Entities [('dancer', 'PER')]\n",
      "Entities [('tropical', 'O')]\n",
      "Entities [('alabama', 'LOC')]\n",
      "Entities [('definitive', 'O')]\n",
      "Entities [('beef', 'O')]\n",
      "Entities [('radical', 'O')]\n",
      "Entities [('article', 'O')]\n",
      "Entities [('darwin', 'PER')]\n",
      "Entities [('fascinate', 'O')]\n",
      "Entities [('gandhi', 'LOC')]\n",
      "Entities [('warlord', 'O')]\n",
      "Entities [('cruise', 'O')]\n",
      "Entities [('lawsuit', 'O')]\n",
      "Entities [('university', 'O')]\n",
      "Entities [('epic', 'O')]\n",
      "Entities [('shadow', 'O')]\n",
      "Entities [('masculine', 'O')]\n",
      "Entities [('paratrooper', 'O')]\n",
      "Entities [('actress', 'PER')]\n",
      "Entities [('patricia', 'PER')]\n",
      "Entities [('location', 'LOC')]\n",
      "Entities [('ludditism', 'O')]\n",
      "Entities [('fellini', 'PER')]\n",
      "Entities [('photographer', 'PER')]\n",
      "Entities [('misguide', 'O')]\n",
      "Entities [('large', 'O')]\n",
      "Entities [('symbol', 'O')]\n",
      "Entities [('asian', 'LOC')]\n",
      "Entities [('guru', 'O')]\n",
      "Entities [('colombia', 'LOC')]\n",
      "Entities [('drive', 'O')]\n",
      "Entities [('bergman', 'CORP')]\n",
      "Entities [('dance', 'CW')]\n",
      "Entities [('bebop', 'CW')]\n",
      "Entities [('fall', 'O')]\n",
      "Entities [('old', 'O')]\n",
      "Entities [('resistance', 'O')]\n",
      "Entities [('ireland', 'LOC')]\n",
      "Entities [('lobectomy', 'O')]\n",
      "Entities [('brazilian', 'LOC')]\n",
      "Entities [('distrustful', 'O')]\n",
      "Entities [('sleeper', 'O')]\n",
      "Entities [('award', 'O')]\n",
      "Entities [('vocalist', 'PER')]\n",
      "Entities [('shot', 'O')]\n",
      "Entities [('dyslexia', 'O')]\n",
      "Entities [('dervish', 'PER')]\n",
      "Entities [('immoral', 'O')]\n",
      "Entities [('existentialist', 'PER')]\n",
      "Entities [('classical', 'O')]\n",
      "Entities [('perfectionist', 'O')]\n",
      "Entities [('bavaria', 'LOC')]\n",
      "Entities [('denmark', 'LOC')]\n",
      "Entities [('mechanic', 'O')]\n",
      "Entities [('moth', 'O')]\n",
      "Entities [('cop', 'PER')]\n",
      "Entities [('poky', 'O')]\n",
      "Entities [('buy', 'O')]\n",
      "Entities [('protective', 'O')]\n",
      "Entities [('complete', 'O')]\n",
      "Entities [('sale', 'O')]\n",
      "Entities [('lawlessness', 'O')]\n",
      "Entities [('guitarist', 'PER')]\n",
      "Entities [('birthday', 'O')]\n",
      "Entities [('montenegro', 'LOC')]\n",
      "Entities [('tunisia', 'LOC')]\n",
      "Entities [('destroyer', 'O')]\n",
      "Entities [('mastermind', 'PER')]\n",
      "Entities [('testosterone', 'O')]\n",
      "Entities [('savagely', 'O')]\n",
      "Entities [('mercy', 'O')]\n",
      "Entities [('subordination', 'O')]\n",
      "Entities [('oneliners', 'O')]\n",
      "Entities [('chimpanzee', 'O')]\n",
      "Entities [('cure', 'O')]\n",
      "Entities [('hasty', 'O')]\n",
      "Entities [('rebel', 'O')]\n",
      "Entities [('extraction', 'O')]\n",
      "Entities [('remorse', 'O')]\n",
      "Entities [('ballet', 'O')]\n",
      "Entities [('mirror', 'O')]\n",
      "Entities [('resilience', 'O')]\n",
      "Entities [('statistician', 'O')]\n",
      "Entities [('steak', 'O')]\n",
      "Entities [('economy', 'O')]\n",
      "Entities [('executive', 'O')]\n",
      "Entities [('pleasant', 'O')]\n",
      "Entities [('moses', 'PER')]\n",
      "Entities [('vivacious', 'O')]\n",
      "Entities [('roleplay', 'O')]\n",
      "Entities [('phd', 'O')]\n",
      "Entities [('infiltrates', 'O')]\n",
      "Entities [('madonna', 'PER')]\n",
      "Entities [('swedish', 'LOC')]\n",
      "Entities [('hate', 'O')]\n",
      "Entities [('extortion', 'O')]\n",
      "Entities [('queen', 'PER')]\n",
      "Entities [('karate', 'O')]\n",
      "Entities [('d', 'O')]\n",
      "Entities [('revival', 'O')]\n",
      "Entities [('burton', 'PER')]\n",
      "Entities [('plagiarism', 'O')]\n",
      "Entities [('gender', 'O')]\n",
      "Entities [('pedantic', 'O')]\n",
      "Entities [('rapper', 'PER')]\n",
      "Entities [('industrialist', 'PER')]\n",
      "Entities [('harrow', 'LOC')]\n",
      "Entities [('helmet', 'O')]\n",
      "Entities [('antichrist', 'PER')]\n",
      "Entities [('quartet', 'CW')]\n",
      "Entities [('dinosaur', 'O')]\n",
      "Entities [('gloomy', 'O')]\n",
      "Entities [('semiotic', 'O')]\n",
      "Entities [('arnold', 'PER')]\n",
      "Entities [('backdoor', 'O')]\n",
      "Entities [('yokohama', 'LOC')]\n",
      "Entities [('scenography', 'CW')]\n",
      "Entities [('ulcer', 'O')]\n",
      "Entities [('ai', 'O')]\n",
      "Entities [('darwinism', 'O')]\n",
      "Entities [('search', 'O')]\n",
      "Entities [('drought', 'O')]\n",
      "Entities [('pretty', 'O')]\n",
      "Entities [('victory', 'O')]\n",
      "Entities [('tacky', 'O')]\n",
      "Entities [('dumbfound', 'O')]\n",
      "Entities [('bet', 'O')]\n",
      "Entities [('silent', 'O')]\n",
      "Entities [('graduation', 'O')]\n",
      "Entities [('dumpling', 'O')]\n",
      "Entities [('broadway', 'LOC')]\n",
      "Entities [('executioner', 'PER')]\n",
      "Entities [('wedding', 'O')]\n",
      "Entities [('crosscultural', 'O')]\n",
      "Entities [('congressman', 'O')]\n",
      "Entities [('iranian', 'CW')]\n",
      "Entities [('bioterrorism', 'O')]\n",
      "Entities [('evangelist', 'PER')]\n",
      "Entities [('didactic', 'O')]\n",
      "Entities [('nirvana', 'O')]\n",
      "Entities [('indian', 'PER')]\n",
      "Entities [('bath', 'O')]\n",
      "Entities [('adorably', 'O')]\n",
      "Entities [('monastery', 'O')]\n",
      "Entities [('skate', 'O')]\n",
      "Entities [('sinatra', 'PER')]\n",
      "Entities [('preparation', 'O')]\n",
      "Entities [('court', 'LOC')]\n",
      "Entities [('opera', 'O')]\n",
      "Entities [('mug', 'O')]\n",
      "Entities [('misanthrope', 'O')]\n",
      "Entities [('random', 'O')]\n",
      "Entities [('matchmaker', 'O')]\n",
      "Entities [('confucian', 'O')]\n",
      "Entities [('lucas', 'PER')]\n",
      "Entities [('allusive', 'O')]\n",
      "Entities [('hollywood', 'LOC')]\n",
      "Entities [('illiteracy', 'O')]\n",
      "Entities [('mindfulness', 'O')]\n",
      "Entities [('lyric', 'CW')]\n",
      "Entities [('paramount', 'O')]\n",
      "Entities [('triplet', 'O')]\n",
      "Entities [('indigenous', 'O')]\n",
      "Entities [('penthouse', 'O')]\n",
      "Entities [('fictional', 'O')]\n",
      "Entities [('migration', 'O')]\n",
      "Entities [('streetcar', 'O')]\n",
      "Entities [('subconsciousness', 'O')]\n",
      "Entities [('nightlife', 'O')]\n",
      "Entities [('buddha', 'PER')]\n",
      "Entities [('rocket', 'O')]\n",
      "Entities [('guy', 'PER')]\n",
      "Entities [('moralistic', 'O')]\n",
      "Entities [('saint', 'O')]\n",
      "Entities [('mosaic', 'O')]\n",
      "Entities [('scathing', 'O')]\n",
      "Entities [('sicken', 'O')]\n",
      "Entities [('gang', 'O')]\n",
      "Entities [('australian', 'O')]\n",
      "Entities [('pathetic', 'O')]\n",
      "Entities [('montana', 'LOC')]\n",
      "Entities [('screenplay', 'CW')]\n",
      "Entities [('techno', 'PROD')]\n",
      "Entities [('insubstantial', 'O')]\n",
      "Entities [('dialog', 'O')]\n",
      "Entities [('batman', 'CW')]\n",
      "Entities [('wilson', 'PER')]\n",
      "Entities [('christine', 'PER')]\n",
      "Entities [('nightclub', 'LOC')]\n",
      "Entities [('marathon', 'PROD')]\n",
      "Entities [('piracy', 'O')]\n",
      "Entities [('desperation', 'O')]\n",
      "Entities [('pale', 'O')]\n",
      "Entities [('volcano', 'O')]\n",
      "Entities [('painterly', 'O')]\n",
      "Entities [('psychedelic', 'O')]\n",
      "Entities [('commentary', 'CW')]\n",
      "Entities [('anachronism', 'CW')]\n",
      "Entities [('venice', 'LOC')]\n",
      "Entities [('ramayana', 'CW')]\n",
      "Entities [('sapp', 'O')]\n",
      "Entities [('theatre', 'LOC')]\n",
      "Entities [('gaia', 'PER')]\n",
      "Entities [('titanic', 'CW')]\n",
      "Entities [('woody', 'O')]\n",
      "Entities [('jerusalem', 'LOC')]\n",
      "Entities [('brilliance', 'O')]\n",
      "Entities [('hemingway', 'PER')]\n",
      "Entities [('chicken', 'O')]\n",
      "Entities [('rap', 'CW')]\n",
      "Entities [('dvd', 'CW')]\n",
      "Entities [('hitler', 'PER')]\n",
      "Entities [('cisco', 'CORP')]\n",
      "Entities [('cinematography', 'CW')]\n",
      "Entities [('abstract', 'O')]\n",
      "Entities [('hurricane', 'O')]\n",
      "Entities [('neighbour', 'O')]\n",
      "Entities [('parachute', 'O')]\n",
      "Entities [('confound', 'O')]\n",
      "Entities [('trigger', 'O')]\n",
      "Entities [('radar', 'O')]\n",
      "Entities [('generous', 'O')]\n",
      "Entities [('incredible', 'O')]\n",
      "Entities [('flirt', 'O')]\n",
      "Entities [('kenya', 'LOC')]\n",
      "Entities [('humanistic', 'O')]\n",
      "Entities [('trash', 'O')]\n",
      "Entities [('therapy', 'O')]\n",
      "Entities [('undertaken', 'O')]\n",
      "Entities [('south-central', 'LOC')]\n",
      "Entities [('quebec', 'LOC')]\n",
      "Entities [('cafe', 'O')]\n",
      "Entities [('f', 'O')]\n",
      "Entities [('irrelevant', 'O')]\n",
      "Entities [('hamlet', 'O')]\n",
      "Entities [('individualism', 'O')]\n",
      "Entities [('unclear', 'O')]\n",
      "Entities [('gymnastics', 'O')]\n",
      "Entities [('selfsufficiency', 'O')]\n",
      "Entities [('paycheck', 'O')]\n",
      "Entities [('blockbuster', 'PROD')]\n",
      "Entities [('veterinarian', 'O')]\n",
      "Entities [('plotter', 'CW')]\n",
      "Entities [('deathbed', 'O')]\n",
      "Entities [('mafia', 'PER')]\n",
      "Entities [('bos', 'O')]\n",
      "Entities [('redistribution', 'O')]\n",
      "Entities [('dostoyevsky', 'PER')]\n",
      "Entities [('shower', 'O')]\n",
      "Entities [('mood', 'O')]\n",
      "Entities [('virgin', 'O')]\n",
      "Entities [('taiwan', 'LOC')]\n",
      "Entities [('ludicrously', 'O')]\n",
      "Entities [('provence', 'LOC')]\n",
      "Entities [('norway', 'LOC')]\n",
      "Entities [('english', 'O')]\n",
      "Entities [('wit', 'O')]\n",
      "Entities [('movie', 'CW')]\n",
      "Entities [('entitlement', 'O')]\n",
      "Entities [('emptiness', 'O')]\n",
      "Entities [('environmentalist', 'O')]\n",
      "Entities [('uniform', 'O')]\n",
      "Entities [('training', 'O')]\n",
      "Entities [('ambiance', 'O')]\n",
      "Entities [('r', 'O')]\n",
      "Entities [('pulp', 'CW')]\n",
      "Entities [('asia', 'LOC')]\n",
      "Entities [('nativity', 'O')]\n",
      "Entities [('allegation', 'O')]\n",
      "Entities [('clock', 'O')]\n",
      "Entities [('flaw', 'O')]\n",
      "Entities [('tokyo', 'LOC')]\n",
      "Entities [('whitewater', 'O')]\n",
      "Entities [('choreography', 'O')]\n",
      "Entities [('great', 'O')]\n",
      "Entities [('coolness', 'O')]\n",
      "Entities [('counterfeit', 'O')]\n",
      "Entities [('hopeful', 'O')]\n",
      "Entities [('train', 'O')]\n",
      "Entities [('protest', 'O')]\n",
      "Entities [('sensuality', 'O')]\n",
      "Entities [('oman', 'LOC')]\n",
      "Entities [('bluegrass', 'O')]\n",
      "Entities [('rebirth', 'O')]\n",
      "Entities [('growth', 'O')]\n",
      "Entities [('marxism', 'O')]\n",
      "Entities [('extraordinary', 'O')]\n",
      "Entities [('herman', 'PER')]\n",
      "Entities [('lovely', 'O')]\n",
      "Entities [('bowdlerize', 'O')]\n",
      "Entities [('website', 'O')]\n",
      "Entities [('bagpipe', 'PROD')]\n",
      "Entities [('ect', 'O')]\n",
      "Entities [('rescue', 'O')]\n",
      "Entities [('outdoor', 'O')]\n",
      "Entities [('bengal', 'LOC')]\n"
     ]
    }
   ],
   "source": [
    "for text, _ in TRAIN_DATA:\n",
    "    doc = nlp(text)\n",
    "    print('Entities', [(ent.text, ent.label_) for ent in doc.ents])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 50,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Loading from ../dataset/ner_output\n",
      "Accuracy on validation data: 80.46%\n"
     ]
    }
   ],
   "source": [
    "# Load the trained model\n",
    "if output_dir:\n",
    "    print(\"Loading from\", output_dir)\n",
    "    nlp = spacy.load(output_dir)\n",
    "\n",
    "# Extract tags from valid_df that are not in the training data\n",
    "train_tags = {item[0] for item in TRAIN_DATA}\n",
    "validation_data = valid_df[~valid_df['tag'].isin(train_tags)]\n",
    "\n",
    "# Initialize counters for total and correct predictions\n",
    "total_predictions = 0\n",
    "correct_predictions = 0\n",
    "\n",
    "# Iterate through the validation data and compare predictions with actual labels\n",
    "for _, row in validation_data.iterrows():\n",
    "    doc = nlp(row['tag'])\n",
    "    \n",
    "    # Check if there's an entity prediction and if it matches the label\n",
    "    if doc.ents:\n",
    "        predicted_label = doc.ents[0].label_\n",
    "        if predicted_label == row['ner_label']:\n",
    "            correct_predictions += 1\n",
    "    else:\n",
    "        if row['ner_label'] == 'O':  # 'O' is typically used for \"Outside any entity\"\n",
    "            correct_predictions += 1\n",
    "    total_predictions += 1\n",
    "\n",
    "# Calculate accuracy\n",
    "accuracy = correct_predictions / total_predictions * 100\n",
    "print(f\"Accuracy on validation data: {accuracy:.2f}%\")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 51,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1\n"
     ]
    }
   ],
   "source": [
    "# check for nan values and drop\n",
    "print(words['tag'].isna().sum())\n",
    "\n",
    "words = words.dropna(subset=['tag'])\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 52,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/var/folders/tk/x3sjpph95kz4ghcssq1py2zc0000gn/T/ipykernel_68855/3238962201.py:10: SettingWithCopyWarning: \n",
      "A value is trying to be set on a copy of a slice from a DataFrame.\n",
      "Try using .loc[row_indexer,col_indexer] = value instead\n",
      "\n",
      "See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n",
      "  words['ner_model'] = words['tag'].apply(get_entities)\n"
     ]
    }
   ],
   "source": [
    "### Loading the model and running on the rest of the words\n",
    "model_path = \"../dataset/ner_output/\"\n",
    "nlp = spacy.load(model_path)\n",
    "\n",
    "def get_entities(text):\n",
    "    doc = nlp(text)\n",
    "    return [(ent.text, ent.label_) for ent in doc.ents]\n",
    "\n",
    "# Apply the model to the 'tag' column\n",
    "words['ner_model'] = words['tag'].apply(get_entities)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### POS Tagging\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Get the un-lemmatised version of the tags"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 53,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tag</th>\n",
       "      <th>un-lemmatised</th>\n",
       "      <th>glove_vec</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>s</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[0.18209, 0.88297, -0.49805, 0.53137, -0.36084...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>action</td>\n",
       "      <td>action</td>\n",
       "      <td>[0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>twist</td>\n",
       "      <td>twist</td>\n",
       "      <td>[-0.095859, -0.17472, -0.034692, -0.37307, 0.3...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>overrate</td>\n",
       "      <td>overrated</td>\n",
       "      <td>[0.28151, -0.42171, -0.38275, 0.15364, -0.7648...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>violent</td>\n",
       "      <td>violent</td>\n",
       "      <td>[0.13693, 0.1856, -0.65335, -0.50922, -0.18431...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50110</th>\n",
       "      <td>static</td>\n",
       "      <td>static</td>\n",
       "      <td>[0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50139</th>\n",
       "      <td>repeat</td>\n",
       "      <td>repeating</td>\n",
       "      <td>[0.48671, 0.93464, -0.015418, -0.46056, -0.152...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50142</th>\n",
       "      <td>seal</td>\n",
       "      <td>seals</td>\n",
       "      <td>[-0.35434, 0.51161, -0.086652, -0.23459, 0.435...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50176</th>\n",
       "      <td>counterespionage</td>\n",
       "      <td>counterespionage</td>\n",
       "      <td>[0.11309, -0.8528, -0.25529, 0.02635, -0.30105...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50189</th>\n",
       "      <td>image</td>\n",
       "      <td>image</td>\n",
       "      <td>[0.011091, 0.48461, 0.019142, 0.083725, 0.5027...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>3084 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                    tag     un-lemmatised  \\\n",
       "0                     s               NaN   \n",
       "1                action            action   \n",
       "2                 twist             twist   \n",
       "4              overrate         overrated   \n",
       "5               violent           violent   \n",
       "...                 ...               ...   \n",
       "50110            static            static   \n",
       "50139            repeat         repeating   \n",
       "50142              seal             seals   \n",
       "50176  counterespionage  counterespionage   \n",
       "50189             image             image   \n",
       "\n",
       "                                               glove_vec  \n",
       "0      [0.18209, 0.88297, -0.49805, 0.53137, -0.36084...  \n",
       "1      [0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...  \n",
       "2      [-0.095859, -0.17472, -0.034692, -0.37307, 0.3...  \n",
       "4      [0.28151, -0.42171, -0.38275, 0.15364, -0.7648...  \n",
       "5      [0.13693, 0.1856, -0.65335, -0.50922, -0.18431...  \n",
       "...                                                  ...  \n",
       "50110  [0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...  \n",
       "50139  [0.48671, 0.93464, -0.015418, -0.46056, -0.152...  \n",
       "50142  [-0.35434, 0.51161, -0.086652, -0.23459, 0.435...  \n",
       "50176  [0.11309, -0.8528, -0.25529, 0.02635, -0.30105...  \n",
       "50189  [0.011091, 0.48461, 0.019142, 0.083725, 0.5027...  \n",
       "\n",
       "[3084 rows x 3 columns]"
      ]
     },
     "execution_count": 53,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "words_ul"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 54,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "[nltk_data] Downloading package treebank to /Users/jiayi/nltk_data...\n",
      "[nltk_data]   Unzipping corpora/treebank.zip.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Percentage of words covered by Penn Treebank: 25.84%\n"
     ]
    }
   ],
   "source": [
    "import nltk\n",
    "import pandas as pd\n",
    "from sklearn.model_selection import train_test_split\n",
    "\n",
    "# Load your words dataframe\n",
    "# (assuming you already have it loaded; if not, adjust the loading method)\n",
    "# words = pd.read_csv(\"path_to_your_dataframe.csv\")\n",
    "\n",
    "# Load Penn Treebank dataset\n",
    "nltk.download(\"treebank\")\n",
    "from nltk.corpus import treebank\n",
    "\n",
    "# Extract words from Penn Treebank\n",
    "ptb_words = set(word for word, _ in treebank.tagged_words())\n",
    "\n",
    "# Split words into train, test, and validation sets (80%, 10%, 10%)\n",
    "all_words = list(ptb_words)\n",
    "train_words, temp_words = train_test_split(all_words, test_size=0.2, random_state=42)\n",
    "test_words, val_words = train_test_split(temp_words, test_size=0.5, random_state=42)\n",
    "\n",
    "# Check percentage of words from your dataframe covered by Penn Treebank\n",
    "your_words = set(words_ul['un-lemmatised'])\n",
    "covered_words = your_words.intersection(ptb_words)\n",
    "coverage_percentage = (len(covered_words) / len(your_words)) * 100\n",
    "\n",
    "print(f\"Percentage of words covered by Penn Treebank: {coverage_percentage:.2f}%\")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 55,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "[nltk_data] Downloading package brown to /Users/jiayi/nltk_data...\n",
      "[nltk_data]   Unzipping corpora/brown.zip.\n"
     ]
    }
   ],
   "source": [
    "import nltk\n",
    "from nltk.corpus import brown\n",
    "nltk.download('brown')\n",
    "brown_tagged_words = brown.tagged_words(categories='news')  # You can choose a specific category or use all\n",
    "brown_words, brown_tags = zip(*brown_tagged_words)\n",
    "\n",
    "from sklearn.model_selection import train_test_split\n",
    "\n",
    "# Splitting into train and temporary set (80/20)\n",
    "train_temp, test_set = train_test_split(list(zip(brown_words, brown_tags)), test_size=0.2, random_state=42)\n",
    "\n",
    "# Splitting the temporary set into test and validation (50/50)\n",
    "train_set, valid_set = train_test_split(train_temp, test_size=0.5, random_state=42)\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Running this again however with a bigger set of words we get:\n",
    "- by just reading in the tags_full, then renaming the dataframes in above code blocks - saves repetition of code\n",
    "- need to remove duplicates "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 56,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tag</th>\n",
       "      <th>un-lemmatised</th>\n",
       "      <th>glove_vec</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>s</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[0.18209, 0.88297, -0.49805, 0.53137, -0.36084...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>action</td>\n",
       "      <td>action</td>\n",
       "      <td>[0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>twist</td>\n",
       "      <td>twist</td>\n",
       "      <td>[-0.095859, -0.17472, -0.034692, -0.37307, 0.3...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>overrate</td>\n",
       "      <td>overrated</td>\n",
       "      <td>[0.28151, -0.42171, -0.38275, 0.15364, -0.7648...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>violent</td>\n",
       "      <td>violent</td>\n",
       "      <td>[0.13693, 0.1856, -0.65335, -0.50922, -0.18431...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50110</th>\n",
       "      <td>static</td>\n",
       "      <td>static</td>\n",
       "      <td>[0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50139</th>\n",
       "      <td>repeat</td>\n",
       "      <td>repeating</td>\n",
       "      <td>[0.48671, 0.93464, -0.015418, -0.46056, -0.152...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50142</th>\n",
       "      <td>seal</td>\n",
       "      <td>seals</td>\n",
       "      <td>[-0.35434, 0.51161, -0.086652, -0.23459, 0.435...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50176</th>\n",
       "      <td>counterespionage</td>\n",
       "      <td>counterespionage</td>\n",
       "      <td>[0.11309, -0.8528, -0.25529, 0.02635, -0.30105...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50189</th>\n",
       "      <td>image</td>\n",
       "      <td>image</td>\n",
       "      <td>[0.011091, 0.48461, 0.019142, 0.083725, 0.5027...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>3084 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                    tag     un-lemmatised  \\\n",
       "0                     s               NaN   \n",
       "1                action            action   \n",
       "2                 twist             twist   \n",
       "4              overrate         overrated   \n",
       "5               violent           violent   \n",
       "...                 ...               ...   \n",
       "50110            static            static   \n",
       "50139            repeat         repeating   \n",
       "50142              seal             seals   \n",
       "50176  counterespionage  counterespionage   \n",
       "50189             image             image   \n",
       "\n",
       "                                               glove_vec  \n",
       "0      [0.18209, 0.88297, -0.49805, 0.53137, -0.36084...  \n",
       "1      [0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...  \n",
       "2      [-0.095859, -0.17472, -0.034692, -0.37307, 0.3...  \n",
       "4      [0.28151, -0.42171, -0.38275, 0.15364, -0.7648...  \n",
       "5      [0.13693, 0.1856, -0.65335, -0.50922, -0.18431...  \n",
       "...                                                  ...  \n",
       "50110  [0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...  \n",
       "50139  [0.48671, 0.93464, -0.015418, -0.46056, -0.152...  \n",
       "50142  [-0.35434, 0.51161, -0.086652, -0.23459, 0.435...  \n",
       "50176  [0.11309, -0.8528, -0.25529, 0.02635, -0.30105...  \n",
       "50189  [0.011091, 0.48461, 0.019142, 0.083725, 0.5027...  \n",
       "\n",
       "[3084 rows x 3 columns]"
      ]
     },
     "execution_count": 56,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "words_ul"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Applying spaCy POS tagging"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 61,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Collecting en-core-web-sm==3.7.1\n",
      "  Downloading https://github.com/explosion/spacy-models/releases/download/en_core_web_sm-3.7.1/en_core_web_sm-3.7.1-py3-none-any.whl (12.8 MB)\n",
      "\u001B[2K     \u001B[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001B[0m \u001B[32m12.8/12.8 MB\u001B[0m \u001B[31m6.7 MB/s\u001B[0m eta \u001B[36m0:00:00\u001B[0ma \u001B[36m0:00:01\u001B[0m\n",
      "\u001B[?25hRequirement already satisfied: spacy<3.8.0,>=3.7.2 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from en-core-web-sm==3.7.1) (3.7.6)\n",
      "Requirement already satisfied: spacy-legacy<3.1.0,>=3.0.11 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (3.0.12)\n",
      "Requirement already satisfied: spacy-loggers<2.0.0,>=1.0.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (1.0.5)\n",
      "Requirement already satisfied: murmurhash<1.1.0,>=0.28.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (1.0.10)\n",
      "Requirement already satisfied: cymem<2.1.0,>=2.0.2 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2.0.8)\n",
      "Requirement already satisfied: preshed<3.1.0,>=3.0.2 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (3.0.9)\n",
      "Requirement already satisfied: thinc<8.3.0,>=8.2.2 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (8.2.5)\n",
      "Requirement already satisfied: wasabi<1.2.0,>=0.9.1 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (1.1.3)\n",
      "Requirement already satisfied: srsly<3.0.0,>=2.4.3 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2.4.8)\n",
      "Requirement already satisfied: catalogue<2.1.0,>=2.0.6 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2.0.10)\n",
      "Requirement already satisfied: weasel<0.5.0,>=0.1.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (0.4.1)\n",
      "Requirement already satisfied: typer<1.0.0,>=0.3.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (0.12.4)\n",
      "Requirement already satisfied: tqdm<5.0.0,>=4.38.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (4.65.0)\n",
      "Requirement already satisfied: requests<3.0.0,>=2.13.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2.31.0)\n",
      "Requirement already satisfied: pydantic!=1.8,!=1.8.1,<3.0.0,>=1.7.4 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (1.10.8)\n",
      "Requirement already satisfied: jinja2 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (3.1.2)\n",
      "Requirement already satisfied: setuptools in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (68.0.0)\n",
      "Requirement already satisfied: packaging>=20.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (23.1)\n",
      "Requirement already satisfied: langcodes<4.0.0,>=3.2.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (3.4.0)\n",
      "Requirement already satisfied: numpy>=1.19.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (1.24.3)\n",
      "Requirement already satisfied: language-data>=1.2 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from langcodes<4.0.0,>=3.2.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (1.2.0)\n",
      "Requirement already satisfied: typing-extensions>=4.2.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from pydantic!=1.8,!=1.8.1,<3.0.0,>=1.7.4->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (4.12.2)\n",
      "Requirement already satisfied: charset-normalizer<4,>=2 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from requests<3.0.0,>=2.13.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2.0.4)\n",
      "Requirement already satisfied: idna<4,>=2.5 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from requests<3.0.0,>=2.13.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (3.4)\n",
      "Requirement already satisfied: urllib3<3,>=1.21.1 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from requests<3.0.0,>=2.13.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (1.26.16)\n",
      "Requirement already satisfied: certifi>=2017.4.17 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from requests<3.0.0,>=2.13.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2024.2.2)\n",
      "Requirement already satisfied: blis<0.8.0,>=0.7.8 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from thinc<8.3.0,>=8.2.2->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (0.7.11)\n",
      "Requirement already satisfied: confection<1.0.0,>=0.0.1 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from thinc<8.3.0,>=8.2.2->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (0.1.5)\n",
      "Requirement already satisfied: click>=8.0.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from typer<1.0.0,>=0.3.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (8.1.7)\n",
      "Requirement already satisfied: shellingham>=1.3.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from typer<1.0.0,>=0.3.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (1.5.4)\n",
      "Requirement already satisfied: rich>=10.11.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from typer<1.0.0,>=0.3.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (13.7.1)\n",
      "Requirement already satisfied: cloudpathlib<1.0.0,>=0.7.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from weasel<0.5.0,>=0.1.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (0.18.1)\n",
      "Requirement already satisfied: smart-open<8.0.0,>=5.2.1 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from weasel<0.5.0,>=0.1.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (5.2.1)\n",
      "Requirement already satisfied: MarkupSafe>=2.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from jinja2->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2.1.1)\n",
      "Requirement already satisfied: marisa-trie>=0.7.7 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from language-data>=1.2->langcodes<4.0.0,>=3.2.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (1.2.0)\n",
      "Requirement already satisfied: markdown-it-py>=2.2.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from rich>=10.11.0->typer<1.0.0,>=0.3.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2.2.0)\n",
      "Requirement already satisfied: pygments<3.0.0,>=2.13.0 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from rich>=10.11.0->typer<1.0.0,>=0.3.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2.15.1)\n",
      "Requirement already satisfied: mdurl~=0.1 in /Users/jiayi/anaconda3/lib/python3.11/site-packages (from markdown-it-py>=2.2.0->rich>=10.11.0->typer<1.0.0,>=0.3.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (0.1.0)\n",
      "Installing collected packages: en-core-web-sm\n",
      "Successfully installed en-core-web-sm-3.7.1\n",
      "\u001B[38;5;2m✔ Download and installation successful\u001B[0m\n",
      "You can now load the package via spacy.load('en_core_web_sm')\n",
      "                    tag     un-lemmatised  \\\n",
      "0                     s               NaN   \n",
      "1                action            action   \n",
      "2                 twist             twist   \n",
      "4              overrate         overrated   \n",
      "5               violent           violent   \n",
      "...                 ...               ...   \n",
      "50110            static            static   \n",
      "50139            repeat         repeating   \n",
      "50142              seal             seals   \n",
      "50176  counterespionage  counterespionage   \n",
      "50189             image             image   \n",
      "\n",
      "                                               glove_vec    POS  \n",
      "0      [0.18209, 0.88297, -0.49805, 0.53137, -0.36084...  PROPN  \n",
      "1      [0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...   NOUN  \n",
      "2      [-0.095859, -0.17472, -0.034692, -0.37307, 0.3...   NOUN  \n",
      "4      [0.28151, -0.42171, -0.38275, 0.15364, -0.7648...   VERB  \n",
      "5      [0.13693, 0.1856, -0.65335, -0.50922, -0.18431...    ADJ  \n",
      "...                                                  ...    ...  \n",
      "50110  [0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...   NOUN  \n",
      "50139  [0.48671, 0.93464, -0.015418, -0.46056, -0.152...   VERB  \n",
      "50142  [-0.35434, 0.51161, -0.086652, -0.23459, 0.435...   NOUN  \n",
      "50176  [0.11309, -0.8528, -0.25529, 0.02635, -0.30105...   NOUN  \n",
      "50189  [0.011091, 0.48461, 0.019142, 0.083725, 0.5027...   NOUN  \n",
      "\n",
      "[3084 rows x 4 columns]\n"
     ]
    }
   ],
   "source": [
    "import spacy\n",
    "import pandas as pd\n",
    "\n",
    "# Initialize spaCy model\n",
    "!python -m spacy download en_core_web_sm\n",
    "nlp = spacy.load(\"en_core_web_sm\")\n",
    "\n",
    "\n",
    "\n",
    "# Function to get POS tags\n",
    "def get_pos_tag(word):\n",
    "    word = str(word)\n",
    "    doc = nlp(word)\n",
    "    return doc[0].pos_ if doc else None\n",
    "\n",
    "# Apply function to DataFrame\n",
    "words_ul[\"POS\"] = words_ul[\"un-lemmatised\"].apply(get_pos_tag)\n",
    "\n",
    "print(words_ul)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 62,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tag</th>\n",
       "      <th>un-lemmatised</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>POS</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>s</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[0.18209, 0.88297, -0.49805, 0.53137, -0.36084...</td>\n",
       "      <td>PROPN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>action</td>\n",
       "      <td>action</td>\n",
       "      <td>[0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...</td>\n",
       "      <td>NOUN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>twist</td>\n",
       "      <td>twist</td>\n",
       "      <td>[-0.095859, -0.17472, -0.034692, -0.37307, 0.3...</td>\n",
       "      <td>NOUN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>overrate</td>\n",
       "      <td>overrated</td>\n",
       "      <td>[0.28151, -0.42171, -0.38275, 0.15364, -0.7648...</td>\n",
       "      <td>VERB</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>violent</td>\n",
       "      <td>violent</td>\n",
       "      <td>[0.13693, 0.1856, -0.65335, -0.50922, -0.18431...</td>\n",
       "      <td>ADJ</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50110</th>\n",
       "      <td>static</td>\n",
       "      <td>static</td>\n",
       "      <td>[0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...</td>\n",
       "      <td>NOUN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50139</th>\n",
       "      <td>repeat</td>\n",
       "      <td>repeating</td>\n",
       "      <td>[0.48671, 0.93464, -0.015418, -0.46056, -0.152...</td>\n",
       "      <td>VERB</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50142</th>\n",
       "      <td>seal</td>\n",
       "      <td>seals</td>\n",
       "      <td>[-0.35434, 0.51161, -0.086652, -0.23459, 0.435...</td>\n",
       "      <td>NOUN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50176</th>\n",
       "      <td>counterespionage</td>\n",
       "      <td>counterespionage</td>\n",
       "      <td>[0.11309, -0.8528, -0.25529, 0.02635, -0.30105...</td>\n",
       "      <td>NOUN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50189</th>\n",
       "      <td>image</td>\n",
       "      <td>image</td>\n",
       "      <td>[0.011091, 0.48461, 0.019142, 0.083725, 0.5027...</td>\n",
       "      <td>NOUN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>3084 rows × 4 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                    tag     un-lemmatised  \\\n",
       "0                     s               NaN   \n",
       "1                action            action   \n",
       "2                 twist             twist   \n",
       "4              overrate         overrated   \n",
       "5               violent           violent   \n",
       "...                 ...               ...   \n",
       "50110            static            static   \n",
       "50139            repeat         repeating   \n",
       "50142              seal             seals   \n",
       "50176  counterespionage  counterespionage   \n",
       "50189             image             image   \n",
       "\n",
       "                                               glove_vec    POS  \n",
       "0      [0.18209, 0.88297, -0.49805, 0.53137, -0.36084...  PROPN  \n",
       "1      [0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...   NOUN  \n",
       "2      [-0.095859, -0.17472, -0.034692, -0.37307, 0.3...   NOUN  \n",
       "4      [0.28151, -0.42171, -0.38275, 0.15364, -0.7648...   VERB  \n",
       "5      [0.13693, 0.1856, -0.65335, -0.50922, -0.18431...    ADJ  \n",
       "...                                                  ...    ...  \n",
       "50110  [0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...   NOUN  \n",
       "50139  [0.48671, 0.93464, -0.015418, -0.46056, -0.152...   VERB  \n",
       "50142  [-0.35434, 0.51161, -0.086652, -0.23459, 0.435...   NOUN  \n",
       "50176  [0.11309, -0.8528, -0.25529, 0.02635, -0.30105...   NOUN  \n",
       "50189  [0.011091, 0.48461, 0.019142, 0.083725, 0.5027...   NOUN  \n",
       "\n",
       "[3084 rows x 4 columns]"
      ]
     },
     "execution_count": 62,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "words_ul"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Evaluating results of POS Tagging - Manual"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 63,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAA1sAAAIjCAYAAAD1OgEdAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjguMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/H5lhTAAAACXBIWXMAAA9hAAAPYQGoP6dpAABZvklEQVR4nO3deVgVdf//8ddBBAQFXEFKcd9NS0vRLE0Sl8ytkiJFI+0uNPfSW3NrcancyiXLREvNrDS1WxNXKklNI8tcqMwlBDQV3BWY3x/+mK9HUBEYD8vzcV1zXZ7PfGbmPcNwDi9n5nNshmEYAgAAAADkKidHFwAAAAAABRFhCwAAAAAsQNgCAAAAAAsQtgAAAADAAoQtAAAAALAAYQsAAAAALEDYAgAAAAALELYAAAAAwAKELQAAAACwAGELAJCnjB07Vjab7Y5sq2XLlmrZsqX5evPmzbLZbPriiy/uyPZ79eqlSpUq3ZFtZdfZs2f1/PPPy9fXVzabTQMHDnR0SQCQbxC2ABQ6ERERstlsmU7Dhw93dHkFyvXH2s3NTX5+fgoKCtKMGTN05syZXNlOXFycxo4dq5iYmFxZX27Ky7VlxVtvvaWIiAi9+OKL+uSTT9SjR48b9q1UqZLdz7tcuXJq0aKFli9fnqGvYRj65JNP9NBDD8nb21vu7u6qX7++xo8fr3PnzmXon5aWpoULF6pJkyYqVaqUSpQooRo1aqhnz5768ccfb1hTr169bvj7fu3Uq1evbB0fALgZZ0cXAACOMn78eFWuXNmurV69eg6qpmBLP9ZXrlxRfHy8Nm/erIEDB2rKlClauXKl7rnnHrPvqFGjbjv0xsXFady4capUqZIaNmyY5eXWrVt3W9vJjpvV9uGHHyotLc3yGnJi48aNatq0qcaMGZOl/g0bNtSQIUMkXd33Dz74QF27dtXs2bP1n//8R5KUmpqqZ555Rp9//rlatGihsWPHyt3dXd99953GjRunZcuWaf369fLx8THX+/LLL2vmzJnq1KmTQkJC5OzsrP3792vNmjWqUqWKmjZtmmk9L7zwggIDA83XBw8e1OjRo9W3b1+1aNHCbK9ateptHxsAuCUDAAqZ+fPnG5KMHTt2ZHmZCxcuGKmpqRZWVTDd7Fhv2LDBKFasmOHv72+cP38+R9vZsWOHIcmYP39+lvqfO3cu0/ZNmzYZkoxly5blqJ6c1JbXVK5c2ejQoUOW+vr7+2foe+zYMcPDw8OoUaOG2fbWW28ZkoyhQ4dmWMfKlSsNJycno23btmZbfHy8YbPZjD59+mTon5aWZiQkJGR1d/L9zwNA/sJthABwnfTndj777DONGjVKd911l9zd3ZWcnCxJ2rZtm9q2bSsvLy+5u7vr4Ycf1g8//JBhPd9//73uv/9+ubm5qWrVqvrggw8yPI/0999/y2azKSIiIsPyNptNY8eOtWv7559/9Nxzz8nHx0eurq6qW7euPv7440zr//zzz/Xmm2/q7rvvlpubm1q3bq0//vgjw3a2bdum9u3bq2TJkvLw8NA999yj6dOnS5Lmz58vm82mn3/+OcNyb731looUKaJ//vnnlsc0M4888ohee+01HTp0SJ9++qnZntkzW5GRkXrwwQfl7e2t4sWLq2bNmvrvf/9r7u/9998vSerdu7d5W1j6MW3ZsqXq1aunnTt36qGHHpK7u7u57PXPbKVLTU3Vf//7X/n6+srDw0OPP/64jhw5YtenUqVKmd56du06b1VbZs9snTt3TkOGDFGFChXk6uqqmjVr6p133pFhGHb9bDab+vXrpxUrVqhevXrm+bB27drMD/h1EhMTFRYWJh8fH7m5ualBgwZasGCBOT/9PDp48KC++eYbs/a///47S+tP5+vrq9q1a+vgwYOSpAsXLujtt99WjRo1NGHChAz9O3bsqNDQUK1du9a8PfDgwYMyDEPNmzfP0D/9dsWc2L17t3r16qUqVarIzc1Nvr6+eu655/Tvv/9m6Lt582Y1btz4pr/X0s3PWQCFB7cRAii0kpKSdOLECbu2MmXKmP9+/fXX5eLioqFDh+rSpUtycXHRxo0b1a5dOzVq1EhjxoyRk5OT5s+fr0ceeUTfffedHnjgAUnSr7/+qjZt2qhs2bIaO3asUlJSNGbMGLvbom5XQkKCmjZtav6RXbZsWa1Zs0ZhYWFKTk7OMHDBxIkT5eTkpKFDhyopKUmTJ09WSEiItm3bZvaJjIzUY489pvLly2vAgAHy9fXV3r17tXr1ag0YMEBPPPGEwsPDtWjRIt17771261+0aJFatmypu+66K9v71KNHD/33v//VunXr1KdPn0z77NmzR4899pjuuecejR8/Xq6urvrjjz/MgFu7dm2NHz8+w61hzZo1M9fx77//ql27dgoODtazzz57y5/Dm2++KZvNpldffVWJiYmaNm2aAgMDFRMTo2LFimV5/7JS27UMw9Djjz+uTZs2KSwsTA0bNtS3336rYcOG6Z9//tHUqVPt+n///ff66quv9NJLL6lEiRKaMWOGunXrpsOHD6t06dI3rOvChQtq2bKl/vjjD/Xr10+VK1fWsmXL1KtXL50+fVoDBgxQ7dq19cknn2jQoEG6++67zVsDy5Ytm+X9l6QrV67oyJEjZj3ff/+9Tp06pQEDBsjZOfM/Q3r27Kn58+dr9erVatq0qfz9/SVJy5Yt05NPPil3d/fbquFWIiMj9ddff6l3797y9fXVnj17NHfuXO3Zs0c//vijGaR+/vlntW3bVuXLl9e4ceOUmpqq8ePHZzgmtzpnARQiDr6yBgB3XPqtbZlNhvF/t5JVqVLF7va2tLQ0o3r16kZQUJCRlpZmtp8/f96oXLmy8eijj5ptnTt3Ntzc3IxDhw6Zbb///rtRpEgR49q33oMHD97wliZJxpgxY8zXYWFhRvny5Y0TJ07Y9QsODja8vLzMWtPrr127tnHp0iWz3/Tp0w1Jxq+//moYhmGkpKQYlStXNvz9/Y1Tp07ZrfPa/Xv66acNPz8/u9sod+3alaVbsbJyy6aXl5dx7733mq/HjBljd4ymTp1qSDKOHz9+w3Xc7Nawhx9+2JBkzJkzJ9N5Dz/8sPk6/djdddddRnJystn++eefG5KM6dOnm23+/v5GaGjoLdd5s9pCQ0MNf39/8/WKFSsMScYbb7xh1++JJ54wbDab8ccff5htkgwXFxe7tl9++cWQZLz33nsZtnWtadOmGZKMTz/91Gy7fPmyERAQYBQvXtxu3zO7NfBG/P39jTZt2hjHjx83jh8/bvzyyy9GcHCwIcno37+/3baXL19+w/WcPHnSkGR07drVbOvZs6chyShZsqTRpUsX45133jH27t2bpbquldnPI7PbWJcsWWJIMqKiosy2jh07Gu7u7sY///xjtsXGxhrOzs63fc4CKBy4jRBAoTVz5kxFRkbaTdcKDQ21u4oRExOj2NhYPfPMM/r333914sQJnThxQufOnVPr1q0VFRWltLQ0paam6ttvv1Xnzp1VsWJFc/natWsrKCgoW7UahqEvv/xSHTt2lGEY5rZPnDihoKAgJSUladeuXXbL9O7dWy4uLubr9Ksqf/31l6Sr/0t/8OBBDRw4UN7e3nbLXntLVM+ePRUXF6dNmzaZbYsWLVKxYsXUrVu3bO3PtYoXL37TUQnTa/v666+zPZiEq6urevfuneX+PXv2VIkSJczXTzzxhMqXL6///e9/2dp+Vv3vf/9TkSJF9PLLL9u1DxkyRIZhaM2aNXbtgYGBdgM73HPPPfL09DR/xjfbjq+vr55++mmzrWjRonr55Zd19uxZbdmyJdv7sG7dOpUtW1Zly5ZVgwYNtGzZMvXo0UOTJk2SJPNnfe3xvV76vPRbd6Wrt7S+//77qly5spYvX66hQ4eqdu3aat26dbZvZU137e/5xYsXdeLECXPAjfTfq9TUVK1fv16dO3eWn5+f2b9atWpq166d3fpy45wFUDAQtgAUWg888IACAwPtpmtdP1JhbGyspKshLP2PyfTpo48+0qVLl5SUlKTjx4/rwoULql69eoZt1qxZM1u1Hj9+XKdPn9bcuXMzbDs9RCQmJtotc23Qk6SSJUtKkk6dOiVJ+vPPPyXdegTGRx99VOXLl9eiRYskXR2Ce8mSJerUqdNN/2DOqrNnz950Pd27d1fz5s31/PPPy8fHR8HBwfr8889v64/Yu+66yy543sr1PzubzaZq1ard9vNKt+vQoUPy8/PLcDxq165tzr/W9T9j6erPOf1nfLPtVK9eXU5O9n8G3Gg7t6NJkyaKjIzU+vXrtXXrVp04cUILFy40A036vt0sYGcWyJycnBQeHq6dO3fqxIkT+vrrr9WuXTtt3LhRwcHB2a5Xkk6ePKkBAwbIx8dHxYoVU9myZc3f/6SkJElXf78uXLigatWqZVj++rbcOGcBFAw8swUAN3D9sznpfyi9/fbbNxxevHjx4rp06VKWt3GjL+9NTU3NdNvPPvusQkNDM13m2uHTJalIkSKZ9jOuG2jhVooUKaJnnnlGH374oWbNmqUffvhBcXFxevbZZ29rPZk5evSokpKSMv0DNl2xYsUUFRWlTZs26ZtvvtHatWu1dOlSPfLII1q3bt0N9/P6deS2m/3sslJTbsitn3FuKlOmTIb/uLhWeqDbvXu3OnfunGmf3bt3S5Lq1KmT6fzSpUvr8ccf1+OPP66WLVtqy5YtOnTokPls1+166qmntHXrVg0bNkwNGzZU8eLFlZaWprZt22YrIOXGOQugYCBsAUAWpd+u5enpedM/JsuWLatixYqZV8KutX//frvX6VebTp8+bdd+/ZWFsmXLqkSJEkpNTb3ptm9H+v789ttvt1xnz5499e6772rVqlVas2aNypYtm+1bIq/1ySefSNIt1+Xk5KTWrVurdevWmjJlit566y2NHDlSmzZtUmBg4A2DT3Zd/7MzDEN//PGHXaAtWbJkhp+bdPVnV6VKFfP17dTm7++v9evX68yZM3ZXdfbt22fOzw3+/v7avXu30tLS7K5u5fZ2MpM+Qt/ixYs1cuTITIPHwoULJUmPPfbYLdfXuHFjbdmyRceOHctW3adOndKGDRs0btw4jR492my//hwoV66c3NzcMh3RM7O2W52zAAoHbiMEgCxq1KiRqlatqnfeeUdnz57NMP/48eOSrl5tCAoK0ooVK3T48GFz/t69e/Xtt9/aLePp6akyZcooKirKrn3WrFl2r4sUKaJu3brpyy+/1G+//XbDbd+O++67T5UrV9a0adMyhIbrr4zcc889uueee/TRRx/pyy+/VHBw8A1HksuqjRs36vXXX1flypUVEhJyw34nT57M0JZ+ZTH9KqKHh4ekjKE1uxYuXGh3m9sXX3yhY8eO2T2bU7VqVf3444+6fPmy2bZ69eoMQ8TfTm3t27dXamqq3n//fbv2qVOnymazZXg2KLvat2+v+Ph4LV261GxLSUnRe++9p+LFi+vhhx/Ole1kxt3dXUOHDtX+/fs1cuTIDPO/+eYbRUREKCgoyHxuKj4+Xr///nuGvpcvX9aGDRvk5OR006ujN5Me9q4/56dNm5ahX2BgoFasWKG4uDiz/Y8//sjwLF1WzlkAhQNXtgAgi5ycnPTRRx+pXbt2qlu3rnr37q277rpL//zzjzZt2iRPT0+tWrVKkjRu3DitXbtWLVq00EsvvWT+IVu3bl3zFql0zz//vCZOnKjnn39ejRs3VlRUlA4cOJBh+xMnTtSmTZvUpEkT9enTR3Xq1NHJkye1a9curV+/PtM/8G61P7Nnz1bHjh3VsGFD9e7dW+XLl9e+ffu0Z8+eDMGwZ8+eGjp0qCTd9i2Ea9as0b59+5SSkqKEhARt3LhRkZGR8vf318qVK+Xm5nbDZcePH6+oqCh16NBB/v7+SkxM1KxZs3T33XfrwQcflHQ1+Hh7e2vOnDkqUaKEPDw81KRJkwzP3WVVqVKl9OCDD6p3795KSEjQtGnTVK1aNbvh6Z9//nl98cUXatu2rZ566in9+eef+vTTT+0GrLjd2jp27KhWrVpp5MiR+vvvv9WgQQOtW7dOX3/9tQYOHJhh3dnVt29fffDBB+rVq5d27typSpUq6YsvvtAPP/ygadOm5cqzeDczfPhw/fzzz5o0aZKio6PVrVs3FStWTN9//70+/fRT1a5d2+47v44ePaoHHnhAjzzyiFq3bi1fX18lJiZqyZIl+uWXXzRw4EC7r224HZ6ennrooYc0efJkXblyRXfddZfWrVtnfi/YtcaOHat169apefPmevHFF81gXK9ePcXExJj9snLOAigkHDcQIgA4xq2GI08f/nvZsmWZzv/555+Nrl27GqVLlzZcXV0Nf39/46mnnjI2bNhg12/Lli1Go0aNDBcXF6NKlSrGnDlzMgxrbhhXh50OCwszvLy8jBIlShhPPfWUkZiYmGHod8MwjISEBCM8PNyoUKGCUbRoUcPX19do3bq1MXfu3FvWf6Nh5r///nvj0UcfNUqUKGF4eHgY99xzT6ZDhx87dswoUqSIUaNGjUyPS2auH2bfxcXF8PX1NR599FFj+vTpdkOMp7v+GG3YsMHo1KmT4efnZ7i4uBh+fn7G008/bRw4cMBuua+//tqoU6eOOQx3+n4+/PDDRt26dTOt70ZDvy9ZssQYMWKEUa5cOaNYsWJGhw4d7IbxT/fuu+8ad911l+Hq6mo0b97c+OmnnzKs82a1XT/0u2EYxpkzZ4xBgwYZfn5+RtGiRY3q1asbb7/9tt1w/IZxdej38PDwDDXdaEj66yUkJBi9e/c2ypQpY7i4uBj169fPdHj62x36Pat9U1NTjfnz5xvNmzc3PD09DTc3N6Nu3brGuHHjjLNnz9r1TU5ONqZPn24EBQUZd999t1G0aFGjRIkSRkBAgPHhhx9mODY3k9nQ70ePHjW6dOlieHt7G15eXsaTTz5pxMXFZfo7uGHDBuPee+81XFxcjKpVqxofffSRMWTIEMPNzc2uT1bOWQAFn80wHPgULQAUMmPHjtW4ceMcOoBBdp04cULly5fX6NGj9dprrzm6HCDP6Ny5s/bs2ZPpc5oACjee2QIAZElERIRSU1PVo0cPR5cCOMyFCxfsXsfGxup///ufWrZs6ZiCAORpPLMFALipjRs36vfff9ebb76pzp07q1KlSo4uCXCYKlWqqFevXqpSpYoOHTqk2bNny8XFRa+88oqjSwOQBxG2AAA3NX78eG3dulXNmzfXe++95+hyAIdq27atlixZovj4eLm6uiogIEBvvfVWpl9iDgA8swUAAAAAFuCZLQAAAACwAGELAAAAACzAM1tZlJaWpri4OJUoUUI2m83R5QAAAABwEMMwdObMGfn5+cnJ6cbXrwhbWRQXF6cKFSo4ugwAAAAAecSRI0d0991333A+YSuLSpQoIenqAfX09HRwNQAAAAAcJTk5WRUqVDAzwo0QtrIo/dZBT09PwhYAAACAWz5exAAZAAAAAGABwhYAAAAAWICwBQAAAAAWIGwBAAAAgAUIWwAAAABgAcIWAAAAAFiAsAUAAAAAFiBsAQAAAIAFCFsAAAAAYAHCFgAAAABYgLAFAAAAABYgbAEAAACABQhbAAAAAGABwhYAAAAAWICwBQAAAAAWIGwBAAAAgAUIWwAAAABgAcIWAAAAAFiAsAUAAAAAFnB2dAHIHpvN0RU4lmE4ugIAAADg5riyBQAAAAAWIGwBAAAAgAUIWwAAAABgAcIWAAAAAFiAsAUAAAAAFiBsAQAAAIAFCFsAAAAAYAHCFgAAAABYgLAFAAAAABYgbAEAAACABQhbAAAAAGABwhYAAAAAWICwBQAAAAAWIGwBAAAAgAUIWwAAAABgAcIWAAAAAFiAsAUAAAAAFiBsAQAAAIAFCFsAAAAAYAHCFgAAAABYgLAFAAAAABYgbAEAAACABRwatqKiotSxY0f5+fnJZrNpxYoVGfrs3btXjz/+uLy8vOTh4aH7779fhw8fNudfvHhR4eHhKl26tIoXL65u3bopISHBbh2HDx9Whw4d5O7urnLlymnYsGFKSUmxevcAAAAAFGIODVvnzp1TgwYNNHPmzEzn//nnn3rwwQdVq1Ytbd68Wbt379Zrr70mNzc3s8+gQYO0atUqLVu2TFu2bFFcXJy6du1qzk9NTVWHDh10+fJlbd26VQsWLFBERIRGjx5t+f4BAAAAKLxshmEYji5Ckmw2m5YvX67OnTubbcHBwSpatKg++eSTTJdJSkpS2bJltXjxYj3xxBOSpH379ql27dqKjo5W06ZNtWbNGj322GOKi4uTj4+PJGnOnDl69dVXdfz4cbm4uGSpvuTkZHl5eSkpKUmenp4529lcYLM5ugLHyhtnLQAAAAqjrGaDPPvMVlpamr755hvVqFFDQUFBKleunJo0aWJ3q+HOnTt15coVBQYGmm21atVSxYoVFR0dLUmKjo5W/fr1zaAlSUFBQUpOTtaePXtuuP1Lly4pOTnZbgIAAACArMqzYSsxMVFnz57VxIkT1bZtW61bt05dunRR165dtWXLFklSfHy8XFxc5O3tbbesj4+P4uPjzT7XBq30+enzbmTChAny8vIypwoVKuTi3gEAAAAo6PJs2EpLS5MkderUSYMGDVLDhg01fPhwPfbYY5ozZ47l2x8xYoSSkpLM6ciRI5ZvEwAAAEDBkWfDVpkyZeTs7Kw6derYtdeuXdscjdDX11eXL1/W6dOn7fokJCTI19fX7HP96ITpr9P7ZMbV1VWenp52EwAAAABkVZ4NWy4uLrr//vu1f/9+u/YDBw7I399fktSoUSMVLVpUGzZsMOfv379fhw8fVkBAgCQpICBAv/76qxITE80+kZGR8vT0zBDkAAAAACC3ODty42fPntUff/xhvj548KBiYmJUqlQpVaxYUcOGDVP37t310EMPqVWrVlq7dq1WrVqlzZs3S5K8vLwUFhamwYMHq1SpUvL09FT//v0VEBCgpk2bSpLatGmjOnXqqEePHpo8ebLi4+M1atQohYeHy9XV1RG7DQAAAKAQcOjQ75s3b1arVq0ytIeGhioiIkKS9PHHH2vChAk6evSoatasqXHjxqlTp05m34sXL2rIkCFasmSJLl26pKCgIM2aNcvuFsFDhw7pxRdf1ObNm+Xh4aHQ0FBNnDhRzs5Zz5oM/Z63MPQ7AAAAHCWr2SDPfM9WXkfYyls4awEAAOAo+f57tgAAAAAgPyNsAQAAAIAFCFsAAAAAYAHCFgAAAABYgLAFAAAAABYgbAEAAACABQhbAAAAAGABwhYAAAAAWICwBQAAAAAWIGwBAAAAgAUIWwAAAABgAcIWAAAAAFiAsAUAAAAAFiBsAQAAAIAFCFsAAAAAYAHCFgAAAABYgLAFAAAAABYgbAEAAACABQhbAAAAAGABwhYAAAAAWICwBQAAAAAWIGwBAAAAgAUIWwAAAABgAcIWAAAAAFiAsAUAAAAAFiBsAQAAAIAFCFsAAAAAYAHCFgAAAABYgLAFAAAAABYgbAEAAACABQhbAAAAAGABwhYAAAAAWICwBQAAAAAWIGwBAAAAgAUIWwAAAABgAcIWAAAAAFiAsAUAAAAAFiBsAQAAAIAFCFsAAAAAYAHCFgAAAABYwKFhKyoqSh07dpSfn59sNptWrFhxw77/+c9/ZLPZNG3aNLv2kydPKiQkRJ6envL29lZYWJjOnj1r12f37t1q0aKF3NzcVKFCBU2ePNmCvQEAAACA/+PQsHXu3Dk1aNBAM2fOvGm/5cuX68cff5Sfn1+GeSEhIdqzZ48iIyO1evVqRUVFqW/fvub85ORktWnTRv7+/tq5c6fefvttjR07VnPnzs31/QEAAACAdM6O3Hi7du3Url27m/b5559/1L9/f3377bfq0KGD3by9e/dq7dq12rFjhxo3bixJeu+999S+fXu988478vPz06JFi3T58mV9/PHHcnFxUd26dRUTE6MpU6bYhTIAAAAAyE15+pmttLQ09ejRQ8OGDVPdunUzzI+Ojpa3t7cZtCQpMDBQTk5O2rZtm9nnoYcekouLi9knKChI+/fv16lTp2647UuXLik5OdluAgAAAICsytNha9KkSXJ2dtbLL7+c6fz4+HiVK1fOrs3Z2VmlSpVSfHy82cfHx8euT/rr9D6ZmTBhgry8vMypQoUKOdkVAAAAAIVMng1bO3fu1PTp0xURESGbzXbHtz9ixAglJSWZ05EjR+54DQAAAADyrzwbtr777jslJiaqYsWKcnZ2lrOzsw4dOqQhQ4aoUqVKkiRfX18lJibaLZeSkqKTJ0/K19fX7JOQkGDXJ/11ep/MuLq6ytPT024CAAAAgKzKs2GrR48e2r17t2JiYszJz89Pw4YN07fffitJCggI0OnTp7Vz505zuY0bNyotLU1NmjQx+0RFRenKlStmn8jISNWsWVMlS5a8szsFAAAAoNBw6GiEZ8+e1R9//GG+PnjwoGJiYlSqVClVrFhRpUuXtutftGhR+fr6qmbNmpKk2rVrq23bturTp4/mzJmjK1euqF+/fgoODjaHiX/mmWc0btw4hYWF6dVXX9Vvv/2m6dOna+rUqXduRwEAAAAUOg4NWz/99JNatWplvh48eLAkKTQ0VBEREVlax6JFi9SvXz+1bt1aTk5O6tatm2bMmGHO9/Ly0rp16xQeHq5GjRqpTJkyGj16NMO+AwAAALCUzTAMw9FF5AfJycny8vJSUlJSnnh+ywFjhuQpnLUAAABwlKxmgzz7zBYAAAAA5GeELQAAAACwAGELAAAAACxA2AIAAAAACxC2AAAAAMAChC0AAAAAsABhCwAAAAAsQNgCAAAAAAsQtgAAAADAAoQtAAAAALAAYQsAAAAALEDYAgAAAAALELYAAAAAwAKELQAAAACwAGELAAAAACxA2AIAAAAACxC2AAAAAMAChC0AAAAAsABhCwAAAAAsQNgCAAAAAAsQtgAAAADAAoQtAAAAALAAYQsAAAAALEDYAgAAAAALELYAAAAAwAKELQAAAACwAGELAAAAACxA2AIAAAAACxC2AAAAAMAChC0AAAAAsABhCwAAAAAsQNgCAAAAAAsQtgAAAADAAoQtAAAAALAAYQsAAAAALEDYAgAAAAALELYAAAAAwAKELQAAAACwAGELAAAAACxA2AIAAAAACxC2AAAAAMACDg1bUVFR6tixo/z8/GSz2bRixQpz3pUrV/Tqq6+qfv368vDwkJ+fn3r27Km4uDi7dZw8eVIhISHy9PSUt7e3wsLCdPbsWbs+u3fvVosWLeTm5qYKFSpo8uTJd2L3AAAAABRiDg1b586dU4MGDTRz5swM886fP69du3bptdde065du/TVV19p//79evzxx+36hYSEaM+ePYqMjNTq1asVFRWlvn37mvOTk5PVpk0b+fv7a+fOnXr77bc1duxYzZ071/L9AwAAAFB42QzDMBxdhCTZbDYtX75cnTt3vmGfHTt26IEHHtChQ4dUsWJF7d27V3Xq1NGOHTvUuHFjSdLatWvVvn17HT16VH5+fpo9e7ZGjhyp+Ph4ubi4SJKGDx+uFStWaN++fVmuLzk5WV5eXkpKSpKnp2eO9jU32GyOrsCx8sZZCwAAgMIoq9kgXz2zlZSUJJvNJm9vb0lSdHS0vL29zaAlSYGBgXJyctK2bdvMPg899JAZtCQpKChI+/fv16lTp264rUuXLik5OdluAgAAAICsyjdh6+LFi3r11Vf19NNPm+kxPj5e5cqVs+vn7OysUqVKKT4+3uzj4+Nj1yf9dXqfzEyYMEFeXl7mVKFChdzcHQAAAAAFXL4IW1euXNFTTz0lwzA0e/bsO7LNESNGKCkpyZyOHDlyR7YLAAAAoGBwdnQBt5IetA4dOqSNGzfa3RPp6+urxMREu/4pKSk6efKkfH19zT4JCQl2fdJfp/fJjKurq1xdXXNrNwAAAAAUMnn6ylZ60IqNjdX69etVunRpu/kBAQE6ffq0du7cabZt3LhRaWlpatKkidknKipKV65cMftERkaqZs2aKlmy5J3ZEQAAAACFjkPD1tmzZxUTE6OYmBhJ0sGDBxUTE6PDhw/rypUreuKJJ/TTTz9p0aJFSk1NVXx8vOLj43X58mVJUu3atdW2bVv16dNH27dv1w8//KB+/fopODhYfn5+kqRnnnlGLi4uCgsL0549e7R06VJNnz5dgwcPdtRuAwAAACgEHDr0++bNm9WqVasM7aGhoRo7dqwqV66c6XKbNm1Sy5YtJV39UuN+/fpp1apVcnJyUrdu3TRjxgwVL17c7L97926Fh4drx44dKlOmjPr3769XX331tmpl6Pe8haHfAQAA4ChZzQZ55nu28jrCVt7CWQsAAABHKZDfswUAAAAA+QVhCwAAAAAsQNgCAAAAAAsQtgAAAADAAoQtAAAAALAAYQsAAAAALEDYAgAAAAALELYAAAAAwAKELQAAAACwAGELAAAAACxA2AIAAAAACxC2AAAAAMAChC0AAAAAsABhCwAAAAAsQNgCAAAAAAsQtgAAAADAAoQtAAAAALAAYQsAAAAALEDYAgAAAAALELYAAAAAwAKELQAAAACwAGELAAAAACxA2AIAAAAACxC2AAAAAMAChC0AAAAAsABhCwAAAAAsQNgCAAAAAAsQtgAAAADAAoQtAAAAALAAYQsAAAAALEDYAgAAAAALELYAAAAAwAKELQAAAACwAGELAAAAACxA2AIAAAAACxC2AAAAAMAChC0AAAAAsABhCwAAAAAsQNgCAAAAAAtkK2z99ddfuV0HAAAAABQo2Qpb1apVU6tWrfTpp5/q4sWLuV0TAAAAAOR72Qpbu3bt0j333KPBgwfL19dXL7zwgrZv337b64mKilLHjh3l5+cnm82mFStW2M03DEOjR49W+fLlVaxYMQUGBio2Ntauz8mTJxUSEiJPT095e3srLCxMZ8+eteuze/dutWjRQm5ubqpQoYImT55827UCAAAAwO3IVthq2LChpk+frri4OH388cc6duyYHnzwQdWrV09TpkzR8ePHs7Sec+fOqUGDBpo5c2am8ydPnqwZM2Zozpw52rZtmzw8PBQUFGR3NS0kJER79uxRZGSkVq9eraioKPXt29ecn5ycrDZt2sjf3187d+7U22+/rbFjx2ru3LnZ2XUAAAAAyBKbYRhGTldy6dIlzZo1SyNGjNDly5fl4uKip556SpMmTVL58uWzVojNpuXLl6tz586Srl7V8vPz05AhQzR06FBJUlJSknx8fBQREaHg4GDt3btXderU0Y4dO9S4cWNJ0tq1a9W+fXsdPXpUfn5+mj17tkaOHKn4+Hi5uLhIkoYPH64VK1Zo3759Wd7H5ORkeXl5KSkpSZ6enrdxdKxhszm6AsfK+VkLAAAAZE9Ws0GORiP86aef9NJLL6l8+fKaMmWKhg4dqj///FORkZGKi4tTp06dsr3ugwcPKj4+XoGBgWabl5eXmjRpoujoaElSdHS0vL29zaAlSYGBgXJyctK2bdvMPg899JAZtCQpKChI+/fv16lTp264/UuXLik5OdluAgAAAICsylbYmjJliurXr69mzZopLi5OCxcu1KFDh/TGG2+ocuXKatGihSIiIrRr165sFxYfHy9J8vHxsWv38fEx58XHx6tcuXJ2852dnVWqVCm7Ppmt49ptZGbChAny8vIypwoVKmR7XwAAAAAUPtkKW7Nnz9YzzzyjQ4cOacWKFXrsscfk5GS/qnLlymnevHm5UqQjjBgxQklJSeZ05MgRR5cEAAAAIB9xzs5C148ImBkXFxeFhoZmZ/WSJF9fX0lSQkKC3XNfCQkJatiwodknMTHRbrmUlBSdPHnSXN7X11cJCQl2fdJfp/fJjKurq1xdXbNdPwAAAIDCLVtXtubPn69ly5ZlaF+2bJkWLFiQ46IkqXLlyvL19dWGDRvMtuTkZG3btk0BAQGSpICAAJ0+fVo7d+40+2zcuFFpaWlq0qSJ2ScqKkpXrlwx+0RGRqpmzZoqWbJkrtQKAAAAANfLVtiaMGGCypQpk6G9XLlyeuutt7K8nrNnzyomJkYxMTGSrg6KERMTo8OHD8tms2ngwIF64403tHLlSv3666/q2bOn/Pz8zBELa9eurbZt26pPnz7avn27fvjhB/Xr10/BwcHy8/OTJD3zzDNycXFRWFiY9uzZo6VLl2r69OkaPHhwdnYdAAAAALIkW7cRHj58WJUrV87Q7u/vr8OHD2d5PT/99JNatWplvk4PQKGhoYqIiNArr7yic+fOqW/fvjp9+rQefPBBrV27Vm5ubuYyixYtUr9+/dS6dWs5OTmpW7dumjFjhjnfy8tL69atU3h4uBo1aqQyZcpo9OjRdt/FBQAAAAC5LVvfs1WxYkW9//77evzxx+3av/76a4WHh+vo0aO5VmBewfds5S18zxYAAAAcxdLv2Xr66af18ssva9OmTUpNTVVqaqo2btyoAQMGKDg4ONtFAwAAAEBBka3bCF9//XX9/fffat26tZydr64iLS1NPXv2vK1ntgAAAACgoMrWbYTpDhw4oF9++UXFihVT/fr15e/vn5u15SncRpi3cBshAAAAHCWr2SBbV7bS1ahRQzVq1MjJKgAAAACgQMpW2EpNTVVERIQ2bNigxMREpaWl2c3fuHFjrhQHAAAAAPlVtsLWgAEDFBERoQ4dOqhevXqyFfZ72gAAAADgOtkKW5999pk+//xztW/fPrfrAQAAAIACIVtDv7u4uKhatWq5XQsAAAAAFBjZCltDhgzR9OnTlYOBDAEAAACgQMvWbYTff/+9Nm3apDVr1qhu3boqWrSo3fyvvvoqV4oDAAAAgPwqW2HL29tbXbp0ye1aAAAAAKDAyFbYmj9/fm7XAQAAAAAFSrae2ZKklJQUrV+/Xh988IHOnDkjSYqLi9PZs2dzrTgAAAAAyK+ydWXr0KFDatu2rQ4fPqxLly7p0UcfVYkSJTRp0iRdunRJc+bMye06AQAAACBfydaVrQEDBqhx48Y6deqUihUrZrZ36dJFGzZsyLXiAAAAACC/ytaVre+++05bt26Vi4uLXXulSpX0zz//5EphAAAAAJCfZevKVlpamlJTUzO0Hz16VCVKlMhxUQAAAACQ32UrbLVp00bTpk0zX9tsNp09e1ZjxoxR+/btc6s2AAAAAMi3bIZhGLe70NGjRxUUFCTDMBQbG6vGjRsrNjZWZcqUUVRUlMqVK2dFrQ6VnJwsLy8vJSUlydPT09HlyGZzdAWOdftnLQAAAJA7spoNshW2pKtDv3/22WfavXu3zp49q/vuu08hISF2A2YUJIStvIWwBQAAAEfJajbI1gAZkuTs7Kxnn302u4sDAAAAQIGWrbC1cOHCm87v2bNntooBAAAAgIIiW7cRlixZ0u71lStXdP78ebm4uMjd3V0nT57MtQLzCm4jzFu4jRAAAACOktVskK3RCE+dOmU3nT17Vvv379eDDz6oJUuWZLtoAAAAACgoshW2MlO9enVNnDhRAwYMyK1VAgAAAEC+lWthS7o6aEZcXFxurhIAAAAA8qVsDZCxcuVKu9eGYejYsWN6//331bx581wpDAAAAADys2yFrc6dO9u9ttlsKlu2rB555BG9++67uVEXAAAAAORr2QpbaWlpuV0HAAAAABQoufrMFgAAAADgqmxd2Ro8eHCW+06ZMiU7mwAAAACAfC1bYevnn3/Wzz//rCtXrqhmzZqSpAMHDqhIkSK67777zH62wv7NuwAAAAAKrWyFrY4dO6pEiRJasGCBSpYsKenqFx337t1bLVq00JAhQ3K1SAAAAADIb2yGYRi3u9Bdd92ldevWqW7dunbtv/32m9q0aVMgv2srOTlZXl5eSkpKkqenp6PLUWG/aHj7Zy0AAACQO7KaDbI1QEZycrKOHz+eof348eM6c+ZMdlYJAAAAAAVKtsJWly5d1Lt3b3311Vc6evSojh49qi+//FJhYWHq2rVrbtcIAAAAAPlOtp7ZmjNnjoYOHapnnnlGV65cuboiZ2eFhYXp7bffztUCAQAAACA/ytYzW+nOnTunP//8U5JUtWpVeXh45FpheQ3PbOUtPLMFAAAAR7H0ma10x44d07Fjx1S9enV5eHgoB7kNAAAAAAqUbIWtf//9V61bt1aNGjXUvn17HTt2TJIUFhbGsO8AAAAAoGyGrUGDBqlo0aI6fPiw3N3dzfbu3btr7dq1uVZcamqqXnvtNVWuXFnFihVT1apV9frrr9tdQTMMQ6NHj1b58uVVrFgxBQYGKjY21m49J0+eVEhIiDw9PeXt7a2wsDCdPXs21+oEAAAAgOtlK2ytW7dOkyZN0t13323XXr16dR06dChXCpOkSZMmafbs2Xr//fe1d+9eTZo0SZMnT9Z7771n9pk8ebJmzJihOXPmaNu2bfLw8FBQUJAuXrxo9gkJCdGePXsUGRmp1atXKyoqSn379s21OgEAAADgetkajfDcuXN2V7TSnTx5Uq6urjkuKt3WrVvVqVMndejQQZJUqVIlLVmyRNu3b5d09arWtGnTNGrUKHXq1EmStHDhQvn4+GjFihUKDg7W3r17tXbtWu3YsUONGzeWJL333ntq37693nnnHfn5+eVavQAAAACQLltXtlq0aKGFCxear202m9LS0jR58mS1atUq14pr1qyZNmzYoAMHDkiSfvnlF33//fdq166dJOngwYOKj49XYGCguYyXl5eaNGmi6OhoSVJ0dLS8vb3NoCVJgYGBcnJy0rZt22647UuXLik5OdluAgAAAICsytaVrcmTJ6t169b66aefdPnyZb3yyivas2ePTp48qR9++CHXihs+fLiSk5NVq1YtFSlSRKmpqXrzzTcVEhIiSYqPj5ck+fj42C3n4+NjzouPj1e5cuXs5js7O6tUqVJmn8xMmDBB48aNy7V9AQAAAFC4ZOvKVr169XTgwAE9+OCD6tSpk86dO6euXbvq559/VtWqVXOtuM8//1yLFi3S4sWLtWvXLi1YsEDvvPOOFixYkGvbuJERI0YoKSnJnI4cOWL5NgEAAAAUHLd9ZevKlStq27at5syZo5EjR1pRk2nYsGEaPny4goODJUn169fXoUOHNGHCBIWGhsrX11eSlJCQoPLly5vLJSQkqGHDhpIkX19fJSYm2q03JSVFJ0+eNJfPjKura64+fwYAAACgcLntK1tFixbV7t27raglg/Pnz8vJyb7EIkWKKC0tTZJUuXJl+fr6asOGDeb85ORkbdu2TQEBAZKkgIAAnT59Wjt37jT7bNy4UWlpaWrSpMkd2AsAAAAAhVG2biN89tlnNW/evNyuJYOOHTvqzTff1DfffKO///5by5cv15QpU9SlSxdJVwfmGDhwoN544w2tXLlSv/76q3r27Ck/Pz917txZklS7dm21bdtWffr00fbt2/XDDz+oX79+Cg4OZiRCAAAAAJbJ1gAZKSkp+vjjj7V+/Xo1atRIHh4edvOnTJmSK8W99957eu211/TSSy8pMTFRfn5+euGFFzR69GizzyuvvKJz586pb9++On36tB588EGtXbtWbm5uZp9FixapX79+at26tZycnNStWzfNmDEjV2oEAAAAgMzYDMMwstr5r7/+UqVKldS6desbr9Bm08aNG3OluLwkOTlZXl5eSkpKkqenp6PLkc3m6AocK+tnLQAAAJC7spoNbuvKVvXq1XXs2DFt2rRJktS9e3fNmDEjw9DrAAAAAFDY3dYzW9dfBFuzZo3OnTuXqwUBAAAAQEGQrQEy0t3GHYgAAAAAUKjcVtiy2WyyXfew0PWvAQAAAAC3+cyWYRjq1auX+WW/Fy9e1H/+858MoxF+9dVXuVchAAAAAORDtxW2QkND7V4/++yzuVoMAAAAABQUtxW25s+fb1UdAAAAAFCg5GiADAAAAABA5ghbAAAAAGABwhYAAAAAWICwBQAAAAAWIGwBAAAAgAUIWwAAAABgAcIWAAAAAFiAsAUAAAAAFiBsAQAAAIAFCFsAAAAAYAHCFgAAAABYgLAFAAAAABYgbAEAAACABQhbAAAAAGABwhYAAAAAWICwBQAAAAAWIGwBAAAAgAUIWwAAAABgAcIWAAAAAFiAsAUAAAAAFiBsAQAAAIAFCFsAAAAAYAHCFgAAAABYgLAFAAAAABYgbAEAAACABQhbAAAAAGABwhYAAAAAWICwBQAAAAAWIGwBAAAAgAUIWwAAAABgAcIWAAAAAFiAsAUAAAAAFiBsAQAAAIAFCFsAAAAAYIE8H7b++ecfPfvssypdurSKFSum+vXr66effjLnG4ah0aNHq3z58ipWrJgCAwMVGxtrt46TJ08qJCREnp6e8vb2VlhYmM6ePXundwUAAABAIZKnw9apU6fUvHlzFS1aVGvWrNHvv/+ud999VyVLljT7TJ48WTNmzNCcOXO0bds2eXh4KCgoSBcvXjT7hISEaM+ePYqMjNTq1asVFRWlvn37OmKXAAAAABQSNsMwDEcXcSPDhw/XDz/8oO+++y7T+YZhyM/PT0OGDNHQoUMlSUlJSfLx8VFERISCg4O1d+9e1alTRzt27FDjxo0lSWvXrlX79u119OhR+fn5ZamW5ORkeXl5KSkpSZ6enrmzgzlgszm6AsfKu2ctAAAACrqsZoM8fWVr5cqVaty4sZ588kmVK1dO9957rz788ENz/sGDBxUfH6/AwECzzcvLS02aNFF0dLQkKTo6Wt7e3mbQkqTAwEA5OTlp27ZtN9z2pUuXlJycbDcBAAAAQFbl6bD1119/afbs2apevbq+/fZbvfjii3r55Ze1YMECSVJ8fLwkycfHx245Hx8fc158fLzKlStnN9/Z2VmlSpUy+2RmwoQJ8vLyMqcKFSrk5q4BAAAAKODydNhKS0vTfffdp7feekv33nuv+vbtqz59+mjOnDmWb3vEiBFKSkoypyNHjli+TQAAAAAFR54OW+XLl1edOnXs2mrXrq3Dhw9Lknx9fSVJCQkJdn0SEhLMeb6+vkpMTLSbn5KSopMnT5p9MuPq6ipPT0+7CQAAAACyKk+HrebNm2v//v12bQcOHJC/v78kqXLlyvL19dWGDRvM+cnJydq2bZsCAgIkSQEBATp9+rR27txp9tm4caPS0tLUpEmTO7AXAAAAAAojZ0cXcDODBg1Ss2bN9NZbb+mpp57S9u3bNXfuXM2dO1eSZLPZNHDgQL3xxhuqXr26KleurNdee01+fn7q3LmzpKtXwtq2bWvefnjlyhX169dPwcHBWR6JEAAAAABuV54e+l2SVq9erREjRig2NlaVK1fW4MGD1adPH3O+YRgaM2aM5s6dq9OnT+vBBx/UrFmzVKNGDbPPyZMn1a9fP61atUpOTk7q1q2bZsyYoeLFi2e5DoZ+z1vy9lkLAACAgiyr2SDPh628grCVt3DWAgAAwFEKxPdsAQAAAEB+RdgCAAAAAAsQtgAAAADAAoQtAAAAALAAYQsAAAAALEDYAgAAAAALELYAAAAAwAKELQAAAACwAGELAAAAACxA2AIAAAAACxC2AAAAAMAChC0AAAAAsABhCwAAAAAsQNgCAAAAAAsQtgAAAADAAoQtAAAAALAAYQsAAAAALEDYAgAAAAALELYAAAAAwAKELQAAAACwAGELAAAAACxA2AIAAAAACzg7ugDAEWw2R1fgWIbh6AoAAAAKPq5sAQAAAIAFCFsAAAAAYAHCFgAAAABYgLAFAAAAABYgbAEAAACABQhbAAAAAGABwhYAAAAAWICwBQAAAAAWIGwBAAAAgAUIWwAAAABgAWdHFwAg/7HZHF2BYxmGoysAAAD5AVe2AAAAAMAChC0AAAAAsABhCwAAAAAsQNgCAAAAAAsQtgAAAADAAoQtAAAAALAAYQsAAAAALJCvwtbEiRNls9k0cOBAs+3ixYsKDw9X6dKlVbx4cXXr1k0JCQl2yx0+fFgdOnSQu7u7ypUrp2HDhiklJeUOVw8AAACgMMk3YWvHjh364IMPdM8999i1Dxo0SKtWrdKyZcu0ZcsWxcXFqWvXrub81NRUdejQQZcvX9bWrVu1YMECRUREaPTo0Xd6FwAAAAAUIvkibJ09e1YhISH68MMPVbJkSbM9KSlJ8+bN05QpU/TII4+oUaNGmj9/vrZu3aoff/xRkrRu3Tr9/vvv+vTTT9WwYUO1a9dOr7/+umbOnKnLly/fcJuXLl1ScnKy3QQAAAAAWZUvwlZ4eLg6dOigwMBAu/adO3fqypUrdu21atVSxYoVFR0dLUmKjo5W/fr15ePjY/YJCgpScnKy9uzZc8NtTpgwQV5eXuZUoUKFXN4rAAAAAAVZng9bn332mXbt2qUJEyZkmBcfHy8XFxd5e3vbtfv4+Cg+Pt7sc23QSp+fPu9GRowYoaSkJHM6cuRIDvcEAAAAQGHi7OgCbubIkSMaMGCAIiMj5ebmdke37erqKldX1zu6TQCFg83m6AocyzAcXQEAAHdGnr6ytXPnTiUmJuq+++6Ts7OznJ2dtWXLFs2YMUPOzs7y8fHR5cuXdfr0abvlEhIS5OvrK0ny9fXNMDph+uv0PgAAAACQ2/J02GrdurV+/fVXxcTEmFPjxo0VEhJi/rto0aLasGGDucz+/ft1+PBhBQQESJICAgL066+/KjEx0ewTGRkpT09P1alT547vEwAAAIDCIU/fRliiRAnVq1fPrs3Dw0OlS5c228PCwjR48GCVKlVKnp6e6t+/vwICAtS0aVNJUps2bVSnTh316NFDkydPVnx8vEaNGqXw8HBuEwQAAABgmTwdtrJi6tSpcnJyUrdu3XTp0iUFBQVp1qxZ5vwiRYpo9erVevHFFxUQECAPDw+FhoZq/PjxDqwaAAAAQEFnMwweVc6K5ORkeXl5KSkpSZ6eno4uhwfsc3jWcvxytjzHL2fLc/wcXQEAADmT1WyQp5/ZAgAAAID8irAFAAAAABYgbAEAAACABQhbAAAAAGABwhYAAAAAWICwBQAAAAAWIGwBAAAAgAUIWwAAAABgAcIWAAAAAFiAsAUAAAAAFiBsAQAAAIAFCFsAAAAAYAHCFgAAAABYgLAFAAAAABYgbAEAAACABQhbAAAAAGABwhYAAAAAWICwBQAAAAAWIGwBAAAAgAUIWwAAAABgAcIWAAAAAFiAsAUAAAAAFiBsAQAAAIAFCFsAAAAAYAHCFgAAAABYgLAFAAAAABYgbAEAAACABQhbAAAAAGABwhYAAAAAWICwBQAAAAAWIGwBAAAAgAUIWwAAAABgAcIWAAAAAFiAsAUAAAAAFiBsAQAAAIAFCFsAAAAAYAHCFgAAAABYgLAFAAAAABYgbAEAAACABQhbAAAAAGCBPB+2JkyYoPvvv18lSpRQuXLl1LlzZ+3fv9+uz8WLFxUeHq7SpUurePHi6tatmxISEuz6HD58WB06dJC7u7vKlSunYcOGKSUl5U7uCgAAAIBCJM+HrS1btig8PFw//vijIiMjdeXKFbVp00bnzp0z+wwaNEirVq3SsmXLtGXLFsXFxalr167m/NTUVHXo0EGXL1/W1q1btWDBAkVERGj06NGO2CUAAAAAhYDNMAzD0UXcjuPHj6tcuXLasmWLHnroISUlJals2bJavHixnnjiCUnSvn37VLt2bUVHR6tp06Zas2aNHnvsMcXFxcnHx0eSNGfOHL366qs6fvy4XFxcbrnd5ORkeXl5KSkpSZ6enpbuY1bYbI6uwLFyetZy/HK2PMcvZ8tz/BxdAQAAOZPVbJDnr2xdLykpSZJUqlQpSdLOnTt15coVBQYGmn1q1aqlihUrKjo6WpIUHR2t+vXrm0FLkoKCgpScnKw9e/Zkup1Lly4pOTnZbgIAAACArMpXYSstLU0DBw5U8+bNVa9ePUlSfHy8XFxc5O3tbdfXx8dH8fHxZp9rg1b6/PR5mZkwYYK8vLzMqUKFCrm8NwAAAAAKsnwVtsLDw/Xbb7/ps88+s3xbI0aMUFJSkjkdOXLE8m0CAAAAKDicHV1AVvXr10+rV69WVFSU7r77brPd19dXly9f1unTp+2ubiUkJMjX19fss337drv1pY9WmN7neq6urnJ1dc3lvQAAAABQWOT5K1uGYahfv35avny5Nm7cqMqVK9vNb9SokYoWLaoNGzaYbfv379fhw4cVEBAgSQoICNCvv/6qxMREs09kZKQ8PT1Vp06dO7MjAAAAAAqVPH9lKzw8XIsXL9bXX3+tEiVKmM9YeXl5qVixYvLy8lJYWJgGDx6sUqVKydPTU/3791dAQICaNm0qSWrTpo3q1KmjHj16aPLkyYqPj9eoUaMUHh7O1SsAAAAAlsjzQ7/bbjBG8vz589WrVy9JV7/UeMiQIVqyZIkuXbqkoKAgzZo1y+4WwUOHDunFF1/U5s2b5eHhodDQUE2cOFHOzlnLmwz9nrcw9HbOcPxyhuOXM3n7UwcAgFvLajbI82ErryBs5S38sZszHL+c4fjlDJ86AID8rsB+zxYAAAAA5AeELQAAAACwAGELAAAAACxA2AIAAAAACxC2AAAAAMAChC0AAAAAsABhCwAAAAAsQNgCAAAAAAsQtgAAAADAAoQtAAAAALAAYQsAAAAALEDYAgAAAAALELYAAAAAwAKELQAAAACwAGELAAAAACxA2AIAAAAACxC2AAAAAMAChC0AAAAAsABhCwAAAAAsQNgCAAAAAAsQtgAAAADAAoQtAAAAALAAYQsAAAAALEDYAgAAAAALELYAAAAAwAKELQAAAACwAGELAAAAACxA2AIAAAAACxC2AAAAAMAChC0AAAAAsABhCwAAAAAsQNgCAAAAAAsQtgAAAADAAoQtAAAAALAAYQsAAAAALODs6AIAALgdNpujK3Asw3B0BQCArOLKFgAAAABYgLAFAAAAABYgbAEAAACABQhbAAAAAGABwhYAAAAAWKBQha2ZM2eqUqVKcnNzU5MmTbR9+3ZHlwQAAACggCo0YWvp0qUaPHiwxowZo127dqlBgwYKCgpSYmKio0sDAOCOsdkK9wQAd1KhCVtTpkxRnz591Lt3b9WpU0dz5syRu7u7Pv74Y0eXBgAAAKAAKhRfanz58mXt3LlTI0aMMNucnJwUGBio6OjoTJe5dOmSLl26ZL5OSkqSJCUnJ1tbLLKEH0POcPxyhuOXMxy/nOH45UxOj5+XV+7UkV/9/z+Hso3jl7PlOX6OruD/pGcC4xbfNF8owtaJEyeUmpoqHx8fu3YfHx/t27cv02UmTJigcePGZWivUKGCJTXi9hT2N5uc4vjlDMcvZzh+OcPxyxmOX85w/HKG45czefH4nTlzRl43KaxQhK3sGDFihAYPHmy+TktL08mTJ1W6dGnZCvlN38nJyapQoYKOHDkiT09PR5eT73D8cobjlzMcv5zh+OUMxy9nOH45w/HLGY6fPcMwdObMGfn5+d20X6EIW2XKlFGRIkWUkJBg156QkCBfX99Ml3F1dZWrq6tdm7e3t1Ul5kuenp78suUAxy9nOH45w/HLGY5fznD8cobjlzMcv5zh+P2fm13RSlcoBshwcXFRo0aNtGHDBrMtLS1NGzZsUEBAgAMrAwAAAFBQFYorW5I0ePBghYaGqnHjxnrggQc0bdo0nTt3Tr1793Z0aQAAAAAKoEITtrp3767jx49r9OjRio+PV8OGDbV27doMg2bg1lxdXTVmzJgMt1kiazh+OcPxyxmOX85w/HKG45czHL+c4fjlDMcve2zGrcYrBAAAAADctkLxzBYAAAAA3GmELQAAAACwAGELAAAAACxA2AIAAAAACxC2ColevXrJZrNp4sSJdu0rVqyQzWYzX6empmrq1KmqX7++3NzcVLJkSbVr104//PCD3XJjx45Vw4YNM2zn77//ls1mU0xMjCRp8+bNstlsqlu3rlJTU+36ent7KyIiIlf2707o2LGj2rZtm+m87777TjabTbt375bNZst0+vHHHyVJERERZpuTk5PKly+v7t276/Dhw3brbNmypd3yPj4+evLJJ3Xo0CHL99WRoqOjVaRIEXXo0MGuPf3cSp9KlCihunXrKjw8XLGxsXZ9IyIiCsSXkKf/3tpsNrm4uKhatWoaP368UlJSzN+t9Kls2bJq3769fv311wzrOXLkiJ577jn5+fnJxcVF/v7+GjBggP7991+7fteec25ubqpTp45mzZplzk8/d6//PTh9+rRsNps2b95syXGwWk7Puay+NxRUvXr1UufOnc1/3+qz5trzOrOpUqVKkq6ejwMHDryDe+I4ufW+d+1ny913363evXsrMTHxTu5KnpOamqpmzZqpa9eudu1JSUmqUKGCRo4c6aDK7ixHfZ589tlndu3Tpk0zf8cLC8JWIeLm5qZJkybp1KlTmc43DEPBwcEaP368BgwYoL1792rz5s2qUKGCWrZsqRUrVmR723/99ZcWLlyY7eXzgrCwMEVGRuro0aMZ5s2fP1+NGzc2v1F9/fr1OnbsmN3UqFEjs7+np6eOHTumf/75R19++aX279+vJ598MsN6+/Tpo2PHjikuLk5ff/21jhw5omeffda6ncwD5s2bp/79+ysqKkpxcXEZ5qcf219++UVvvfWW9u7dqwYNGth9aXlB0rZtWx07dkyxsbEaMmSIxo4dq7ffftucv3//fh07dkzffvutLl26pA4dOujy5cvm/L/++kuNGzdWbGyslixZoj/++ENz5swxv9T95MmTdttLP+d+//13PfXUUwoPD9eSJUvM+c7Ozlq/fr02bdpk/c7fITk957Ly3nDPPfdYvh95xa0+a6ZPn2733ihdPU7pr3fs2HEny80Tcut9L/2z5ejRo/rwww+1Zs0a9ejR407tRp5UpEgRRUREaO3atVq0aJHZ3r9/f5UqVUpjxoxxYHV31p3+PHFzc9OoUaN05cqVO7aPeZKBQiE0NNR47LHHjFq1ahnDhg0z25cvX26knwafffaZIclYuXJlhuW7du1qlC5d2jh79qxhGIYxZswYo0GDBhn6HTx40JBk/Pzzz4ZhGMamTZsMScawYcOMChUqGBcvXjT7enl5GfPnz8+9nbTYlStXDB8fH+P111+3az9z5oxRvHhxY/bs2Rn2PzPz5883vLy87NpmzJhhSDKSkpLMtocfftgYMGCAXb9PPvnEcHd3z+mu5Fnpx3Lfvn1G9+7djTfffNOcd6Njm5qaarRs2dLw9/c3UlJSDMPI/BjnR6GhoUanTp3s2h599FGjadOm5u/WqVOnzHkrV640JBm//PKL2da2bVvj7rvvNs6fP2+3nmPHjhnu7u7Gf/7zH7Mts3OuevXqRnBwsGEY/3dc+/TpYzzwwANmn1OnThmSjE2bNuVshx0gN865rLw3FGTXnqdZ+ay5niRj+fLlGdozOx8LIivf9958803Dyckpw+9/YTR9+nSjZMmSRlxcnLFixQqjaNGiRkxMjKPLumMc8XnSu3dvo3Tp0sbMmTPN9qlTpxr+/v65um95HVe2CpEiRYrorbfe0nvvvZfp/8AuXrxYNWrUUMeOHTPMGzJkiP79919FRkZma9sDBw5USkqK3nvvvWwtnxc4OzurZ8+eioiIkHHN19MtW7ZMqampevrpp7O13sTERC1fvlxFihRRkSJFbtjv5MmT+vzzz9WkSZNsbSc/+Pzzz1WrVi3VrFlTzz77rD7++GO7Y50ZJycnDRgwQIcOHdLOnTvvUKWOU6xYMbv/aUyXlJRk3q7h4uIi6eo58+233+qll15SsWLF7Pr7+voqJCRES5cuvekxzmx7Y8eO1a+//qovvvgip7vjcLlxzln13pBf3eqzBvasfN8rVqyY0tLSlJKSkttl5zv9+/dXgwYN1KNHD/Xt21ejR49WgwYNHF2WQ1n9eeLp6amRI0dq/PjxOnfunIV7krcRtgqZLl26qGHDhpleNj9w4IBq166d6XLp7QcOHMjWdt3d3TVmzBhNmDBBSUlJ2VpHXvDcc8/pzz//1JYtW8y2+fPnq1u3bvLy8jLbmjVrpuLFi9tN10pKSlLx4sXl4eEhHx8fbdq0SeHh4fLw8LDrN2vWLLNf6dKltX//fn388cfW7qQDzZs3z7xNsm3btkpKSrI71jdSq1YtSVefbyioDMPQ+vXr9e233+qRRx4x2++++24VL15c3t7eWrx4sR5//HHzeMTGxsowjJv+Xp86dUrHjx/PMC81NVWffvqpdu/ebbc9SfLz89OAAQM0cuTIfP9HXG6dc1l9bygsbvZZA3tWve/FxsZqzpw5aty4sUqUKJFr9eZXNptNs2fP1oYNG+Tj46Phw4c7uiSHuZOfJy+99JLc3Nw0ZcoU63YojyNsFUKTJk3SggULtHfv3gzzbvW/aTkRFham0qVLa9KkSZZtw2q1atVSs2bNzMDzxx9/6LvvvlNYWJhdv6VLlyomJsZuulaJEiUUExOjn376Se+++67uu+8+vfnmmxm2FxISopiYGP3yyy/6/vvvVa1aNbVp00ZnzpyxbB8dZf/+/dq+fbt5FcDZ2Vndu3fXvHnzbrls+nl77WAvBcXq1atVvHhxubm5qV27durevbvGjh1rzv/uu++0c+dORUREqEaNGpozZ06GddzO73V6wC9WrJj69OmjQYMG6cUXX8zQ79VXX9Xx48fzdfjPzXMuq+8NhcnNPmtwVW6/76X/R567u7tq1qwpHx8fu+eUCruPP/5Y7u7uOnjwYKG86nqnP08kydXVVePHj9c777yjEydO5HQX8iXCViH00EMPKSgoSCNGjLBrr1Gjxg0/FNPba9SoIenqpeHMrlCdPn1akjL9n1xnZ2e9+eabmj59eqYPAOcXYWFh+vLLL3XmzBnNnz9fVatW1cMPP2zXp0KFCqpWrZrddC0nJydVq1ZNtWvX1uDBg9W0adNM/6D18vIyl2/evLnmzZun2NhYLV261NJ9dIR58+YpJSVFfn5+cnZ2lrOzs2bPnq0vv/zylldD08/PypUr34lS76hWrVopJiZGsbGxunDhghYsWGB3BbRy5cqqWbOmQkND9fzzz6t79+7mvGrVqslms93097pkyZIqW7as2ZYe8A8ePKhz585pypQpcnLK+FHh7e2tESNGaNy4cTp//nwu7vGdk9vnXFbeGwqTG33W4P/k9jmY/h95v/32m86dO6eoqCjzc7uw27p1q6ZOnarVq1frgQceUFhYmKX/wZwX3enPk3TPPvus/P399cYbb+T+TuUDhK1CauLEiVq1apWio6PNtuDgYMXGxmrVqlUZ+r/77rsqXbq0Hn30UUlSzZo1dfToUSUkJNj127Vrl9zc3FSxYsVMt/vkk0+qbt26GjduXC7uzZ311FNPycnJSYsXL9bChQv13HPP5fiKyvDhw7V06VLt2rXrpv3Sn+m6cOFCjraX16SkpGjhwoV699137a4G/vLLL/Lz87MbDe96aWlpmjFjhipXrqx77733DlZ9Z3h4eKhatWqqWLGinJ2db9o3PDxcv/32m5YvXy5J5u/srFmzMpwz8fHxWrRokbp37253/qYH/LvuuivTkHWt/v37y8nJSdOnT8/m3jmOFeecFe8N+V1mnzW4yopzMP0/8qpUqZLhuZrC7Pz58+rVq5defPFFtWrVSvPmzdP27dszvXJTkN3pz5N0Tk5OmjBhgmbPnl2gb/e/EcJWIVW/fn2FhIRoxowZZltwcLC6dOmi0NBQzZs3T3///bd2796tF154QStXrtRHH31k/g9IUFCQatasqaefflpbt27VX3/9pS+++EKjRo3SgAEDbjrQw8SJE/Xxxx/n24clixcvru7du2vEiBE6duyYevXqlaHPv//+q/j4eLvp4sWLN1xnhQoV1KVLF40ePdqu/fz58+byv/zyi1588UW5ubmpTZs2ub1bDrV69WqdOnVKYWFhqlevnt3UrVs3u1tq0o/tX3/9pZUrVyowMFDbt2/XvHnzbnreFQbu7u7q06ePxowZY/6P7fvvv69Lly4pKChIUVFROnLkiNauXatHH31Ud911V6a3r2aVm5ubxo0bZ/c+kl9Ycc5l5b2hsMnsswZX8b5354wYMUKGYZjf/1apUiW98847euWVVwrlH/9ZkdufJx06dFCTJk30wQcf3KldyDMIW4XY+PHjlZaWZr622Wz6/PPP9d///ldTp05VzZo11aJFCx06dEibN282v7RSunpL4Lp161SxYkU9/fTTqlevnsaMGaMBAwbo9ddfv+l2H3nkET3yyCP5+sH6sLAwnTp1SkFBQfLz88swPzAwUOXLl7ebbvU9ZYMGDdI333yj7du3m20ffvihuXyrVq104sQJ/e9//1PNmjVze5ccat68eQoMDMz09tNu3brpp59+UnJysqT/O7b169fX8OHDVbt2be3evVutWrUyl0lLS7vl/9oVVP369dPevXu1bNkySVL16tX1008/qUqVKnrqqadUtWpV9e3bV61atVJ0dLRKlSqVo+2FhoaqSpUquVH6HZXb51y6W703FEbXf9ZkVUH/PbbqHIS9LVu2aObMmZo/f77c3d3N9hdeeEHNmjUrlLcTZlVuf55MmjTppv/xXFDZDM4wAAXMxIkT9emnn+q3335zdCkAsqlWrVp6/vnnNXToUEeXAgDZVnD/ywhAoXP+/Hnt27dP8+fPV7t27RxdDoBsSExM1Jo1a7R//361bt3a0eUAQI4QtgAUGHPnztX48eMVGBiY4fk3APlD27ZtderUKc2YMaNADnoDoHDhNkIAAAAAsAADZAAAAACABQhbAAAAAGABwhYAAAAAWICwBQAAAAAWIGwBAAAAgAUIWwAAAABgAcIWACDf6dWrl2w2m2w2m1xcXFStWjWNHz9eKSkpZp/U1FRNnTpV9evXl5ubm0qWLKl27drphx9+sFtXamqqJk6cqFq1aqlYsWIqVaqUmjRpoo8++uiW285sqlSpkpW7DgDIRwhbAIB8qW3btjp27JhiY2M1ZMgQjR07Vm+//bYkyTAMBQcHa/z48RowYID27t2rzZs3q0KFCmrZsqVWrFhhrmfcuHGaOnWqXn/9df3+++/atGmT+vbtq9OnT2e63enTp+vYsWPmJEnz5883X+/YscPqXQcA5BN8qTEAIN/p1auXTp8+bRea2rRpozNnzig6OlpLly5VcHCwVq5cqY4dO9ot261bN23ZskWHDh2Sh4eHGjZsqC5dumjMmDHZqsVms2n58uXq3LmzJOnVV1/V8uXLdfToUfn6+iokJESjR49W0aJFzWXeeOMNzZgxQxcuXFD37t1VpkwZrV27VjExMZKkzZs365VXXtGePXtUtGhR1a1bV4sXL5a/v3+2agQAOAZXtgAABUKxYsV0+fJlSdLixYtVo0aNDEFLkoYMGaJ///1XkZGRkiRfX19t3LhRx48fz5U6SpQooYiICP3++++aPn26PvzwQ02dOtWcv2jRIr355puaNGmSdu7cqYoVK2r27Nnm/JSUFHXu3FkPP/ywdu/erejoaPXt21c2my1X6gMA3DnOji4AAICcMAxDGzZs0Lfffqv+/ftLkg4cOKDatWtn2j+9/cCBA5KkKVOm6IknnpCvr6/q1q2rZs2aqVOnTmrXrl226hk1apT570qVKmno0KH67LPP9Morr0iS3nvvPYWFhal3796SpNGjR2vdunU6e/asJCk5OVlJSUl67LHHVLVqVbuaAQD5C1e2AAD50urVq1W8eHG5ubmpXbt26t69u8aOHWvOz+pd8nXq1NFvv/2mH3/8Uc8995wSExPVsWNHPf/889mqa+nSpWrevLl8fX1VvHhxjRo1SocPHzbn79+/Xw888IDdMte+LlWqlHr16qWgoCB17NjRfEYMAJD/ELYAAPlSq1atFBMTo9jYWF24cEELFiyQh4eHJKlGjRrau3dvpsult9eoUcNsc3Jy0v3336+BAwfqq6++UkREhObNm6eDBw/eVk3R0dEKCQlR+/bttXr1av38888aOXKkeXtjVs2fP1/R0dFq1qyZli5dqho1aujHH3+8rXUAAByPsAUAyJc8PDxUrVo1VaxYUc7O9nfFBwcHKzY2VqtWrcqw3LvvvqvSpUvr0UcfveG669SpI0k6d+7cbdW0detW+fv7a+TIkWrcuLGqV6+uQ4cO2fWpWbNmhhELMxvB8N5779WIESO0detW1atXT4sXL76tWgAAjsczWwCAAic4OFjLli1TaGio3n77bbVu3VrJycmaOXOmVq5cqWXLlplXwZ544gk1b95czZo1k6+vrw4ePKgRI0aoRo0aqlWr1m1tt3r16jp8+LA+++wz3X///frmm2+0fPlyuz79+/dXnz591LhxY/PK1e7du1WlShVJ0sGDBzV37lw9/vjj8vPz0/79+xUbG6uePXvmzsEBANwxXNkCABQ4NptNn3/+uf773/9q6tSpqlmzplq0aKFDhw5p8+bN5jDtkhQUFKRVq1apY8eOqlGjhkJDQ1WrVi2tW7cuwxWzW3n88cc1aNAg9evXTw0bNtTWrVv12muv2fUJCQnRiBEjNHToUN133306ePCgevXqJTc3N0mSu7u79u3bp27duqlGjRrq27evwsPD9cILL+T4uAAA7iy+ZwsAAAd79NFH5evrq08++cTRpQAAchG3EQIAcAedP39ec+bMUVBQkIoUKaIlS5Zo/fr15vd+AQAKDq5sAQBwB124cEEdO3bUzz//rIsXL6pmzZoaNWqUunbt6ujSAAC5jLAFAAAAABZggAwAAAAAsABhCwAAAAAsQNgCAAAAAAsQtgAAAADAAoQtAAAAALAAYQsAAAAALEDYAgAAAAALELYAAAAAwAL/D7QdkL9e60sMAAAAAElFTkSuQmCC",
      "text/plain": [
       "<Figure size 1000x600 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "\n",
    "# Count the frequency of each unique POS tag\n",
    "pos_count = words_ul['POS'].value_counts()\n",
    "\n",
    "# Create the bar plot\n",
    "plt.figure(figsize=(10, 6))\n",
    "plt.bar(pos_count.index, pos_count.values, color='blue')\n",
    "plt.xlabel('POS Tags')\n",
    "plt.ylabel('Frequency')\n",
    "plt.title('Frequency Distribution of POS Tags')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 64,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tag</th>\n",
       "      <th>un-lemmatised</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>POS</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1828</th>\n",
       "      <td>s</td>\n",
       "      <td>ss</td>\n",
       "      <td>[0.18209, 0.88297, -0.49805, 0.53137, -0.36084...</td>\n",
       "      <td>INTJ</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2688</th>\n",
       "      <td>portland</td>\n",
       "      <td>portland</td>\n",
       "      <td>[-0.67776, 0.0077348, -0.48764, -0.44258, 0.09...</td>\n",
       "      <td>INTJ</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8736</th>\n",
       "      <td>ok</td>\n",
       "      <td>ok</td>\n",
       "      <td>[0.30087, 0.47824, 0.54891, 0.033704, 0.14233,...</td>\n",
       "      <td>INTJ</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10540</th>\n",
       "      <td>orc</td>\n",
       "      <td>orc</td>\n",
       "      <td>[0.16322, 0.1405, -0.070897, 0.041023, 0.66704...</td>\n",
       "      <td>INTJ</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10812</th>\n",
       "      <td>like</td>\n",
       "      <td>like</td>\n",
       "      <td>[0.25527, 0.33678, -0.52359, -0.24037, 0.10562...</td>\n",
       "      <td>INTJ</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18451</th>\n",
       "      <td>wy</td>\n",
       "      <td>wy</td>\n",
       "      <td>[-0.59006, -0.57603, 0.26084, -0.11541, -0.133...</td>\n",
       "      <td>INTJ</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23646</th>\n",
       "      <td>playwright</td>\n",
       "      <td>playwright</td>\n",
       "      <td>[-0.0093478, 0.59843, -0.28273, -0.45411, 0.00...</td>\n",
       "      <td>INTJ</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26339</th>\n",
       "      <td>unfaithfulness</td>\n",
       "      <td>unfaithfulness</td>\n",
       "      <td>[0.24544, 0.20927, 0.48207, 0.093218, -0.61773...</td>\n",
       "      <td>INTJ</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33773</th>\n",
       "      <td>hello</td>\n",
       "      <td>hello</td>\n",
       "      <td>[0.26609, 0.21821, -0.10996, -0.48408, -0.1118...</td>\n",
       "      <td>INTJ</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41891</th>\n",
       "      <td>goodness</td>\n",
       "      <td>goodness</td>\n",
       "      <td>[0.46102, 0.17175, 0.64266, 0.56388, -0.79617,...</td>\n",
       "      <td>INTJ</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                  tag   un-lemmatised  \\\n",
       "1828                s              ss   \n",
       "2688         portland        portland   \n",
       "8736               ok              ok   \n",
       "10540             orc             orc   \n",
       "10812            like            like   \n",
       "18451              wy              wy   \n",
       "23646      playwright      playwright   \n",
       "26339  unfaithfulness  unfaithfulness   \n",
       "33773           hello           hello   \n",
       "41891        goodness        goodness   \n",
       "\n",
       "                                               glove_vec   POS  \n",
       "1828   [0.18209, 0.88297, -0.49805, 0.53137, -0.36084...  INTJ  \n",
       "2688   [-0.67776, 0.0077348, -0.48764, -0.44258, 0.09...  INTJ  \n",
       "8736   [0.30087, 0.47824, 0.54891, 0.033704, 0.14233,...  INTJ  \n",
       "10540  [0.16322, 0.1405, -0.070897, 0.041023, 0.66704...  INTJ  \n",
       "10812  [0.25527, 0.33678, -0.52359, -0.24037, 0.10562...  INTJ  \n",
       "18451  [-0.59006, -0.57603, 0.26084, -0.11541, -0.133...  INTJ  \n",
       "23646  [-0.0093478, 0.59843, -0.28273, -0.45411, 0.00...  INTJ  \n",
       "26339  [0.24544, 0.20927, 0.48207, 0.093218, -0.61773...  INTJ  \n",
       "33773  [0.26609, 0.21821, -0.10996, -0.48408, -0.1118...  INTJ  \n",
       "41891  [0.46102, 0.17175, 0.64266, 0.56388, -0.79617,...  INTJ  "
      ]
     },
     "execution_count": 64,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "words_ul[words_ul['POS'] == 'INTJ']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 65,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tag</th>\n",
       "      <th>un-lemmatised</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>POS</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>8707</th>\n",
       "      <td>etc</td>\n",
       "      <td>etc</td>\n",
       "      <td>[0.491, 0.31059, 0.43001, 0.512, 0.1349, -0.37...</td>\n",
       "      <td>X</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10574</th>\n",
       "      <td>super</td>\n",
       "      <td>super</td>\n",
       "      <td>[-0.66806, 0.7057, -1.6854, 0.098448, -0.05147...</td>\n",
       "      <td>X</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "         tag un-lemmatised                                          glove_vec  \\\n",
       "8707     etc           etc  [0.491, 0.31059, 0.43001, 0.512, 0.1349, -0.37...   \n",
       "10574  super         super  [-0.66806, 0.7057, -1.6854, 0.098448, -0.05147...   \n",
       "\n",
       "      POS  \n",
       "8707    X  \n",
       "10574   X  "
      ]
     },
     "execution_count": 65,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "words_ul[words_ul['POS'] == 'X']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "words_ul[[\"tag\", \"POS\"]].head(20)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Joining the words_ul back to the words dataframe"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 66,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tag</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>ner_label</th>\n",
       "      <th>ner_model</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>s</td>\n",
       "      <td>[0.18209, 0.88297, -0.49805, 0.53137, -0.36084...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[(s, O)]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>action</td>\n",
       "      <td>[0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[(action, O)]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>twist</td>\n",
       "      <td>[-0.095859, -0.17472, -0.034692, -0.37307, 0.3...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[(twist, O)]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>overrate</td>\n",
       "      <td>[0.28151, -0.42171, -0.38275, 0.15364, -0.7648...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[(overrate, O)]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>violent</td>\n",
       "      <td>[0.13693, 0.1856, -0.65335, -0.50922, -0.18431...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[(violent, O)]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2894</th>\n",
       "      <td>newspaper</td>\n",
       "      <td>[-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[(newspaper, O)]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2895</th>\n",
       "      <td>static</td>\n",
       "      <td>[0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[(static, O)]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2896</th>\n",
       "      <td>repeat</td>\n",
       "      <td>[0.48671, 0.93464, -0.015418, -0.46056, -0.152...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[(repeat, O)]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2897</th>\n",
       "      <td>seal</td>\n",
       "      <td>[-0.35434, 0.51161, -0.086652, -0.23459, 0.435...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[(seal, O)]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2898</th>\n",
       "      <td>counterespionage</td>\n",
       "      <td>[0.11309, -0.8528, -0.25529, 0.02635, -0.30105...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[(counterespionage, O)]</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>2898 rows × 4 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                   tag                                          glove_vec  \\\n",
       "0                    s  [0.18209, 0.88297, -0.49805, 0.53137, -0.36084...   \n",
       "1               action  [0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...   \n",
       "2                twist  [-0.095859, -0.17472, -0.034692, -0.37307, 0.3...   \n",
       "3             overrate  [0.28151, -0.42171, -0.38275, 0.15364, -0.7648...   \n",
       "4              violent  [0.13693, 0.1856, -0.65335, -0.50922, -0.18431...   \n",
       "...                ...                                                ...   \n",
       "2894         newspaper  [-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...   \n",
       "2895            static  [0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...   \n",
       "2896            repeat  [0.48671, 0.93464, -0.015418, -0.46056, -0.152...   \n",
       "2897              seal  [-0.35434, 0.51161, -0.086652, -0.23459, 0.435...   \n",
       "2898  counterespionage  [0.11309, -0.8528, -0.25529, 0.02635, -0.30105...   \n",
       "\n",
       "     ner_label                ner_model  \n",
       "0          NaN                 [(s, O)]  \n",
       "1          NaN            [(action, O)]  \n",
       "2          NaN             [(twist, O)]  \n",
       "3          NaN          [(overrate, O)]  \n",
       "4          NaN           [(violent, O)]  \n",
       "...        ...                      ...  \n",
       "2894       NaN         [(newspaper, O)]  \n",
       "2895       NaN            [(static, O)]  \n",
       "2896       NaN            [(repeat, O)]  \n",
       "2897       NaN              [(seal, O)]  \n",
       "2898       NaN  [(counterespionage, O)]  \n",
       "\n",
       "[2898 rows x 4 columns]"
      ]
     },
     "execution_count": 66,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "words"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 67,
   "metadata": {},
   "outputs": [],
   "source": [
    "words_ul = words_ul.drop(columns=['un-lemmatised', 'glove_vec'])\n",
    "words_ul"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 68,
   "metadata": {},
   "outputs": [],
   "source": [
    "words_merge = words.merge(words_ul, on=['tag'], how='inner')\n",
    "words_merge"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 69,
   "metadata": {},
   "outputs": [],
   "source": [
    "words = words_merge"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Tag Frequency\n",
    "- Combine with semantic - glove vec representation\n",
    "- use the 'tags' dataframe -> this contains all the duplicates etc\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 72,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "\n",
    "sns.set(style=\"whitegrid\")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 73,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAA14AAAIoCAYAAAB51DqaAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjguMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/H5lhTAAAACXBIWXMAAA9hAAAPYQGoP6dpAABdBElEQVR4nO3dd3yN9///8efJkkRCSRC1gpBKbaJo+ZBaVR3o0IoaVbNVu9SmaakYLVW1d41So1SNLnytVFURNYOqiFih2cn5/eGXU0eCOMnlJDzut1tunOt6X9f1us55JznPvN/XdUxms9ksAAAAAIBhHOxdAAAAAAA87AheAAAAAGAwghcAAAAAGIzgBQAAAAAGI3gBAAAAgMEIXgAAAABgMIIXAAAAABiM4AUAAAAABiN4AQAAAIDBCF4AcA9TpkyRv7+/1VeFChVUrVo1tWjRQqGhobpy5Uq67dq1ayd/f38lJyff9zFTUlJ09uzZTLW9/TirVq2Sv7+/VqxYcd/Hvd+6du/eLX9/f02aNCnbj2WEqVOn6plnnlHFihXVqlWrdOv//vvvdK/13b6QsbTnp06dOkpJSblju7S+6u/vr//7v/8zrJ6sfk+k/QxYtWrVPdv+3//9n/z9/TVlyhSbjgXg4eVk7wIAILd4/fXXVaNGDUlSamqqYmJi9Mcff2j27NlavXq1Fi1aJF9fX0v7bt266ZVXXpGjo+N9Hefs2bPq1q2bmjVrpvfee++e7W09zv3KqK6yZcvq008/zRUh5Mcff9SUKVMUEBCgXr166bHHHkvXpmDBgvr000+tlm3evFmbN2+2ev2ROZcvX9aePXtUp06dDNevX7/+gdQRGBioTz/9VNWqVXsgxwOAjBC8ACCTqlatqpdeeind8pYtW6pr167q2rWr1q9fLyenmz9an376aZuOc/bsWR0/fjzT7W09zv3KqC5vb+8Mn5OcKDw8XJLUs2dPNWrUKMM27u7u6c7nzJkz2rx58x1ff2SsRIkSOnfunL7//vsMg9eVK1e0a9cueXl56dKlS4bXUqJECUOPAQD3wlRDAMiievXqqUOHDoqIiNDatWvtXQ7uIDExUZLk6elp50oeDYUKFVKNGjW0efPmDKcb/vDDDzKbzWrcuLEdqgOAB4/gBQDZ4JVXXpEkbd261bIso2u8NmzYoDZt2qhWrVqWEZQ5c+YoNTVV0s1rSTp27Cjp5vVI/v7++vvvvy3XUi1cuFCdOnVSxYoVVb9+fZ0/f/6O15LFxsZqzJgxql27tqpUqaI333xT27Zts2qTdu3K7dfXJCcny9/fX+3atctUXbdf47V//35169ZNtWrVUsWKFdWsWTNNnTpVCQkJVu38/f01fPhwbdq0Sa1bt1blypX11FNPaeDAgYqKisrUc3/ixAn17dtXdevWVcWKFfXss89q7NixunbtmtVxpk+fLkl666235O/vr927d2dq/3cTERGhIUOGKCgoSBUrVlTVqlX18ssva/HixRnW2atXL9WuXVvVqlXTO++8oxMnTiggIECDBg2ytLt8+bKGDBmiRo0aqWLFinr66afVu3dvHTt27J71tGvXTo0bN9ahQ4fUtm1bValSRc8884yGDx+uy5cvp2t/4MABy+tUqVIltWjRQnPmzLEKSmnXvX3++efq06ePKlWqpLp16+qPP/64Zz3PPfecZbrh7TZs2KCnnnpK3t7eGW77yy+/qH379qpevboqV66sl156SQsWLLB8ryQlJalu3bp3HL1s3bq1nnrqKSUmJt7xGq/MnP/dhIeHq1u3bgoMDFTNmjU1cODADJ9nAJCYaggA2aJ06dJydXXVoUOH7thm06ZN6tu3r+WNtMlk0saNGzVu3DhdunRJAwYMUOPGjZWYmKgZM2aocePGaty4sQoWLKhz585JkiZOnKjAwEANGzZM58+fV9GiRe94vMmTJ8vLy0udOnWS2WzW4sWL1aVLF02ePFlNmza9r/O7V1232rBhg/r166eCBQsqODhYXl5e2r59u6ZMmaJt27Zp/vz5cnV1tbTfvn271q1bpzZt2uj111/Xrl27tGbNGp09e1Zff/31XesKCwvT22+/LUdHR73xxhsqVqyY9u/fr3nz5unHH3/U0qVLLddt/fDDD9q6dau6deumMmXKqGzZsvf1HNzu7NmzeuWVV+Tq6qo2bdqoSJEiioqK0jfffKPRo0fL0dFRbdq0kXQzdLVp00bJyclq166dvL29tXHjRr355puWICHdvHlJ586d9ffff6tt27YqVqyYzp49q0WLFmn79u36/vvvVahQobvWdfXqVbVv3141atTQwIEDFR4eruXLl2vXrl1atWqVPDw8JN38I8H777+v4sWLq3PnznJ3d9eOHTs0btw47du3T1OmTJHJZLLsd+7cufL399fQoUMVERGhgICAez5HTZs2VUhISLrphhcvXtTevXs1evRoRUZGpttuzpw5GjdunEqVKqV33nlHbm5u2rJli0JCQrR7925NmTJFzs7OevHFFzV37lzt27dP1atXt2x//PhxHTx4UO3atZOLi0uGtd3v+d/uzz//VLt27ZQnTx699dZb8vT01Nq1a7Vly5Z7Pi8AHk0ELwDIBiaTSfnz57/rX7tXrlwpNzc3zZw5Uw4ONyccvPbaa2rfvr1OnDghSXriiSd0+fJlzZgxQ/7+/umuKSpYsKC+/PLLTN1Iw9PTU6tWrVK+fPkkSS+//LKee+45ffLJJ2rUqNF93YzjXnWluXHjhkaMGKH8+fNr7dq18vLykiS1bdtWoaGhmjlzpmbNmqV3333Xss25c+f09ddfW944v/baa7p48aL27NmjiIgIqxuW3Co1NVUffvihUlNTtWrVKkuQevPNN1WtWjWNHDlS48eP1yeffKKXXnpJJ0+e1NatW1W3bl099dRTmT73O1m0aJGuX7+uefPmqWLFipblTZs21fPPP6+ffvrJErw+/fRTXb9+XcuXL1flypUtz0m3bt3066+/WrY9fPiwDh06pP79++udd96xLPf399cXX3yhQ4cOqUGDBnetKyYmRq+99prGjBljWVauXDl9/PHHmjVrlnr37q24uDgNGTJE5cuX19KlSy3hJDg4WJMnT9aXX36p77//Xs2bN7fa96xZsyzBLTO8vb0VGBiozZs3a8SIEZY+t3HjRjk6OqpJkyZasGCB1TZnz57VhAkTVLZsWX3zzTdyd3eXJLVv3179+/fXd999pzVr1qhly5Z65ZVXNHfuXK1Zs8YqeH377beS/huJvp2t53+rcePGKTU1VV9//bXKlCkj6Wbfa9++vfbt25fp5wjAo4OphgCQTZKSku76F3IfHx/FxsYqJCREhw4dktlslqOjoxYtWmSZBncvtWrVynRgCg4OtoQuSSpSpIheeuklnT9/Xn/++Wem9nG/duzYoZiYGMtI16169uwpV1dXbdiwwWp58eLFrd40S7IEmejo6Dse6/Dhwzp9+rRatGiRbvSqTZs2KlasmH744YdMTxu7X4MGDdKOHTusQldqaqplyueNGzckSdevX9f27dv19NNPW0KXJDk6Oqp79+5W+yxcuLAcHR21fPlyfffdd5bpks2bN9f69evvGbrS9OrVy+rxm2++KU9PT23atEnSzdfpypUratq0qW7cuKHLly9bvtLCxubNm632UalSpfsKXWkymm64fv16PfPMM8qfP3+69ps3b1ZycrLeeecdS+iSbv5xo0+fPpJk6UN+fn6qUqWKNm7caLmGLzU1VevWrdOTTz6pJ554IsOabDn/W125ckVhYWF65plnLKFLklxcXNS+ffvMPjUAHjGMeAFANkhOTtb169dVuHDhO7Z57733FB4erkWLFmnRokUqWLCgateurUaNGqlp06aWuyHezZ2uh8mIn59fumVpo0enT59W1apVM72vzDpz5swdj+3m5qYSJUpY2qTJaOpc2gjE3ULT3Y5lMplUrlw5/fzzz7py5cp9PW+ZZTKZlJycrKlTp+rgwYM6d+6czpw5Y7mOLW0K4ZkzZ5ScnKzSpUun28fttRcpUkRDhw7VuHHj1K9fPzk4OCggIED16tXTyy+/fMfRv1sVKFAg3XPq7OysEiVKWO5KeerUKUk3p65OnDgxw/3cPo3U1uewSZMmGjNmjDZu3Kg6dero/Pnz2r9/v8aPH59h+7u9rsWLF5e7u7v+/vtvy7JXXnlFw4YN0y+//KLGjRvr//7v/3ThwgV17dr1jjXZcv63+vvvv2U2m1WqVKl06zKqGwAkghcAZIvw8HAlJSVZjX7cztvbW8uXL9eff/6pX375Rbt27dLmzZu1YcMGVa1aVYsWLZKzs/Ndj5M2RTEzMmprNpsl6Z4hz9ZRorT9322/t19zc7dRwqxIO4c7XeOTVVu3blXv3r3l6uqqOnXqqFGjRipXrpxq1Kih+vXrW9olJSVJUoav7a3XuqV588039fzzz+uXX37Rjh07tHv3bn355ZeaOXOmJk+efM+7AN7pfJOTky2ve9rr9O67797xs8ny5s1r9fh++t6tChYsqKeeekqbN2/W8OHD9f3338vV1VXPPvtshu3v1YdSU1OtzrF58+b6+OOPtWbNGjVu3FirV69Wnjx51KJFizvuw5bzz0jaKNvt9QFARgheAJAN0m4jf6ebVpjNZh07dkzx8fGqXLmyKlWqpHfffVc3btzQgAED9OOPP2r79u1q2LBhttV0+8iSJJ08eVLSfyNfadMWb38DefHiRZuOWbJkSUnK8HPI4uLidO7cuQxHCWyR9rlMGR3LbDbr5MmT8vDwsJpumZ3Gjh0rFxcXrV+/3mqk88KFC1btSpUqJZPJZBlluVXa65HmypUrOnbsmJ544gm9+OKLevHFFyVJO3fu1Ntvv60vv/zynsHr4sWL+vfff62CQ2Jiov7++2/LqFvx4sUlSXny5FHdunWttr9x44a2b99+z5t43I/nnntOO3bsUFhYmGXK5K3TCG91ax+qVKmS1bqzZ88qPj7e6qYyHh4eatq0qTZs2KCLFy9qy5YtatSoUYbTGNNk9fxLlCghBweHdK+fdHM0GQAywjVeAJBFe/bs0ddffy0/P787Bi+TyaR3331X3bt31/Xr1y3LPTw8VL58eUn/haC0kYWs/uV8xYoVVoHq77//1po1a+Tr66sKFSpIkiUwHDx40Grb1atXp9tfZup6+umn5eHhoUWLFqX7UNwvv/xSCQkJ931HxTsJCAhQiRIltG7dOsvNSdIsX75c586dU5MmTbLlWBm5cuWKChYsmO4N+syZMyX9N+JWoEAB1alTR9u3b7e6JbzZbNacOXOstt22bZvatWunpUuXWi2vVKmSnJycMjUdNTU1VbNnz7ZaNm/ePMXGxlpGgZ555hnlzZtXCxYsSHdDmOnTp+v999/XL7/8cs9jZVbjxo3l7OysuXPn6uDBg3cdjWrcuLEcHR01c+ZMxcbGWpabzWZNnjxZktSsWTOrbV555RUlJiZq1KhRiouLU+vWre9aT1bP/7HHHlPdunW1c+dO7d+/37I8JSVF8+bNu+uxATy6GPECgEzav3+/JRyZzWZdu3ZN+/fv16ZNm1SwYEFNmTLlrm+Me/bsqYEDB+r1119Xq1atlD9/fsutvgMCAix/eU+7lmbr1q16/PHHbf6A2ejoaLVp00atW7fWlStXtHjxYqWmpmrMmDGWENWkSROFhIRo+vTpio2NVenSpbVnzx5t27ZNBQsWtNpfZury9PTUiBEj9MEHH+jFF1/U66+/Li8vL+3YsUNbt27Vk08+qc6dO9t0PrdzdHTURx99pC5duujVV1/VG2+8oeLFi2v//v1as2aNihUrpv79+2fLsTLy7LPPavXq1erevbsaNmyouLg4bdq0Sfv27ZOLi4tiYmIsbQcPHqw2bdqoTZs2Cg4OVqFChbR161bL3e/Spls2btxY5cuX12effaazZ8+qUqVKio2N1apVq5SYmKhOnTplqrbZs2fr7Nmzqlatmg4cOKBvv/1WVapUUXBwsCQpX758Gj58uAYPHmx5nQoXLqxdu3Zpw4YNqly5st58881se64ee+wx1alTRz/99JM8PT2tpmLermTJkurdu7cmTJigl19+Wa1atbLcTn7Pnj1q2LChZSQwTWBgoEqVKqXNmzfr8ccft7p1fUay4/yHDh2qNm3aqGPHjgoODlbhwoW1fv36DEeaAUAieAFApi1btkzLli2TdPONsru7u3x9ffXOO++offv2KlCgwF23f+mll5Q3b17Nnz9fs2fP1vXr11W0aFG1a9dO3bt3t4Q2Pz8/dejQQStXrlRISIiKFy9u0/U1I0eO1C+//KLJkycrOTlZ1atXV+/eva2mb+XLl0/z58/X5MmT9fXXX8tkMqlWrVpasmRJujvjZbauF198UUWLFtWMGTO0YMECJSYmWt5Md+rUSXny5Lnvc7mT2rVra/ny5Zo2bZpWrlypGzdu6PHHH1enTp3UrVs3w6YZStLw4cP12GOPadOmTdqxY4cKFiyo8uXLa8GCBVq2bJnWr1+vs2fPqkSJEipfvryWLFmiiRMnauHChTKbzXrqqac0adIkde/e3XL9l5ubm+bOnauvvvpKv/zyi9auXStnZ2dVqlRJM2fOVL169TJV28KFC/XRRx9p48aNKlSokLp166bu3btbXRv18ssvq2jRopo1a5YWLFighIQEPf744+revbvefvvtO04FtFXz5s3166+/qlGjRve87q5Lly4qU6aM5s2bp6+++krSzc/KGz58uN54440M+13r1q01ceJEtWzZMlPfL1k9/9KlS2v58uWaNGmSli9frsTERNWtW1d9+vTRW2+9dc/jA3j0mMz3uooVAABkycWLF+Xt7Z3uRiL79u3TG2+8oXfffVfvvfdelo/Trl077dmzR4cOHcrUtEQAwIPDNV4AABjsrbfeUrNmzdLdLTLtpixG3NofAJCz8OcwAAAM1rp1a40fP17t27fXc889JwcHB+3evVvff/+9GjZsqGeeecbeJQIADEbwAgDAYJ07d1ahQoX09ddf67PPPlNiYqJKlCihAQMGqEOHDoZ9lhkAIOfgGi8AAAAAMBjXeAEAAACAwQheAAAAAGAwrvGywe+//y6z2Wz53BUAAAAAj6akpCSZTCZVq1btru0Y8bKB2WxWTrk0zmw2KzExMcfUg9yF/oOsoP/AVvQdZAX9B1lhRP/JbDZgxMsGaSNdlSpVsnMlUmxsrMLDw+Xn5yd3d3d7l4Nchv6DrKD/wFb0HWQF/QdZYUT/+fPPPzPVjhEvAAAAADAYwQsAAAAADEbwAgAAAACDEbwAAAAAwGAELwAAAAAwGMELAAAAAAxG8AIAAAAAgxG8AAAAAMBgBC8AAAAAMBjBCwAAAAAMRvACAAAAAIMRvAAAAADAYAQvAAAAADAYwQsAAAAADEbwAgAAAACDEbwAAAAAwGAELwAAAAAwGMELAAAAAAxG8AIAAAAAgznZu4BLly5p7Nix2rZtmxISEhQYGKgPPvhAZcuWlSSFh4crJCREBw8eVMGCBdWhQwe99dZblu1TU1M1depUrVixQtevX1dgYKCGDx+uEiVKWNrcax+5XWRkpOLj4+Xm5mbvUuTt7a2SJUvauwwAAAAgR7F78OrZs6dSU1M1Y8YM5c2bV5999pk6dOigTZs2KT4+Xh07dlRQUJBGjRql/fv3a9SoUcqbN69at24tSZo2bZqWLFmisWPHysfHR+PHj1fnzp21bt06ubi46MqVK/fcR2529uxZvfLKK4qPj7d3KZIkN3d3HQkPJ3wBAAAAt7Br8Lp27ZqKFSumrl27qnz58pKkHj166KWXXtKxY8e0c+dOOTs7a/To0XJyclLZsmV1+vRpzZgxQ61bt1ZiYqLmzJmj/v37q0GDBpKkSZMmqV69etq0aZNatGih5cuX33UfuV10dLTi4+PV7dPpKl7uCbvW8s+Jo5rWv4uio6MJXgAAAMAt7Bq88ufPrwkTJlgeX758WfPmzZOPj4/8/Pw0ZcoU1apVS05O/5VZu3ZtffXVV4qOjtY///yjf//9V3Xq1LGsz5cvnwICArR37161aNFCYWFhd92Ht7f3gzlZgz1eprxKP1nV3mUAAAAAyIDdpxqmGTZsmJYvXy4XFxd9+eWXcnd3V2RkpGUkLE3hwoUlSefPn1dkZKQkqWjRounapK271z4eluAFAAAAIOfKMcGrffv2ev3117V48WL17NlTS5YsUXx8vFxcXKza5cmTR5KUkJCguLg4ScqwzbVr1yTpnvuwldlsVmxsrM3bZ5e0c0g1pyolJcWutaSmpEqS4uLicsRzg3tL+x5K+xe4H/Qf2Iq+g6yg/yArjOg/ZrNZJpPpnu1yTPDy8/OTJIWEhOiPP/7QokWL5OrqqsTERKt2aUHD3d1drq6ukqTExETL/9PapN3h7177sFVSUpLCw8Nt3j67nD9/XpKUmJBo97CTdoOPiIgIq9cDOV9ERIS9S0AuRv+Breg7yAr6D7Iiu/vP7QM9GbFr8Lp8+bJ27typpk2bWq7BcnBwkJ+fn6KiouTj46OoqCirbdIeFylSRMnJyZZlt97MISoqSv7+/pJ0z33YytnZ2RIW7SltZM8lj0uWgmR2SAtbvr6+qlChgl1rQebExcUpIiJCvr6+OeLjCJC70H9gK/oOsoL+g6wwov8cP348U+3sGryio6PVt29fzZo1S/Xq1ZN0cyTp8OHDCgoKkre3t5YuXaqUlBQ5OjpKknbt2qXSpUvLy8tLnp6e8vDw0O7duy3BKyYmRocPH1ZwcLAkKTAw8K77sJXJZLJ70JH+mzbpYHKwnJ+9ODje/DxuNze3HPHcIPN4zZAV9B/Yir6DrKD/ICuys/9kZpqhJDlky9FsVL58edWvX18fffSR9u7dq6NHj2rQoEGKiYlRhw4d1Lp1a924cUNDhgzR8ePHtWrVKs2bN09du3aVdHNILzg4WKGhodq6dauOHDmiPn36yMfHR02aNJGke+4DAAAAAIxm92u8Jk6cqAkTJqhPnz66fv26atasqcWLF+vxxx+XJM2aNUshISFq2bKlChUqpIEDB6ply5aW7Xv16qXk5GQNHTpU8fHxCgwM1OzZs+Xs7CxJ8vLyuuc+AAAAAMBIdg9enp6eGjlypEaOHJnh+sqVK2vZsmV33N7R0VEDBgzQgAED7tjmXvsAAAAAACPZdaohAAAAADwKCF4AAAAAYDCCFwAAAAAYjOAFAAAAAAYjeAEAAACAwQheAAAAAGAwghcAAAAAGIzgBQAAAAAGI3gBAAAAgMEIXgAAAABgMIIXAAAAABiM4AUAAAAABiN4AQAAAIDBCF4AAAAAYDCCFwAAAAAYjOAFAAAAAAYjeAEAAACAwQheAAAAAGAwghcAAAAAGIzgBQAAAAAGI3gBAAAAgMEIXgAAAABgMIIXAAAAABiM4AUAAAAABiN4AQAAAIDBCF4AAAAAYDCCFwAAAAAYjOAFAAAAAAYjeAEAAACAwQheAAAAAGAwghcAAAAAGIzgBQAAAAAGI3gBAAAAgMEIXgAAAABgMIIXAAAAABiM4AUAAAAABiN4AQAAAIDBCF4AAAAAYDCCFwAAAAAYjOAFAAAAAAYjeAEAAACAwQheAAAAAGAwghcAAAAAGIzgBQAAAAAGI3gBAAAAgMEIXgAAAABgMIIXAAAAABiM4AUAAAAABiN4AQAAAIDBCF4AAAAAYDCCFwAAAAAYjOAFAAAAAAYjeAEAAACAwQheAAAAAGAwghcAAAAAGIzgBQAAAAAGI3gBAAAAgMEIXgAAAABgMIIXAAAAABiM4AUAAAAABiN4AQAAAIDB7B68rl69quHDh6t+/fqqXr263njjDYWFhVnWd+zYUf7+/lZf7dq1s6xPSEjQqFGjVKdOHVWrVk39+vXT5cuXrY6xc+dOtWrVSlWqVFGzZs20fv36B3Z+AAAAAOBk7wL69u2rixcvauLEifLy8tLChQv19ttv69tvv1WZMmX0119/aeTIkWrUqJFlG2dnZ8v/R44cqbCwME2ZMkUuLi4aMWKEevXqpUWLFkmSTpw4oa5du6pjx44aP368fv75Zw0cOFAFCxZUnTp1Hvj5AgAAAHj02DV4nT59Wjt27NCSJUtUo0YNSdKwYcO0bds2rVu3TsHBwbp06ZKqVKmiQoUKpdv+woULWr16taZPn66aNWtKkiZOnKhmzZrp999/V7Vq1TR//nz5+/urT58+kqSyZcvq8OHDmjVrFsELAAAAwANh16mGBQoU0IwZM1SpUiXLMpPJJJPJpJiYGP31118ymUwqXbp0htv/9ttvkqTatWtblpUuXVpFihTR3r17JUlhYWHpAlbt2rX122+/yWw2Z/cpAQAAAEA6dh3xypcvn/73v/9ZLfvhhx90+vRpffjhhzp69Kg8PT01evRo7dixQ+7u7mrWrJl69OghFxcXXbhwQQUKFFCePHms9lG4cGFFRkZKkiIjI+Xj45NufVxcnK5cuaKCBQvaVLvZbFZsbKxN22anhIQESVKqOVUpKSl2rSU1JVWSFBcXlyOeG9xbXFyc1b/A/aD/wFb0HWQF/QdZYUT/MZvNMplM92xn92u8brVv3z4NHjxYTZo0UYMGDfThhx8qISFBlStXVseOHRUeHq5PP/1U//zzjz799FPFxcXJxcUl3X7y5MljCSTx8fHp2qQ9TkxMtLnWpKQkhYeH27x9djl//rwkKTEh0e5hJz4+XpIUEREhV1dXu9aC+xMREWHvEpCL0X9gK/oOsoL+g6zI7v6TUSa5XY4JXlu2bFH//v1VvXp1hYaGSpJGjx6tDz74QPnz55cklS9fXs7OzurTp48GDhwoV1fXDMNTQkKC3NzcJN0MYbe3SXuc1sYWzs7O8vPzs3n77HLt2jVJkkseF7m7u9u1lrSw5evrqwoVKti1FmROXFycIiIi5Ovrm6XvBzya6D+wFX0HWUH/QVYY0X+OHz+eqXY5IngtWrRIISEhatasmcaNG2dJjE5OTpbQlaZcuXKS/ptCePXqVSUmJlqlzKioKBUpUkSSVLRoUUVFRVntIyoqSu7u7vL09LS5ZpPJZPegI8kyzdLB5CBHR0e71uLgePOSQTc3txzx3CDzeM2QFfQf2Iq+g6yg/yArsrP/ZGaaoZQDPsdryZIlGjNmjNq2bauJEydaBah27dpp8ODBVu3//PNPOTs7y9fXVzVq1FBqaqrlJhuSdOrUKV24cEGBgYGSpJo1a2rPnj1W+9i1a5eqV68uBwe7nz4AAACAR4Bdk8epU6f08ccfq3Hjxuratauio6N18eJFXbx4UdevX1fTpk21Zs0aff311zp79qw2bNigTz/9VG+//bY8PDxUpEgRPf/88xo6dKh2796tAwcOqG/fvqpVq5aqVq0q6WZ4O3DggEJDQ3XixAnNmTNHGzduVOfOne156gAAAAAeIXadavjDDz8oKSlJmzdv1ubNm63WtWzZUmPHjpXJZNLChQv18ccfq1ChQurQoYO6dOliaTdmzBh9/PHHevfddyVJ9evX19ChQy3ry5Urp2nTpmn8+PGaP3++ihcvrvHjx/MZXgAAAAAeGLsGr27duqlbt253bdO2bVu1bdv2juvd3d310Ucf6aOPPrpjm/r166t+/fo21wkAAAAAWcFFTgAAAABgMIIXAAAAABiM4AUAAAAABiN4AQAAAIDBCF4AAAAAYDCCFwAAAAAYjOAFAAAAAAYjeAEAAACAwQheAAAAAGAwghcAAAAAGIzgBQAAAAAGI3gBAAAAgMEIXgAAAABgMIIXAAAAABiM4AUAAAAABiN4AQAAAIDBCF4AAAAAYDCCFwAAAAAYjOAFAAAAAAYjeAEAAACAwQheAAAAAGAwghcAAAAAGIzgBQAAAAAGI3gBAAAAgMEIXgAAAABgMIIXAAAAABiM4AUAAAAABiN4AQAAAIDBCF4AAAAAYDCCFwAAAAAYjOAFAAAAAAYjeAEAAACAwQheAAAAAGAwghcAAAAAGIzgBQAAAAAGI3gBAAAAgMEIXgAAAABgMIIXAAAAABiM4AUAAAAABiN4AQAAAIDBCF4AAAAAYDCCFwAAAAAYjOAFAAAAAAYjeAEAAACAwQheAAAAAGAwghcAAAAAGIzgBQAAAAAGI3gBAAAAgMEIXgAAAABgMIIXAAAAABiM4AUAAAAABiN4AQAAAIDBCF4AAAAAYDCCFwAAAAAYjOAFAAAAAAYjeAEAAACAwQheAAAAAGAwghcAAAAAGIzgBQAAAAAGI3gBAAAAgMEIXgAAAABgMLsHr6tXr2r48OGqX7++qlevrjfeeENhYWGW9Tt37lSrVq1UpUoVNWvWTOvXr7faPiEhQaNGjVKdOnVUrVo19evXT5cvX7Zqc699AAAAAICR7B68+vbtq99//10TJ07UypUrVaFCBb399ts6efKkTpw4oa5du6pevXpatWqVXn31VQ0cOFA7d+60bD9y5Eht375dU6ZM0fz583Xy5En16tXLsj4z+wAAAAAAIznZ8+CnT5/Wjh07tGTJEtWoUUOSNGzYMG3btk3r1q3TpUuX5O/vrz59+kiSypYtq8OHD2vWrFmqU6eOLly4oNWrV2v69OmqWbOmJGnixIlq1qyZfv/9d1WrVk3z58+/6z4AAAAAwGh2HfEqUKCAZsyYoUqVKlmWmUwmmUwmxcTEKCwsLF04ql27tn777TeZzWb99ttvlmVpSpcurSJFimjv3r2SdM99AAAAAIDR7DrilS9fPv3vf/+zWvbDDz/o9OnT+vDDD/Xtt9/Kx8fHan3hwoUVFxenK1eu6MKFCypQoIDy5MmTrk1kZKQkKTIy8q77KFiwoE21m81mxcbG2rRtdkpISJAkpZpTlZKSYtdaUlNSJUlxcXE54rnBvcXFxVn9C9wP+g9sRd9BVtB/kBVG9B+z2SyTyXTPdnYNXrfbt2+fBg8erCZNmqhBgwaKj4+Xi4uLVZu0x4mJiYqLi0u3XpLy5MljCST32oetkpKSFB4ebvP22eX8+fOSpMSERLuHnfj4eElSRESEXF1d7VoL7k9ERIS9S0AuRv+Breg7yAr6D7Iiu/tPRpnkdjkmeG3ZskX9+/dX9erVFRoaKulmgLo9HKU9dnNzk6ura4bhKSEhQW5ubpnah62cnZ3l5+dn8/bZ5dq1a5Iklzwucnd3t2staWHL19dXFSpUsGstyJy4uDhFRETI19c3S98PeDTRf2Ar+g6ygv6DrDCi/xw/fjxT7XJE8Fq0aJFCQkLUrFkzjRs3zpIYixYtqqioKKu2UVFRcnd3l6enp3x8fHT16lUlJiZapcyoqCgVKVIkU/uwlclksnvQkWSZZulgcpCjo6Nda3FwvHnJoJubW454bpB5vGbICvoPbEXfQVbQf5AV2dl/MjPNUMoBt5NfsmSJxowZo7Zt22rixIlWAapmzZras2ePVftdu3apevXqcnBwUI0aNZSammq5yYYknTp1ShcuXFBgYGCm9gEAAAAARrNr8jh16pQ+/vhjNW7cWF27dlV0dLQuXryoixcv6vr162rXrp0OHDig0NBQnThxQnPmzNHGjRvVuXNnSVKRIkX0/PPPa+jQodq9e7cOHDigvn37qlatWqpataok3XMfAAAAAGA0u041/OGHH5SUlKTNmzdr8+bNVutatmypsWPHatq0aRo/frzmz5+v4sWLa/z48Va3hx8zZow+/vhjvfvuu5Kk+vXra+jQoZb15cqVu+c+AAAAAMBIdg1e3bp1U7du3e7apn79+qpfv/4d17u7u+ujjz7SRx99ZPM+AAAAAMBIXOQEAAAAAAYjeAEAAACAwQheAAAAAGAwghcAAAAAGIzgBQAAAAAGI3gBAAAAgMEIXgAAAABgMIIXAAAAABiM4AUAAAAABiN4AQAAAIDBCF4AAAAAYDCCFwAAAAAYjOAFAAAAAAYjeAEAAACAwQheAAAAAGAwghcAAAAAGMym4PXdd98pMTExu2sBAAAAgIeSTcFr4MCBevrppzVy5EgdOHAgu2sCAAAAgIeKTcHrxx9/VKdOnbRr1y69/vrrat68uWbPnq2LFy9md30AAAAAkOvZFLx8fHzUvXt3bdy4UYsXL1bNmjU1c+ZMNWzYUN26ddOmTZuUnJyc3bUCAAAAQK7klNUdVK9eXdWrV9err76qTz/9VD///LN+/vlneXt7q3379urUqZMcHR2zo1YAAAAAyJWyFLzOnTunNWvWaM2aNTpz5oxKliypvn37qkGDBvr555/1xRdf6Pjx4xo3blx21QsAAAAAuY5NwWvFihVas2aN9u3bpzx58qhZs2YKCQlRzZo1LW3Kly+vK1euaOnSpQQvAAAAAI80m4LXsGHDVKVKFY0cOVLNmzeXh4dHhu38/f31+uuvZ6lAAAAAAMjtbApe3333nfz8/JSSkmK5fis+Pl5JSUny9PS0tHv55ZezpUgAAAAAyM1suquhr6+vRowYoddee82ybN++fapTp47GjRun1NTUbCsQAAAAAHI7m4LX559/rrVr16pFixaWZQEBAerfv7+WL1+uWbNmZVuBAAAAAJDb2TTVcN26dfrggw/Upk0by7LHHntMHTp0kJOTkxYsWKAuXbpkW5EAAAAAkJvZNOJ15coVlShRIsN1ZcqUUWRkZJaKAgAAAICHiU3Bq0yZMvrhhx8yXPfjjz+qVKlSWSoKAAAAAB4mNk01fOuttzRo0CBdvXpVjRo1kpeXly5fvqyffvpJ33//vT755JPsrhMAAAAAci2bgtfLL7+sf//9V9OmTdOmTZssywsUKKBhw4ZxG3kAAAAAuIVNwUuS2rZtqzfffFOnTp3S1atXlS9fPpUpU0YODjbNXgQAAACAh5bNwUuSTCaTypQpk121AAAAAMBDyabgdfnyZYWEhOjnn39WXFyczGaz1XqTyaTDhw9nS4EAAAAAkNvZFLxGjx6tn376Sc8//7x8fHyYXggAAAAAd2FT8Pr111/14Ycf6vXXX8/uegAAAADgoWPTUJWzs/MdP0AZAAAAAGDNpuDVuHFjfffdd9ldCwAAAAA8lGyaahgQEKDJkyfr7NmzqlKlilxdXa3Wm0wm9ezZM1sKBAAAAIDczuaba0jS3r17tXfv3nTrCV4AAAAA8B+bgteRI0eyuw4AAAAAeGhl+T7w169f14kTJ5SYmKiUlJTsqAkAAAAAHio2B6/du3fr1VdfVa1atfTCCy/o2LFj6tevn8aOHZud9QEAAABArmdT8Nq5c6fefvttubq6qn///jKbzZKkJ554QgsWLNDcuXOztUgAAAAAyM1sCl6TJ0/Ws88+q4ULF6p9+/aW4NWtWzd17txZK1asyNYiAQAAACA3syl4hYeHq3Xr1pJu3sHwVk8//bTOnTuX9coAAAAA4CFhU/Dy9PTUxYsXM1x3/vx5eXp6ZqkoAAAAAHiY2BS8nn32WU2aNEl//vmnZZnJZFJkZKSmT5+uBg0aZFd9AAAAAJDr2fQ5Xv369dMff/yh1157Td7e3pKkvn37KjIyUkWLFlXfvn2ztUgAAAAAyM1sCl758+fXihUrtHr1au3atUtXr16Vp6en2rVrp1atWsnNzS276wQAAACAXMum4CVJLi4ueu211/Taa69lZz0AAAAA8NCxKXitXr36nm1efvllW3YNAAAAAA8dm4LXoEGDMlxuMpnk6OgoR0dHghcAAAAA/H82Ba+tW7emWxYbG6uwsDDNnDlTX3zxRZYLAwAAAICHhU3Bq1ixYhkuL1eunJKSkjRmzBgtWbIkS4UBAAAAwMPCps/xuht/f38dOnQou3cLAAAAALlWtgavxMREffPNN/Ly8srO3QIAAABArmbTVMOgoCCZTCarZampqbpy5YoSEhL0wQcfZEtxAAAAAPAwsCl41apVK13wkiQPDw81bNhQdevWzXJhAAAAAPCwsCl4jR07NrvrkCR99dVX2r59uxYuXGhZNnToUK1YscKqXbFixfTjjz9KujnSNnXqVK1YsULXr19XYGCghg8frhIlSljah4eHKyQkRAcPHlTBggXVoUMHvfXWW4acAwAAAADczqbg9c8//9xX+8cff/yebRYvXqzJkyerZs2aVsv/+usvdevWTcHBwZZljo6Olv9PmzZNS5Ys0dixY+Xj46Px48erc+fOWrdunVxcXHTlyhV17NhRQUFBGjVqlPbv369Ro0Ypb968at269X2dBwAAAADYItuu8bqb8PDwO667cOGCRowYod27d8vX19dqndls1vHjx9WlSxcVKlQo3baJiYmaM2eO+vfvrwYNGkiSJk2apHr16mnTpk1q0aKFli9fLmdnZ40ePVpOTk4qW7asTp8+rRkzZhC8AAAAADwQNgWvyZMna8SIEXryySf14osvqkiRIrpy5Yp+/PFHff/99+revfsdP+vrdocOHZKzs7PWrl2rL774QufOnbOsO3PmjGJjY1WmTJkMtz1y5Ij+/fdf1alTx7IsX758CggI0N69e9WiRQuFhYWpVq1acnL671Rr166tr776StHR0fL29rblKQAAAACATLMpeK1Zs0YNGzZMd61X8+bN5eXlpX379undd9/N1L6CgoIUFBSU4bqjR49KkhYuXKhff/1VDg4Oql+/vvr06SNPT09FRkZKkooWLWq1XeHChS3rIiMjVb58+XTrJen8+fMELwAAAACGsyl47dy5U1OnTs1wXf369bV06dIsFZXm6NGjcnBwUOHChTV9+nSdOXNGn376qY4dO6b58+crLi5OkuTi4mK1XZ48eXTt2jVJUnx8fIbrJSkhIcHm2sxms2JjY23ePruknUOqOVUpKSl2rSU1JVWSFBcXlyOeG9xb2vdQ2r/A/aD/wFb0HWQF/QdZYUT/MZvNmboMy6bgVaBAAf3xxx965pln0q3buXOnihQpYstu0+nevbvefPNNFShQQJJUvnx5FSpUSK+99pr+/PNPubq6Srp5rVfa/6WbYcTNzU2S5OrqqsTERKv9poUVd3d3m2tLSkq667VrD8r58+clSYkJiXYPO/Hx8ZKkiIgIq9cDOV9ERIS9S0AuRv+Breg7yAr6D7Iiu/vP7QM9GbEpeL3yyiv68ssvFRcXp6CgIBUsWFDR0dHauHGjvv76aw0bNsyW3abj4OBgCV1pypUrJ+nmFMK0KYZRUVEqWbKkpU1UVJT8/f0lST4+PoqKirLaR9rjrAREZ2dn+fn52bx9dkkb2XPJ45KlIJkd0sKWr6+vKlSoYNdakDlxcXGKiIiQr6+v5Y8VQGbRf2Ar+g6ygv6DrDCi/xw/fjxT7WwKXj169ND169c1b948zZ49W9LNITY3Nzf16dNHbdq0sWW36QwcOFBRUVGaN2+eZdmff/4pSfLz81OJEiXk4eGh3bt3W4JXTEyMDh8+bLn9fGBgoJYuXaqUlBTLbeh37dql0qVLy8vLy+baTCaT3YOO9N+0SQeTg9Vt9u3BwdFBkuTm5pYjnhtkHq8ZsoL+A1vRd5AV9B9kRXb2n8ze7d2m4GUymTRo0CD16NFD+/fv17Vr11SgQAFVrVpVHh4etuwyQ02bNlWPHj00depUvfjiizp16pRGjx6tFi1aqGzZspKk4OBghYaGqmDBgipWrJjGjx8vHx8fNWnSRJLUunVrzZo1S0OGDFHnzp114MABzZs3T6NGjcq2OgEAAADgbmwKXmk8PDwsdwisWrWqkpOTs6WoNM8++6wmT56sGTNmaObMmfL09NQLL7yg3r17W9r06tVLycnJGjp0qOLj4xUYGKjZs2fL2dlZkuTl5aVZs2YpJCRELVu2VKFChTRw4EC1bNkyW2sFAAAAgDuxOXitWbNGEyZM0MWLF2UymbRixQpNmTJFzs7OmjBhQqYuMLvd7benl6TnnntOzz333B23cXR01IABAzRgwIA7tqlcubKWLVt23/UAAAAAQHZwsGWjDRs26IMPPlDt2rU1ceJEpabevI1448aN9csvv2jatGnZWiQAAAAA5GY2jXhNnz5dbdq00ciRI60+O6p169a6fPmyli9fbjUdEAAAAAAeZTaNeJ06dUqNGzfOcF2VKlV04cKFLBUFAAAAAA8Tm4KXl5eXTpw4keG6EydOZOk27QAAAADwsLEpeDVv3lyff/65Nm7cqMTEREk3bzF/8OBBTZs2Tc2aNcvWIgEAAAAgN7PpGq/evXvr6NGj6t27txwcbma3du3aKTY2VjVr1tT777+frUUCAAAAQG5mU/BycXHRrFmztGPHDu3atUtXr16Vp6enatWqpf/973+Z/vRmAAAAAHgU2BS83n77bXXu3FlPP/20nn766eyuCQAAAAAeKjZd47Vv3z5GtQAAAAAgk2wKXvXq1dPatWuVlJSU3fUAAAAAwEPHpqmGefLk0dq1a/X999+rbNmycnd3t1pvMpk0f/78bCkQAAAAAHI7m4JXZGSkqlWrZnlsNput1t/+GAAAAAAeZZkOXps2bVLt2rWVL18+LVy40MiaAAAAAOChkulrvN5//31FRERYLZs5c6YuXbqU3TUBAAAAwEMl08Hr9umDKSkpmjhxoiIjI7O9KAAAAAB4mNh0V8M0XMsFAAAAAPeWpeAFAAAAALg3m+5qCNxNeHi4vUuQJHl7e6tkyZL2LgMAAADIevAymUzZUQceAlcvXpDJZFJwcLC9S5Ekubm760h4OOELAAAAdndfwatnz55ycXGxWtatWzc5OztbLTOZTNqyZUvWq0OuEhtzTWazWR3HfK6yFSvbtZZ/ThzVtP5dFB0dTfACAACA3WU6eLVs2dLIOvAQKVraT6WfrGrvMgAAAIAcI9PB65NPPjGyDgAAAAB4aHFXQwAAAAAwGMELAAAAAAxG8AIAAAAAgxG8AAAAAMBgBC8AAAAAMBjBCwAAAAAMRvACAAAAAIMRvAAAAADAYAQvAAAAADAYwQsAAAAADEbwAgAAAACDEbwAAAAAwGAELwAAAAAwGMELAAAAAAxG8AIAAAAAgxG8AAAAAMBgBC8AAAAAMBjBCwAAAAAMRvACAAAAAIMRvAAAAADAYAQvAAAAADAYwQsAAAAADEbwAgAAAACDEbwAAAAAwGAELwAAAAAwGMELAAAAAAxG8AIAAAAAgxG8AAAAAMBgBC8AAAAAMBjBCwAAAAAMRvACAAAAAIMRvAAAAADAYAQvAAAAADAYwQsAAAAADEbwAgAAAACDEbwAAAAAwGAELwAAAAAwGMELAAAAAAxG8AIAAAAAg+Wo4PXVV1+pXbt2VsvCw8MVHBysqlWrKigoSAsWLLBan5qaqs8//1z16tVT1apV9c477+js2bP3tQ8AAAAAMFKOCV6LFy/W5MmTrZZduXJFHTt2VMmSJbVy5Ur17NlToaGhWrlypaXNtGnTtGTJEo0ZM0ZLly5VamqqOnfurMTExEzvAwAAAACM5GTvAi5cuKARI0Zo9+7d8vX1tVq3fPlyOTs7a/To0XJyclLZsmV1+vRpzZgxQ61bt1ZiYqLmzJmj/v37q0GDBpKkSZMmqV69etq0aZNatGhxz30AAAAAgNHsPuJ16NAhOTs7a+3atapSpYrVurCwMNWqVUtOTv/lw9q1aysiIkLR0dE6cuSI/v33X9WpU8eyPl++fAoICNDevXsztQ8AAAAAMJrdR7yCgoIUFBSU4brIyEiVL1/ealnhwoUlSefPn1dkZKQkqWjRounapK271z68vb1tqttsNis2NtambbNTQkKCJCnVnKqUlBS71pKamppzakm5WUtcXFyOeJ1yqri4OKt/gftB/4Gt6DvICvoPssKI/mM2m2Uyme7Zzu7B627i4+Pl4uJitSxPnjySbgaOtCcsozbXrl3L1D5slZSUpPDwcJu3zy7nz5+XJCUmJNo9YCQmJOaYWuLj4yVJERERcnV1tWstuUFERIS9S0AuRv+Breg7yAr6D7Iiu/vP7XkjIzk6eLm6ulpukpEmLSy5u7tb3lAnJiZavblOSEiQm5tbpvZhK2dnZ/n5+dm8fXZJC5gueVyydD7ZwSWPS46pJa0/+Pr6qkKFCnatJSeLi4tTRESEfH19Ld8zQGbRf2Ar+g6ygv6DrDCi/xw/fjxT7XJ08PLx8VFUVJTVsrTHRYoUUXJysmVZyZIlrdr4+/tnah+2MplMdg8X0n+jdw4mBzk6Otq1FgcHh5xTi+PNWtzc3HLE65TT8TwhK+g/sBV9B1lB/0FWZGf/ycw0QykH3FzjbgIDA/Xbb79ZXS+0a9culS5dWl5eXnriiSfk4eGh3bt3W9bHxMTo8OHDCgwMzNQ+AAAAAMBoOTp4tW7dWjdu3NCQIUN0/PhxrVq1SvPmzVPXrl0l3ZxLGRwcrNDQUG3dulVHjhxRnz595OPjoyZNmmRqHwAAAABgtBw91dDLy0uzZs1SSEiIWrZsqUKFCmngwIFq2bKlpU2vXr2UnJysoUOHKj4+XoGBgZo9e7acnZ0zvQ8AAAAAMFKOCl5jx45Nt6xy5cpatmzZHbdxdHTUgAEDNGDAgDu2udc+AAAAAMBIOXqqIQAAAAA8DAheAAAAAGAwghcAAAAAGIzgBQAAAAAGI3gBAAAAgMEIXgAAAABgsBx1O3kgu4WHh9u7BAtvb2+VLFnS3mUAAADADgheeChdvXhBJpNJwcHB9i7Fws3dXUfCwwlfAAAAjyCCFx5KsTHXZDab1XHM5ypbsbK9y9E/J45qWv8uio6OJngBAAA8ggheeKgVLe2n0k9WtXcZAAAAeMRxcw0AAAAAMBjBCwAAAAAMRvACAAAAAIMRvAAAAADAYAQvAAAAADAYwQsAAAAADEbwAgAAAACDEbwAAAAAwGAELwAAAAAwGMELAAAAAAxG8AIAAAAAgxG8AAAAAMBgBC8AAAAAMBjBCwAAAAAMRvACAAAAAIMRvAAAAADAYAQvAAAAADAYwQsAAAAADEbwAgAAAACDEbwAAAAAwGAELwAAAAAwGMELAAAAAAxG8AIAAAAAgxG8AAAAAMBgBC8AAAAAMBjBCwAAAAAMRvACAAAAAIMRvAAAAADAYAQvAAAAADAYwQsAAAAADEbwAgAAAACDEbwAAAAAwGAELwAAAAAwGMELAAAAAAxG8AIAAAAAgxG8AAAAAMBgBC8AAAAAMBjBCwAAAAAMRvACAAAAAIMRvAAAAADAYAQvAAAAADAYwQsAAAAADEbwAgAAAACDEbwAAAAAwGAELwAAAAAwGMELAAAAAAxG8AIAAAAAgxG8AAAAAMBgBC8AAAAAMBjBCwAAAAAMliuC14ULF+Tv75/ua9WqVZKk8PBwBQcHq2rVqgoKCtKCBQustk9NTdXnn3+uevXqqWrVqnrnnXd09uxZe5wKAAAAgEeQk70LyIwjR44oT5482rJli0wmk2W5p6enrly5oo4dOyooKEijRo3S/v37NWrUKOXNm1etW7eWJE2bNk1LlizR2LFj5ePjo/Hjx6tz585at26dXFxc7HVaAAAAAB4RuSJ4HT16VL6+vipcuHC6dfPnz5ezs7NGjx4tJycnlS1bVqdPn9aMGTPUunVrJSYmas6cOerfv78aNGggSZo0aZLq1aunTZs2qUWLFg/4bAAAAAA8anLFVMO//vpLZcuWzXBdWFiYatWqJSen/zJk7dq1FRERoejoaB05ckT//vuv6tSpY1mfL18+BQQEaO/evYbXDgAAAAC5IngdPXpUly9fVtu2bVW3bl298cYb+vXXXyVJkZGR8vHxsWqfNjJ2/vx5RUZGSpKKFi2ark3aOgAAAAAwUo6fapicnKyTJ0/Kz89PgwYNkoeHh9avX68uXbpo7ty5io+PT3edVp48eSRJCQkJiouLk6QM21y7ds3musxms2JjY23ePrskJCRIklLNqUpJSbFrLampqdRyB6kpN+uJi4vLEf0mTdr3R9q/wP2g/8BW9B1kBf0HWWFE/zGbzVb3obiTHB+8nJyctHv3bjk6OsrV1VWSVLFiRR07dkyzZ8+Wq6urEhMTrbZJCyPu7u6WbRITEy3/T2vj5uZmc11JSUkKDw+3efvscv78eUlSYkKi3d/QJyYkUssdxMfHS5IiIiKs+mFOERERYe8SkIvRf2Ar+g6ygv6DrMju/pOZG/bl+OAlSXnz5k23rFy5ctq+fbt8fHwUFRVltS7tcZEiRZScnGxZVrJkSas2/v7+Ntfk7OwsPz8/m7fPLmmjdi55XOTu7m7XWlzyuFDLHaSFLV9fX1WoUMHO1fwnLi5OERER8vX1zdIfIvBoov/AVvQdZAX9B1lhRP85fvx4ptrl+OB17Ngxvf766/ryyy/11FNPWZYfPHhQfn5+qlChgpYuXaqUlBQ5OjpKknbt2qXSpUvLy8tLnp6e8vDw0O7duy3BKyYmRocPH1ZwcLDNdZlMphzxhj5tWqWDycFy/vbi4OBALXfg4HizHjc3txzRb26XU+tC7kD/ga3oO8gK+g+yIjv7T2amGUq54OYaZcuWVZkyZTR69GiFhYXpxIkT+uSTT7R//351795drVu31o0bNzRkyBAdP35cq1at0rx589S1a1dJN4f9goODFRoaqq1bt+rIkSPq06ePfHx81KRJEzufHQAAAIBHQY4f8XJwcND06dM1YcIE9e7dWzExMQoICNDcuXNVvnx5SdKsWbMUEhKili1bqlChQho4cKBatmxp2UevXr2UnJysoUOHKj4+XoGBgZo9e7acnZ3tdVoAAAAAHiE5PnhJkre3tz755JM7rq9cubKWLVt2x/WOjo4aMGCABgwYYER5AAAAAHBXOX6qIQAAAADkdgQvAAAAADAYwQsAAAAADEbwAgAAAACDEbwAAAAAwGAELwAAAAAwGMELAAAAAAxG8AIAAAAAgxG8AAAAAMBgBC8AAAAAMBjBCwAAAAAMRvACAAAAAIMRvAAAAADAYAQvAAAAADAYwQsAAAAADEbwAgAAAACDEbwAAAAAwGAELwAAAAAwGMELAAAAAAxG8AIAAAAAgznZuwDgURIeHm7vEiRJ3t7eKlmypL3LAAAAeGQQvIAH4OrFCzKZTAoODrZ3KZIkN3d3HQkPl7e3t71LAQAAeCQQvIAHIDbmmsxmszqO+VxlK1a2ay3/nDiqaf27KDo6muAFAADwgBC8gAeoaGk/lX6yqr3LAAAAwAPGzTUAAAAAwGCMeAGPqPDwcMXFxSkiIkLx8fFyc3OzSx3c6AMAADwKCF7AIyan3uiD8AUAAB5mBC/gEXPrjT5KV6io+Ph4ubq6ysHxwc88vvVGHwQvAADwMCN4AY+ooqX95PtkFcXGxsrd3V2Ojo72LgkAAOChxc01AAAAAMBgBC8AAAAAMBjBCwAAAAAMRvACAAAAAIMRvAAAAADAYAQvAAAAADAYwQsAAAAADEbwAgAAAACDEbwAAAAAwGAELwAAAAAwGMELAAAAAAxG8AIAAAAAgxG8AAAAAMBgBC8AAAAAMBjBCwAAAAAMRvACAAAAAIMRvAAAAADAYAQvAAAAADCYk70LAIDw8HB7lyBJ8vb2VsmSJe1dBgAAeAgRvADYzdWLF2QymRQcHGzvUiRJbu7uOhIeTvgCAADZjuAFwG5iY67JbDar45jPVbZiZbvW8s+Jo5rWv4uio6MJXgAAINsRvADYXdHSfir9ZFV7lyEp50x7lJj6CADAw4TgBQDKedMeJaY+AgDwMCF4AYBy1rRHiamPAAA8bAheAHCLnDTtEQAAPDz4HC8AAAAAMBjBCwAAAAAMRvACAAAAAIMRvAAAAADAYNxcAwBwT2fOnFF0dLTVsri4OEVERCg+Pl5ubm4PrBY+3wwAkBsRvAAAd3XmzBk9UaGC4mJj7V2KJD7fDACQOxG8ACAHCw8Pt3cJCg8PV1xsrHqEztDjZctblqempCo+Pl6urq5ycHwwM9f5fDMAQG71yASv1NRUTZ06VStWrND169cVGBio4cOHq0SJEvYuDQDSuXrxgkwmk4KDg+1dioV3cV+rzzhLSUlRbGys3N3d5ejoaL/CAADIBR6Z4DVt2jQtWbJEY8eOlY+Pj8aPH6/OnTtr3bp1cnFxsXd5AGAlNuaazGazOo75XGUrVrZrLX/8slkrJocoOTnZrnXcKieMBEpcbwYAyLxHInglJiZqzpw56t+/vxo0aCBJmjRpkurVq6dNmzapRYsW9i0QAO6gaGk/q1Eme/jnxFG7Hv9WOW0kMI+rq1Z+842KFi1q71IIgQCQwz0SwevIkSP6999/VadOHcuyfPnyKSAgQHv37iV4AUAukZNGAv8K26lFH3+YY36H5KQQKBEEAeB2JrPZbLZ3EUbbtGmT3nvvPf3xxx9ydXW1LH///fcVHx+vr7766r72t2/fPpnNZjk7O2d3qfctISFB//zzj/J5ecvJyb5TJhPi4/TvtSvyLOgtZ2dqyan13FqLk7OzZJZkkkwy2bWWnPS82LuWnFbPnWoxy/zA+09OfF7cPfPL0c6/D5KTEhV/47py0q90BwcHFSpU6I7X/yUnJ8vJ6cH8/ddkMuWY54Za7ux+6jG6/+Sk54Za7szJyem+rzE2m82W/mMyZc/vrqSkJJlMJlWvXv2u7R6JEa+4uDhJSnctV548eXTt2rX73l/ai5RdL1ZWuLq6qkyZMvYu46a8rpJXAXtXcVNOqkXKWfVQS8ZyUi1SzqqHWjKWk2qRpELe9q4AAHI8k8mU7fd3MJlMmcoFj0TwShvlSkxMtBrxSkhIsOlDP6tVq5ZttQEAAAB4+D2YD16xs7T57lFRUVbLo6KiVKRIEXuUBAAAAOAR8kgEryeeeEIeHh7avXu3ZVlMTIwOHz6swMBAO1YGAAAA4FHwSEw1dHFxUXBwsEJDQ1WwYEEVK1ZM48ePl4+Pj5o0aWLv8gAAAAA85B6J4CVJvXr1UnJysoYOHar4+HgFBgZq9uzZOeLOhAAAAAAebo/E7eQBAAAAwJ4eiWu8AAAAAMCeCF4AAAAAYDCCFwAAAAAYjOAFAAAAAAYjeAEAAACAwQheAAAAAGAwghcAAAAAGIzglUulpqbq888/V7169VS1alW98847Onv2rL3LQi7w1VdfqV27dlbLwsPDFRwcrKpVqyooKEgLFiywU3XIia5evarhw4erfv36ql69ut544w2FhYVZ1u/cuVOtWrVSlSpV1KxZM61fv96O1SInuXTpkgYMGKDatWurWrVq6tKli06cOGFZz88eZNapU6dUrVo1rVq1yrKM/oO7uXDhgvz9/dN9pfUhe/QfglcuNW3aNC1ZskRjxozR0qVLlZqaqs6dOysxMdHepSEHW7x4sSZPnmy17MqVK+rYsaNKliyplStXqmfPngoNDdXKlSvtUyRynL59++r333/XxIkTtXLlSlWoUEFvv/22Tp48qRMnTqhr166qV6+eVq1apVdffVUDBw7Uzp077V02coCePXvq9OnTmjFjhr755hu5urqqQ4cOiouL42cPMi0pKUn9+/dXbGysZRn9B/dy5MgR5cmTR9u2bdP27dstX82bN7db/3EydO8wRGJioubMmaP+/furQYMGkqRJkyapXr162rRpk1q0aGHfApHjXLhwQSNGjNDu3bvl6+trtW758uVydnbW6NGj5eTkpLJly1reKLVu3do+BSPHOH36tHbs2KElS5aoRo0akqRhw4Zp27ZtWrdunS5duiR/f3/16dNHklS2bFkdPnxYs2bNUp06dexZOuzs2rVrKlasmLp27ary5ctLknr06KGXXnpJx44d086dO/nZg0yZMmWKPDw8rJbxuwv3cvToUfn6+qpw4cLp1s2fP98u/YcRr1zoyJEj+vfff63e1OTLl08BAQHau3evHStDTnXo0CE5Oztr7dq1qlKlitW6sLAw1apVS05O//0dpnbt2oqIiFB0dPSDLhU5TIECBTRjxgxVqlTJssxkMslkMikmJkZhYWHpAlbt2rX122+/yWw2P+hykYPkz59fEyZMsISuy5cva968efLx8ZGfnx8/e5Ape/fu1bJlyzR27Fir5fQf3Mtff/2lsmXLZrjOXv2H4JULRUZGSpKKFi1qtbxw4cKWdcCtgoKCNGXKFJUoUSLdusjISPn4+FgtS/vr0Pnz5x9Ifci58uXLp//9739ycXGxLPvhhx90+vRp1atX7479J20qGSDdHCWtU6eO1q9fr5CQELm7u/OzB/cUExOjgQMHaujQoene89B/cC9Hjx7V5cuX1bZtW9WtW1dvvPGGfv31V0n26z8Er1woLi5OkqzeCElSnjx5lJCQYI+SkIvFx8dn2Jck0Z+Qzr59+zR48GA1adJEDRo0yLD/pD3mmlOkad++vVauXKkWLVqoZ8+eOnToED97cE8jR45UtWrV9MILL6RbR//B3SQnJ+vkyZO6du2a3nvvPc2YMUNVq1ZVly5dtHPnTrv1H67xyoVcXV0l3XxTk/Z/6WZHcXNzs1dZyKVcXV3TvUFO+6Hj7u5uj5KQQ23ZskX9+/dX9erVFRoaKunmL6rb+0/aY34eIY2fn58kKSQkRH/88YcWLVrEzx7c1erVqxUWFqZ169ZluJ7+g7txcnLS7t275ejoaHmvXLFiRR07dkyzZ8+2W/9hxCsXShtuj4qKsloeFRWlIkWK2KMk5GI+Pj4Z9iVJ9CdYLFq0SO+9954aNmyo6dOnW/4yWLRo0Qz7j7u7uzw9Pe1RKnKIy5cva/369UpOTrYsc3BwkJ+fn6KiovjZg7tauXKlLl26pAYNGqhatWqqVq2aJGnEiBHq3Lkz/Qf3lDdvXqsBCkkqV66cLly4YLf+Q/DKhZ544gl5eHho9+7dlmUxMTE6fPiwAgMD7VgZcqPAwED99ttvSklJsSzbtWuXSpcuLS8vLztWhpwi7aMr2rZtq4kTJ1pNz6hZs6b27Nlj1X7Xrl2qXr26HBz4FfMoi46OVt++fa0+WiApKUmHDx9W2bJl+dmDuwoNDdWGDRu0evVqy5ck9erVSyEhIfQf3NWxY8dUvXp1q/fKknTw4EH5+fnZrf/wWzEXcnFxUXBwsEJDQ7V161YdOXJEffr0kY+Pj5o0aWLv8pDLtG7dWjdu3NCQIUN0/PhxrVq1SvPmzVPXrl3tXRpygFOnTunjjz9W48aN1bVrV0VHR+vixYu6ePGirl+/rnbt2unAgQMKDQ3ViRMnNGfOHG3cuFGdO3e2d+mws/Lly6t+/fr66KOPtHfvXh09elSDBg1STEyMOnTowM8e3FWRIkVUqlQpqy9J8vLyUpEiReg/uKuyZcuqTJkyGj16tMLCwnTixAl98skn2r9/v7p37263/mMyc7/fXCklJUUTJ07UqlWrFB8fr8DAQA0fPlzFixe3d2nI4QYNGqRz585p4cKFlmUHDhxQSEiIDh8+rEKFCqlTp04KDg62Y5XIKaZPn65JkyZluK5ly5YaO3asfv31V40fP14REREqXry43nvvPTVv3vwBV4qc6Pr165owYYK2bNmi69evq2bNmho0aJDKlSsniZ89uD/+/v765JNP1KpVK0n0H9xddHS0JkyYoG3btikmJkYBAQHq37+/atasKck+/YfgBQAAAAAGY6ohAAAAABiM4AUAAAAABiN4AQAAAIDBCF4AAAAAYDCCFwAAAAAYjOAFAAAAAAYjeAEAAACAwQheAPAIaNeunQICAvTnn39muD4oKEiDBg16ILUMGjRIQUFBD+RY9yM5OVmDBg1StWrVVL16de3atStdm927d8vf31+7d+/OcB+rVq2Sv7+//v7770wf9++//5a/v79WrVplc+3ZKSgoSP7+/nf9mjJlir3LBIBcx8neBQAAHoyUlBQNHjxYq1atkouLi73LyXG2bdumb7/9Vj169FDdunUVEBDwQI5buHBhLVu2TCVLlnwgx7uXqVOnKjEx0fL43XffVUBAgHr06GFZ5uPjY4/SACBXI3gBwCPC09NTx44d0xdffKE+ffrYu5wc5+rVq5KkVq1aqUSJEg/suC4uLqpateoDO9693B44XVxcVLBgwRxVIwDkRkw1BIBHRIUKFfTyyy9r1qxZOnjw4F3bZjSdbMqUKfL397c8HjRokN5++20tW7ZMjRo1UuXKldWmTRudOnVKP/30k1544QVVqVJFr776qsLDw9MdY9myZWrQoIEqV66s9u3b6/Dhw1br//nnH/Xt21e1atVSlSpV0rVJm6I3d+5cNWvWTFWqVNHKlSszPJ+UlBQtXrxYL7zwgipXrqwGDRooNDRUCQkJlnNJm2rZqFEjtWvX7q7PT2atWrVKAQEB+uOPP/T666+rUqVKatiwoWbPnp3uPG6danjkyBF16NBB1apVU1BQkFasWKEOHTpYarzT9MSMpnFu2bJFrVq1UqVKlfT000/ro48+UmxsbJbOKz4+XhMmTFCTJk1UsWJFVa9eXR07dkz3On/77bdq3ry5KlWqpBdffFE7d+5UQECApe7U1FRNmjRJQUFBqlixooKCgjRhwgQlJSVlqT4AyIkY8QKAR8iHH36oHTt2aPDgwVq5cmWWpxz+/vvvioqK0qBBg5SQkKCRI0eqS5cuMplM6tWrl9zc3DRixAj1799f69evt2wXGRmpqVOnql+/fvLw8NDUqVPVrl07rVu3To8//rguX76sNm3ayM3NTcOGDZObm5vmz5+vtm3b6ptvvlHZsmUt+5oyZYqGDBkiDw8PValSJcM6hw8frjVr1uidd95RzZo1dfjwYX3xxRcKDw/XrFmz1KNHD/n4+OjLL7/U1KlTVbp06Sw9L7dKTU1V79691aFDB/Xu3VvffPONPv30U5UvX1716tVL1z4yMlJt27ZVqVKlNH78eMXExGjixIlKSEi47yl+69atU//+/fXCCy+od+/eOnfunCZNmqTjx49r7ty5MplMNp3TwIEDFRYWpr59+6pkyZI6ffq0PvvsM/Xr10/r16+XyWTS6tWrNWjQIL366qsaPHiwDhw4oB49eiglJcWyn5kzZ+rrr7/WBx98oBIlSuiPP/7QpEmT5OzsrF69etlUGwDkVAQvAHiE5M+fX6NHj1b37t2zZcrhv//+q8mTJ1uC0J49e7R06VLNmzdPderUkSSdPn1a48aNU0xMjPLlyyfp5gjUF198ocqVK0uSqlSpokaNGmnhwoX64IMPNH/+fF29elVff/21ihUrJkmqX7++mjdvrs8++0yff/65pYbnnntOrVu3vmONx48f1zfffKN+/fqpS5cukqSnn35ahQsX1sCBA/Xrr7/qf//7n+UaqwoVKqh48eJZel5uZTab1aNHD7366quSpBo1amjz5s36+eefMwxe8+fPV0pKimbOnCkvLy9JUqlSpfTmm2/e93FDQ0NVr149hYaGWpb7+vqqQ4cO+uWXX9SgQYP7Pp/ExET9+++/Gjp0qJo3by5JqlWrlm7cuKGxY8cqOjpahQoV0meffaaGDRvqo48+kiTVq1dPzs7OmjBhgmVfe/bsUcWKFS2vX61ateTm5iZPT8/7rgsAcjqmGgLAIyYoKEgvvviiZs2apUOHDmVpX/nz57caffL29pYkq5Gnxx57TJIUExNjWVaiRAlL6JKkQoUKqWrVqtq7d68kaefOnapQoYKKFCmi5ORkJScny8HBQfXr19f//d//WdVQoUKFu9a4Z88eSdLzzz9vtfz555+Xo6PjHe9QmJHMjhDd3q5atWqW/6ddM3Wn6X5hYWGqWrWqJXRJN8NaWgDNrJMnTyoyMlJBQUGW5zA5OVmBgYHy8PDQjh077mt/t9Y/e/ZsNW/eXBcuXNCuXbu0dOlS/fTTT5JuBrPTp0/rn3/+UbNmzay2vf01eOqpp7Rjxw69+eabmjVrlo4fP67g4GC99NJLNtUGADkZI14A8AgaOnSodu7caZlyaCsPD48Ml7u7u991u7SAdisvLy+dP39e0s0bXZw+fVpPPvlkhtvHxcVl+ljXrl2TdDPc3crJyUkFChTQ9evX77r9rdzc3CTJ6q5/t0pbntYujaurq9VjBwcHmc3mO9ab0c09ihQpkuk6pf9uFjJq1CiNGjUq3fqoqKj72t+ttm3bpo8//lgnT55U3rx59cQTT1heB7PZrMuXL0uSVXiU0r/unTt3Vt68ebVy5UqFhoZq/PjxKleunIYOHaratWvbXB8A5EQELwB4BOXPn18jR45Uz549NW3atAzb3HotjqQs35DhVmlh6FYXL15UwYIFJd28A2OtWrU0cODADLe/n2vT8ufPb9n/raNGSUlJunLligoUKJDpfaWFtzuFlsjISLm4uFiOaYsCBQooOjo63fKrV6+qVKlSkv4bUbvba5Q2rXPgwIGqVatWuv3ZWuOZM2fUs2dPNWrUSF999ZVKlCghk8mkxYsXa9u2bZL+u938pUuXrLa9/bGDg4Patm2rtm3b6tKlS/rll180ffp0vffee9qxYwcfewDgocJUQwB4RDVq1EgtWrTQjBkzLCMUaTw8PHThwgWrZfv27cu2Y586dUpnzpyxPD5//rx+//13PfXUU5JuXutz6tQplS5dWpUqVbJ8rVmzRt98840cHR0zfay00HHrzT3SHqekpKhGjRqZ3pePj49Kliyp77//Pt26lJQUbdmyRYGBgfdV3+3q1Kmj33//3er5P3nypE6fPm15nDbSeGubpKQkHThwwPK4TJky8vLy0t9//231HBYpUkQTJkxIdxfJzDp48KASEhLUpUsXlSxZ0hIC00KX2Wy2PE+bN2+22nbTpk1Wj9u0aWO5BszLy0utWrVS27ZtFRMToxs3bthUHwDkVIx4AcAjbNiwYdq1a1e6EZYGDRpo/fr1qlKlikqVKqVVq1ZZvfHPqjx58qh79+7q06ePUlJS9Nlnn+mxxx5T+/btJUkdOnTQmjVr1KFDB3Xq1EkFChTQhg0btHz5cg0ePPi+juXn56eWLVvq888/V1xcnAIDAxUeHq6pU6fqqaeeyvAGF3fTv39/9e7dW926dVPr1q1VoEABRUVFaenSpTp37pzGjh17X/u7Xfv27bV69Wp16tRJ7733nsxmsyZPnqzU1FRLm/z586tatWpauHChSpUqpfz582vBggWKj4+3TPlzdHRUnz59NHz4cDk6Oqphw4aKiYnRtGnTdOHChTtO47yXJ598Uk5OTho/frw6deqkxMRErVq1Sj///LOkm6NuaXe17N+/v0aMGKHGjRvryJEj+uKLLyTdHOmSpMDAQM2ZM0fe3t6qVq2aLly4oLlz56pWrVqW0U8AeFgQvADgEfbYY49p5MiRevfdd62WDx48WMnJyRo3bpycnJzUvHlz9evXT0OHDs2W4wYEBKhp06YaOXKkrl+/rjp16ujDDz+0vNkuUqSIli5dqgkTJmjkyJFKSEiQr6+vQkJC9Morr9z38UJCQlSqVCmtXLlSM2fOVOHChfXWW2+pR48elhCQWU2bNtWcOXM0b948jRgxQjExMSpYsKACAwO1fPlylStX7r7ru1WBAgW0ePFiffzxxxo0aJA8PDzUuXNnLViwwKrd2LFjNWbMGA0dOlQeHh565ZVXVKNGDa1YscLS5tVXX1XevHk1a9YsLVu2TO7u7qpevbpCQ0Nt/pDoUqVKacKECZo6daq6d++u/Pnzq2rVqlq4cKHatWunsLAw+fv764UXXlBsbKxmz56tlStXqly5choyZIiGDBliCYfvv/++XFxctHLlSn3xxRfy9PRUUFCQ+vXrZ/sTCAA5lMl8p6t7AQBAjhEUFKRatWpleUTtQfnuu+8UEBCgMmXKWJb9/PPP6tq1q9asWaMnnnjCjtUBwIPHiBcAAMh2a9eu1aRJk9S7d28VLVpUp0+f1ueff65atWoRugA8kgheAAAg240bN04TJkzQ+PHjdfnyZXl7e6tZs2bq1auXvUsDALtgqiEAAAAAGIzbyQMAAACAwQheAAAAAGAwghcAAAAAGIzgBQAAAAAGI3gBAAAAgMEIXgAAAABgMIIXAAAAABiM4AUAAAAABiN4AQAAAIDB/h+6QcWADJ0esAAAAABJRU5ErkJggg==",
      "text/plain": [
       "<Figure size 1000x600 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "tags_per_movie = tags.groupby('movieId')['tag'].nunique()\n",
    "\n",
    "plt.figure(figsize=(10, 6))\n",
    "sns.histplot(tags_per_movie, bins=20, kde=False, color='skyblue', edgecolor='black')\n",
    "plt.xlabel('Number of Unique Tags', fontsize=12)\n",
    "plt.ylabel('Frequency', fontsize=12)\n",
    "plt.title('Distribution of Tags per MovieId', fontsize=14)\n",
    "plt.show()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 74,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAABroAAAOqCAYAAADDhYW0AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjguMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/H5lhTAAAACXBIWXMAAA9hAAAPYQGoP6dpAAEAAElEQVR4nOzdeZRfg/3/8dfMZG9iC0kUIbb4xhZKaim1JbVX7BKpLRqlX5TYtZQqJY0lte+qijSRqMbSVrXlh1qqtBJEEoJEhFgi+8z8/nAy344EyWQmn89NHo9zeo753Pu57/dncE55uvdTUVtbWxsAAAAAAAAomMpSLwAAAAAAAAANIXQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhdSs1AsAAAClN2TIkPzqV79apHN79+6dSy65pIk3+j/9+vXLP/7xj4Ueu+OOO/LNb36z7ufnn38+V111Vf7zn/+ktrY2W221VQYOHJj1119/seaMHDkyG2200ULPe+utt7LrrrsmSY477rj86Ec/WtyPtFgmTJiQddZZ5yvP69q161eec9ZZZ+XII49c8qUKqrq6Ou+8807WWmutLzxnUX6P8/35z3/Ommuu2RirAQAADSR0AQAA6dmzZzp37lzvtYsvvjjTpk3LpZdeWu/1z5/X1F555ZVsvvnm6du37wLH1ltvvbo/fvrpp3PMMcdkjTXWyIABA1JTU5M77rgjhxxySO699956536Vhx566AtD16hRoxb/QzTQNddck2uuuSb//ve/F+n8lVdeOWedddYXHt9kk00aa7XCmThxYo477rjsvvvu+d///d8vPO/zf70/99xzueeee9KzZ8/07Nmz3rFVVlmlSXYFAAAWndAFAABko402WiDsXHnllZk2bVq++93vlmirZNKkSfnoo4+y7bbbfuketbW1ueCCC7LSSivlnnvuyUorrZQk6dWrV/bdd99ccsklufHGGxdp5tprr52HHnooJ5988kKPjxo1Ku3bt8/777+/uB9nsf3973/P3LlzF/n8Nm3alPTPVzmbOHFixo4d+5Xnff73V11dnXvuuSddu3b1uwUAgDLkO7oAAICy9corryRJNthggy8976WXXsrYsWOz33771UWuJFlnnXXSs2fPPP7445kyZcoizdxjjz0yfvz4utn/bdy4cRk9enR23333Rf8QAAAANBmhCwAAWGwvvPBCjjvuuPTo0SObbLJJdt999/zqV7/K7Nmz653XtWvXnHPOOXnggQey5557ZtNNN02vXr1y/fXXp7q6+ivnjBkzJsn/ha4ZM2akpqZmofskSffu3Rc4tvnmm6empiYvvfTSIn22PfbYI8lnjy/8vFGjRuVrX/tavv3tby/0va+//npOOeWUbLfddtlkk02y66675pJLLslHH31U77wPPvgg55xzTnbbbbdssskm2X777XPyySfntddeqzuna9euef755+v++Mwzz1yk/RfF8OHD07Vr19x///058MADs8kmm+Q73/lOZs6cmeSzoHfKKadk2223zSabbJJevXrliiuuyKxZsxa41t1335199tknm222WXbbbbfccccdufnmm9O1a9e88cYbST57rGTXrl1z+eWXL/D+ww47bIHvxaqpqcmvf/3rfPe7381mm22WrbbaKv37989zzz1X77whQ4aka9euee211/KTn/wk22+/fTbddNPsu+++GTFiRL3zjjrqqCTJr371q3Tt2jVvvfXWEv0Ok2TKlCm56KKL8p3vfCebbbZZNttss+y55565+uqrM2/evHrnvvvuuznrrLPyrW99q+5RnP/85z/Ts2fP9OvXr+68mTNn5uKLL87uu++ezTbbLN/85jczYMCABT47AADwGY8uBAAAFsuoUaNy6qmnZpVVVsnhhx+e9u3b5/HHH8+QIUPy97//PbfffntatWpVd/6TTz6ZESNG5KCDDkqfPn3y6KOPZvDgwRk9enSuuOKKL501P3T97ne/y6hRozJ16tS0adMmPXv2zBlnnJH27dsnSSZPnpwk6dSp0wLXmP/aooaN9ddfPxtssEEeeuihnHTSSfWOPfjgg9l1113rfb75nn322RxzzDGpqqrKYYcdljXWWCMvvPBCbrvttjz66KO5++67s8oqq6S6ujr9+/fPW2+9lb59+2aNNdbIxIkTc+edd+bxxx/Pgw8+mNVWWy2XXnpprrnmmkyYMCGXXnrpIn03Wk1NTT744IOFHmvbtm1atGhR77XzzjsvPXv2zIEHHpjp06endevWefHFF3PkkUembdu26du3b1ZZZZW88MILue666/Lkk0/mjjvuSMuWLZMkl1xySW699dZ07949AwcOzJQpUzJ48OB06NBhkX7XX+TUU0/NqFGj8p3vfCcHH3xwPvroowwfPjz9+vXL4MGDF7ijbsCAAenQoUMGDBiQOXPm5Pbbb88ZZ5yRDh06ZLvttkvPnj0zZ86c3HDDDXXftbWk36/1ySef5JBDDsnHH3+cPn36pHPnzvnwww8zYsSIXHXVVZk1a1ZOPfXUJJ+FzUMOOSRTp07NoYcemi5duuRvf/tbjjjiiFRVVdX76/aUU07JE088kb59+2bdddfN1KlT85vf/CZHHHFEfve7333hd8cBAMDySugCAAAW2fTp03PeeedlxRVXzP33318Xmvr27ZtBgwblxhtvzE033ZQf/vCHde95++23c9lll2XfffetO/d///d/8+CDD+aQQw7Jtttu+4Xz5j8+cMyYMTn99NPTsmXLPPHEExk6dGj++c9/ZujQoVlppZUyffr0JJ99R9XnzY9S8+9WWhR77LFHrrrqqrzyyit1dxu98sorGTt2bE4//fQFzq+pqcnZZ5+dmpqaDB8+POutt16SpE+fPtliiy1y/vnn57LLLsvFF1+cl19+Of/5z38ycODAHHvssXXX6Nq1a66++ur85z//yU477ZTvfve7ufvuuzNhwoRF/m6oSZMmfeHv8+KLL87+++9f77WNN944l156ad3PtbW1Ofvss7PCCitkxIgRdY+B7NOnT7beeuuce+65ueOOO3Lsscdm3Lhxue2227L55pvnzjvvTPPmzZMku+66aw477LBF2ndhRo0alVGjRuW0005L//79614/4ogjcuCBB+b888/Pt7/97bRu3bruWJcuXXLTTTeloqIiSbLZZpulX79+GTZsWLbbbrtstNFG+eCDD3LDDTc02ndt3XfffXnnnXdy1VVX5Tvf+U7d64cccki22267/OUvf6kLXb/61a8yadKkeuf27ds3P/nJT3LPPffUvfeDDz7Io48+msMOOyxnnHFG3evbbLNNzjzzzLz00ktCFwAAfI5HFwIAAIvsiSeeyMcff1x3J9d/O+GEE9KqVauMGjWq3uvrrrtuXeRKkoqKinz/+99Pkjz88MNfOq9Pnz459dRTc8cdd+S73/1udt9991x44YU544wz8uabb+bGG29M8lmg+SLzj1VWLvo//izs8YWjRo3KSiutlO22226B819++eW88cYb2Xvvvesi13yHHnpo1lhjjTz88MOprq5Ohw4dUlVVlXvvvTcPPPBA3WMN99xzz/zhD3/ITjvttMh7ft6qq66aW2+9daH/+9a3vrXA+dtss029n1955ZW89tpr+fa3v113d9j8/+28885p2bJl/vjHPyZJHn300dTW1uaII46oi1xJssUWW2THHXds8Gf4wx/+kCT5zne+U2/+7Nmz06tXr0ybNi3PPPNMvffss88+dZErSTbZZJMkydSpUxu8x1f53ve+l//3//5fevbsWe/1Dz74IO3atauLr8lndwKus8469YJY8tnfM/+tbdu2adeuXR5++OEMHTo07733XpLPfqcPP/xwDjrooCb6NAAAUFzu6AIAABbZm2++meSzx/t9XuvWrbPWWmvVnTPf/O/X+m/rrrtukmTixIlfOu+/v7vov/Xt2zeXXXZZHn/88Zx22mn52te+liQL/Q6p+a+1a9fuS2d9fr+NNtqo3uMLR40alV69etWLOvN92e+loqIiG2ywQR577LFMmzYtHTt2zLnnnptf/OIXOfXUU1NZWZlu3bplhx12yH777Zd11llnkff8vJYtWy40xH2RVVddtd7P48aNS/LZ927dfffdC33P22+/neT/HgW59tprL3DOBhtskL/+9a+LvMd/Gz9+fJJkt912+8Jz5u8w3+c/x/xHNC7s+9waU2VlZW655Zb861//yptvvpmJEyfm008/TZJ07NgxSfLhhx/mgw8+yOabb77A+zt27Fjvr8sWLVrkkksuyVlnnZVzzz03SbLhhhvmW9/6VvbZZ59069atST8PAAAUkdAFAAAssi+7cypJqqurF/geqM//nCTz5s1LkjRr1rB/JGnRokVWWGGFuqiw5pprJvnsu7o+HwPmf3/X6quvvlgz9thjj1x++eV59dVXM2fOnLz55pu58MILG7RvdXV13d7JZ3eq7bXXXvnrX/+aJ554Ik8//XSuvfba3HjjjbniiisWuEuoqVRVVdX7ef6f30MPPXSBu4/m+/yfs4X9NbGw7zD7IvN/N/PV1NSkdevWueaaa77wPV26dKn38+LcrddYXnzxxRx99NGZN29ettlmm+ywww7ZYIMNsuWWW6Zfv351kW3u3LlJFv73QbLg72q33XbL9ttvn7///e95/PHH8/TTT+eWW27JrbfemrPPPjvf+973mvaDAQBAwQhdAADAIuvcuXOSZOzYsQscmzlzZt5+++0F7vCZMGHCAufOv3Po88Hiv40ePToDBw7M9ttvn7PPPrvesffffz/Tpk3LxhtvnOSz72RKPosPu+yyS71zX3zxxVRUVCz0jpovs+eee+byyy/Pww8/nBkzZmS11VZLjx49FnruWmutlWThv5fa2tqMGzcubdu2zQorrJBp06bltddey0YbbZR999237rGOTz75ZI455phce+21Sy10fd78YFhbW7vAnWE1NTV5+OGH6z7r/LvyXn/99Wy66ab1zv38n/P5QW3OnDkLzPz84wXXXHPNjB8/PhtssEFWW221esdGjx6dKVOm1Pt+rlIZPHhwpk+fnvvvvz8bbrhh3etz587NtGnTsuKKKyZJ2rdvn3bt2tXdqfbfPvroo0ydOrXu74Pp06fnlVdeyZprrplevXqlV69eST773N/73vdy9dVXC10AAPA5vqMLAABYZNtvv33atm2bO++8M++//369Y9dee21mz569wJ1AL730Up566qm6n2tqanL99denoqIie+211xfOWmeddfLuu+/mvvvuq7srK/kswvzyl79Mkuy///5JPgtdXbp0ye9+97t8+OGHdedOmDAhf/zjH7Pzzjtn5ZVXXqzP2rlz52y88cZ55JFH8vDDD2ePPfb4wjuHunXrlrXWWiu///3v8/rrr9c7du+99+btt9+uixZ///vf069fvwUeDbjpppumWbNm9e6Ymh+ImvoRfPNtsskmWWONNTJy5MgFwsw999yTk08+OcOGDUuSusc43nLLLZk9e3bdeRMnTswjjzxS773zH+P3n//8p97rzzzzzAKPIZz/18+VV15Z7/Xp06fn5JNPzgknnFBv3qKa/+eusX6X06ZNS6tWrRYIu7/+9a8za9asujvVKisrs/vuu+fVV1/NE088Ue/cW265pd4dca+88kr69OmzwN1sG2ywQdq1a9fgOyABAGBZ5v8lAwAAi6xdu3Y577zzcsYZZ2TffffNIYcckvbt2+eJJ57In//852y88cbp379/vfe0bNkyxx13XPr27ZvVV189Dz/8cP7xj3/kyCOPXOBOoP/WunXrnHvuuTnzzDNz8MEH57DDDkvbtm3zpz/9KU899VT22WefeqHsJz/5SY499tgccsgh6du3b2bPnp3bb789rVu3zmmnndagz7vHHntk0KBBSfKlUa6qqio/+9nP8v3vfz8HHXRQDjvssKy55pp54YUXMnLkyKyxxhoZOHBgkqRnz57ZcMMNc+WVV2bixInZdNNNM2PGjAwfPjxz5szJ0UcfXXfd9u3bJ0muuuqq9OjRY7G+f6sh5n+OAQMG5MADD8yhhx6atddeOy+99FKGDRuWzp075/jjj0+SdOrUKWeccUZ+9rOf5aCDDkrv3r0zY8aM3HnnnamoqKh33bXWWivf+MY38vTTT+fkk0/O9ttvn/Hjx+eee+5Jly5d6kW1/fffPw899FCGDh2aiRMnZtddd828efMydOjQTJgwIaeddlpdOFsc87/H689//nO+/vWvp2fPnllppZUa/Lvaddddc/XVV+eoo47K3nvvndra2vztb3/LY489llatWmX69Ompra1NRUVFTjrppDz22GMZMGBA+vTpk3XWWSdPPfXUAt9jtuWWW2a77bbL3XffnY8//jg9evRIdXV1Hnzwwbz99ts544wzGrwvAAAsq4QuAABgsey7775ZffXVc8MNN+SOO+7InDlz0rlz55x88sk5+uij07Jly3rnb7zxxunTp0+uuuqqvPvuu+nSpUsuuuiiHHjggV85a7/99kuHDh1y/fXX54Ybbkh1dXXWXXfd/OQnP8lhhx1W79ztttsuN998c4YMGZJf/vKXad26db7xjW/klFNOqXvM3uKaH7rWWGONdO/e/UvP3WabbXLvvffmmmuuybBhwzJ9+vR8/etfz9FHH53jjjsuK6ywQpLPAt6tt96a66+/Pn/9619z//33p3nz5tl0001z4403Zocddqi75nHHHZdx48blpptuyr/+9a8mD13JZ7/He++9N9dee22GDx+eTz75JJ06dUqfPn0yYMCAeo8T7NevXzp16pTrrrsugwcPTvv27XPEEUdk3LhxGTlyZL3rXnnllfnlL3+Zxx57LI8++mi6du2awYMH569//Wu90FVVVZXrrrsut99+e0aOHJlBgwaldevWWW+99TJkyJC6O+MW1/rrr58jjzwyw4YNy0UXXZQ111wz2267bcN+SUmOP/74VFVVZcSIEbn44ouz4oorpkuXLrn66qvz0ksv5brrrss//vGPfPOb38xqq62W3/72txk8eHBGjBiRmTNnpnv37rn55pvTt2/fuu/vqqioyJAhQ3LLLbfkwQcfzGOPPZYk2WijjTJo0KDss88+Dd4XAACWVRW1X/Vt0gAAAA3UtWvXbLnllvntb39b6lVYis4888zcd999eeSRRxZ4tN/yaOrUqVl55ZXrHkU537vvvpsdd9wxvXv3ziWXXFKi7QAAoNh8RxcAAAA0oTPPPDM9evTI9OnT671+//33J8lX3i0IAAB8MY8uBAAAgCZ0wAEH5O9//3v69u2b3r17p3Xr1nnppZcyfPjwbLzxxtl///1LvSIAABSW0AUAAABNaI899qj33WyffvppVl999Rx77LEZMGBA3Xd0AQAAi893dAEAAAAAAFBIvqMLAAAAAACAQhK6AAAAAAAAKCTf0dUA//znP1NbW5vmzZuXehUAAAAAAIDCmTt3bioqKrLFFlss0XWErgaora2NrzYDAAAAAABomMbqLEJXA8y/k2vTTTct8SYAAAAAAADF89JLLzXKdXxHFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEJXI6iurlmm5gAAAAAAABRBs1IvsCyoqqrMRQOuyJuvvtVkMzpvuGbOuf7kJrs+AAAAAABA0QhdjeTNV9/Kay+OK/UaAAAAAAAAyw2PLgQAAAAAAKCQhC4AAAAAAAAKSegCAAAAAACgkIQuAAAAAAAACknoAgAAAAAAoJCELgAAAAAAAApJ6AIAAAAAAKCQhC4AAAAAAAAKSegCAAAAAACgkIQuAAAAAAAACknoAgAAAAAAoJCELgAAAAAAAApJ6AIAAAAAAKCQhC4AAAAAAAAKSegCAAAAAACgkIQuAAAAAAAACknoAgAAAAAAoJCELgAAAAAAAApJ6AIAAAAAAKCQhC4AAAAAAAAKSegCAAAAAACgkIQuAAAAAAAACqmsQtf111+ffv361Xtt9OjROfzww9O9e/fssssuueOOO+odr6mpyVVXXZUddtgh3bt3z7HHHpuJEycu1jUAAAAAAAAonrIJXb/5zW9yxRVX1Htt2rRpOeqoo9K5c+cMGzYsJ5xwQgYNGpRhw4bVnXPNNdfkrrvuyoUXXpi77747NTU16d+/f+bMmbPI1wAAAAAAAKB4mpV6gXfffTfnnXdenn766ayzzjr1jt17771p3rx5LrjggjRr1izrrbde3njjjdxwww054IADMmfOnNxyyy0ZOHBgdtpppyTJ5Zdfnh122CGPPPJI9t5776+8BgAAAAAAAMVU8ju6/vOf/6R58+a5//77s/nmm9c79uyzz6ZHjx5p1uz/etw222yTCRMmZOrUqRkzZkw+/fTTbLvttnXHV1hhhXTr1i3PPPPMIl0DAAAAAACAYir5HV277LJLdtlll4Uemzx5cjbccMN6r3Xo0CFJMmnSpEyePDlJsvrqqy9wzvxjX3WNVVddtUF719bWZsaMGamoqEjr1q0bdI2GmDlzZmpra5faPAAAAAAAgMZWW1ubioqKJb5OyUPXl5k1a1ZatGhR77WWLVsmSWbPnp2ZM2cmyULP+eijjxbpGg01d+7cjB49Oq1bt063bt0afJ3FNX78+LrPDQAAAAAAUFSf7zcNUdahq1WrVpkzZ0691+bHqTZt2qRVq1ZJkjlz5tT98fxz5t9l9VXXaKjmzZtn/fXXb5TauDi6dOniji4AAAAAAKDQxo4d2yjXKevQ1alTp0yZMqXea/N/7tixY+bNm1f3WufOneud07Vr10W6RkNVVFQsUShrqKX5mEQAAAAAAICm0Fg3ElU2ylWayNZbb53nnnsu1dXVda899dRT6dKlS9q3b5+NNtoobdu2zdNPP113/OOPP87LL7+crbfeepGuAQAAAAAAQDGVdeg64IADMn369JxzzjkZO3Zshg8fnttuuy0DBgxI8tmzGw8//PAMGjQof/7znzNmzJj86Ec/SqdOndKrV69FugYAAAAAAADFVNaPLmzfvn1uuummXHTRRendu3dWW221nH766endu3fdOSeeeGLmzZuXc889N7NmzcrWW2+dm2++Oc2bN1/kawAAAAAAAFA8FbW1tbWlXqJoXnrppSTJpptuWvfagJ0H5rUXxzXZzA02WzfX/2VQk10fAAAAAABgaVlYa2mIsn50IQAAAAAAAHwRoQsAAAAAAIBCEroAAAAAAAAoJKELAAAAAACAQhK6AAAAAAAAKCShCwAAAAAAgEISugAAAAAAACgkoQsAAAAAAIBCEroAAAAAAAAoJKELAAAAAACAQhK6AAAAAAAAKCShCwAAAAAAgEISugAAAAAAACgkoQsAAAAAAIBCEroAAAAAAAAoJKELAAAAAACAQhK6AAAAAAAAKCShCwAAAAAAgEISugAAAAAAACgkoQsAAAAAAIBCEroAAAAAAAAoJKELAAAAAACAQhK6AAAAAAAAKCShCwAAAAAAgEISugAAAAAAACgkoQsAAAAAAIBCEroAAAAAAAAoJKELAAAAAACAQhK6AAAAAAAAKCShCwAAAAAAgEISugAAAAAAACgkoQsAAAAAAIBCEroAAAAAAAAoJKELAAAAAACAQhK6lhHV1TXL1BwAAAAAAICv0qzUC9A4qqoqc/EPf5U3X3u7yWZ03mCNnPWrHzbZ9QEAAAAAABaH0LUMefO1tzP23xNKvQYAAAAAAMBS4dGFAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQRaOorq5ZpuYAAAAAAADlr1mpF2DZUFVVmUt+dH0mjn2nyWastf7Xc+blA5rs+gAAAAAAQLEIXTSaiWPfydj/vFHqNQAAAAAAgOWERxcCAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIVUiNA1b968XHnlldl5552zxRZbpG/fvnnhhRfqjo8ePTqHH354unfvnl122SV33HFHvffX1NTkqquuyg477JDu3bvn2GOPzcSJE5fypwAAAAAAAKAxFSJ0XXvttRk6dGguvPDCjBgxIl26dEn//v0zZcqUTJs2LUcddVQ6d+6cYcOG5YQTTsigQYMybNiwuvdfc801ueuuu3LhhRfm7rvvTk1NTfr37585c+aU8FMBAAAAAACwJAoRuv70pz9l7733zre+9a2svfbaOfPMM/PJJ5/khRdeyL333pvmzZvnggsuyHrrrZcDDjggRx55ZG644YYkyZw5c3LLLbfkxBNPzE477ZSNNtool19+eSZPnpxHHnmkxJ8MAAAAAACAhipE6Grfvn3+8pe/5K233kp1dXXuueeetGjRIhtttFGeffbZ9OjRI82aNas7f5tttsmECRMyderUjBkzJp9++mm23XbbuuMrrLBCunXrlmeeeaYUHwcAAAAAAIBG0OyrTym9c845JyeddFJ23XXXVFVVpbKyMkOGDEnnzp0zefLkbLjhhvXO79ChQ5Jk0qRJmTx5cpJk9dVXX+Cc+ccaora2NjNmzEhFRUVat27d4OssrpkzZ6a2trbea6XeodTzAQAAAACAYqmtrU1FRcUSX6cQoWvs2LFp165drr766nTs2DFDhw7NwIEDc+edd2bWrFlp0aJFvfNbtmyZJJk9e3ZmzpyZJAs956OPPmrwTnPnzs3o0aPTunXrdOvWrcHXWVzjx4+v+0zzlXqHUs8HAAAAAACK5/PtpiHKPnRNmjQpp556am677bZstdVWSZJNN900Y8eOzZAhQ9KqVavMmTOn3ntmz56dJGnTpk1atWqV5LPv6pr/x/PPWZK7kJo3b57111+/UWrj4ujSpctC7+gq5Q6lng8AAAAAABTL2LFjG+U6ZR+6/vWvf2Xu3LnZdNNN672++eab529/+1u+/vWvZ8qUKfWOzf+5Y8eOmTdvXt1rnTt3rndO165dG7xXRUVF2rRp0+D3N9TSfERgue5Q6vkAAAAAAMCSaaybaCob5SpNqFOnTkmSV155pd7rr776atZZZ51svfXWee6551JdXV137KmnnkqXLl3Svn37bLTRRmnbtm2efvrpuuMff/xxXn755Wy99dZL50MAAAAAAADQ6Mo+dG222Wb5xje+kTPOOCNPPfVUJkyYkCuuuCJPPvlkvv/97+eAAw7I9OnTc84552Ts2LEZPnx4brvttgwYMCDJZ893PPzwwzNo0KD8+c9/zpgxY/KjH/0onTp1Sq9evUr86QAAAAAAAGiosn90YWVlZa699tpcccUVOeuss/LRRx9lww03zG233ZbNN988SXLTTTfloosuSu/evbPaaqvl9NNPT+/eveuuceKJJ2bevHk599xzM2vWrGy99da5+eab07x581J9LAAAAAAAAJZQ2YeuJFlxxRVz3nnn5bzzzlvo8c022yz33HPPF76/qqoqp512Wk477bSmWhEAAAAAAIClrOwfXQgAAAAAAAALI3QBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhfLjJrqmmVqDgAAAAAA8OWalXoBaCyVVZW59LSb8ua4yU02o/O6nXL6Zf2b7PoAAAAAAMCiE7pYprw5bnJef/nNUq8BAAAAAAAsBR5dCAAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBY2kprpmmZoDAAAAAADlrlmpF4BlRWVVZS4967ZMHDe5yWastW6nnH7xkU12fQAAAAAAKBKhCxrRxHGT8/qYt0q9BgAAAAAALBc8uhAAAAAAAIBCEroAAAAAAAAoJKELAAAAAACAQhK6AAAAAAAAKCShCwAAAAAAgEISugAAAAAAACgkoQsAAAAAAIBCEroAAAAAAAAoJKELAAAAAACAQhK6AAAAAAAAKCShCwAAAAAAgEISugAAAAAAACgkoQsAAAAAAIBCEroAAAAAAAAoJKELAAAAAACAQhK6AAAAAAAAKCShCwAAAAAAgEISugAAAAAAACgkoQsAAAAAAIBCErpgGVJTXbNMzQEAAAAAgC/TrNQLAI2nsqoyl/3415k4fkqTzVirS4ecdmG/Jrs+AAAAAAAsKqELljETx0/J66+8Veo1AAAAAACgyXl0IQAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhVSY0DVixIjsueee2XTTTbPXXnvlwQcfrDv21ltvZcCAAdlyyy3zrW99K1dccUWqq6vrvf83v/lNdt1112y22Wbp06dPXn755aX9EQAAAAAAAGhEhQhdI0eOzDnnnJO+ffvmD3/4Q/bee++ccsop+ec//5m5c+fmmGOOSZLcfffdOf/88/Pb3/42V199dd3777vvvlx66aU56aSTMnz48Ky55po56qij8sEHH5TqIwEAAAAAALCEmpV6ga9SW1ubK6+8Mt/73vfSt2/fJMkPfvCDPPvss/nHP/6Rt99+O++8807uvfferLjiitlwww3z/vvv59JLL81xxx2XFi1a5Lrrrsvhhx+efffdN0ny85//PLvttluGDh2aAQMGlPLjAQAAAAAA0EBlH7rGjx+ft99+O/vss0+912+++eYkyfnnn5+NN944K664Yt2xbbbZJtOnT8/o0aOz5pprZsKECdl2223rjjdr1ixbbbVVnnnmmQaHrtra2syYMSMVFRVp3bp1g67REDNnzkxtbW2910q9Q6nnl8MOpZ5fLjsAAAAAAMCiqK2tTUVFxRJfpxChK0lmzJiRY445Ji+//HLWXHPN/OAHP8guu+ySyZMnp1OnTvXe06FDhyTJpEmT0qzZZx9x9dVXX+CcMWPGNHivuXPnZvTo0WndunW6devW4OssrvHjx2fmzJn1Xiv1DqWeXw47lHp+uewAAAAAAACLqkWLFkt8jbIPXdOnT0+SnHHGGfnhD3+YgQMH5uGHH87xxx+fW2+9NbNmzcoKK6xQ7z0tW7ZMksyePbvuX8R//pfVsmXLzJ49u8F7NW/ePOuvv36j1MbF0aVLl4XeyVPKHUo9vxx2KPX85XEHd5MBAAAAABTX2LFjG+U6DQpdDzzwQHr16tUope2rNG/ePElyzDHHpHfv3kmS//mf/8nLL7+cW2+9Na1atcqcOXPqvWd+wGrTpk1atWqVJAs9Z0ke81ZRUZE2bdo0+P0NtTQfTVeuO5R6fjnsUOr5X7RDTXVNKqsqm3z20poDAAAAAEDTaKwbJxoUuk4//fT89Kc/zV577ZX9998/m222WaMsszAdO3ZMkmy44Yb1Xl9//fXz2GOPpUePHnn11VfrHZsyZUrde+c/snDKlClZb7316p0z/9pA46isqsygn96ViROmNNmMtdbpkIHn9Wmy6wMAAAAAUBwNCl2PPvpo7rvvvowcOTL33HNPunTpkgMOOCD77rtvVltttUZdcOONN87Xvva1/Otf/8pWW21V9/qrr76azp07Z+utt86IESMyffr0tG3bNkny1FNP5Wtf+1o22mijtGjRIl26dMnTTz+dbbfdNkkyb968PPvss+nTx78sh8Y2ccKUvP7q26VeAwAAAACA5UCDnv3VqVOn/OAHP8hDDz2U3/zmN9lqq61y4403Zuedd85xxx2XRx55JPPmzWuUBVu1apX+/fvn6quvzgMPPJA333wz1157bZ544okcddRR2W233bLaaqvl5JNPzpgxY/KnP/0pgwcPztFHH133aMWjjz46t956a+67776MHTs2Z599dmbNmpUDDzywUXYEAAAAAABg6WvQHV3/bcstt8yWW26Zgw46KJdeemkee+yxPPbYY1l11VVzxBFH5Oijj05VVdUSzTj++OPTunXrXH755Xn33Xez3nrrZciQIfnmN7+ZJLnpppvy05/+NAcffHBWXHHF9OnTJ8cff3zd+w8++OB88sknueKKK/Lhhx9mk002ya233ppVVlllifYCAAAAAACgdJYodL399tsZOXJkRo4cmTfffDOdO3fOKaeckp122imPPfZYrr766owdOza/+MUvlnjRo446KkcdddRCj6299tq55ZZbvvT9xxxzTI455pgl3gMAAAAAAIDy0KDQNXTo0IwcOTLPP/98WrZsmd133z0XXXRRve/Q2nDDDTNt2rTcfffdjRK6AAAAAAAA4L81KHT9+Mc/zuabb57zzz8/e+65Z9q2bbvQ87p27ZpDDjlkiRYEAAAAAACAhWlQ6HrggQey/vrrp7q6uu77t2bNmpW5c+emXbt2deftt99+jbIkwKKqqa5JZVXlMjMHAAAAAIAv1qDQtc466+S8887Lv//97wwbNixJ8vzzz+f73/9++vXrl9NOOy2Vlf4FMLD0VVZVZtBF92TiG1OabMZaa3fIwHPcrQoAAAAAUGoNCl1XXXVV7r///px44ol1r3Xr1i0DBw7MkCFDsvLKK+f73/9+oy0JsDgmvjElr7/2TqnXAAAAAACgiTUodP3+97/PGWeckUMPPbTutZVWWilHHnlkmjVrljvuuEPoAgAAAAAAoEk16PmC06ZNy1prrbXQY+uuu24mT568REsBAAAAAADAV2lQ6Fp33XXz8MMPL/TYo48+mrXXXnuJlgIAAAAAAICv0qBHF37ve9/LmWeemQ8//DC77bZb2rdvnw8++CB/+ctf8uCDD+biiy9u7D0BAAAAAACgngaFrv322y+ffvpprrnmmjzyyCN1r6+88sr58Y9/nP3226+x9gMAAAAAAICFalDoSpK+ffumT58+GT9+fD788MOssMIKWXfddVNZ2aCnIQIAAAAAAMBiaXDoSpKKioqsu+66jbULAAAAAAAALLIGha4PPvggF110UR577LHMnDkztbW19Y5XVFTk5ZdfbpQFAQAAAAAAYGEaFLouuOCC/OUvf8lee+2VTp06eVwhAAAAAAAAS12DQtff/va3nH322TnkkEMaex8AAAAAAABYJA26Fat58+ZZa621GnsXgMKrqa5ZpuYAAAAAAJSzBt3R1bNnzzzwwAPZbrvtGnsfgEKrrKrMoEuGZuLEKU02Y621OmTgmQc12fUBAAAAAIqiQaGrW7duueKKKzJx4sRsvvnmadWqVb3jFRUVOeGEExplQYCimThxSl4fO6nUawAAAAAALPMaFLouuOCCJMkzzzyTZ555ZoHjQhcAAAAAAABNrUGha8yYMY29BwAAAAAAACyWyiW9wCeffJLXX389c+bMSXV1dWPsBAAAAAAAAF+pwaHr6aefzkEHHZQePXpkn332yWuvvZZTTz01l1xySWPuBwAAAAAAAAvVoND15JNP5phjjkmrVq0ycODA1NbWJkk22mij3HHHHbn11lsbdUkAAAAAAAD4vAaFriuuuCK77rprfv3rX+eII46oC13HHXdc+vfvn6FDhzbqkgAAAAAAAPB5DQpdo0ePzgEHHJAkqaioqHds++23z9tvv73kmwEAAAAAAMCXaFDoateuXd57772FHps0aVLatWu3REsBAAAAAADAV2lQ6Np1111z+eWX56WXXqp7raKiIpMnT851112XnXbaqbH2AwAAAAAAgIVq1pA3nXrqqfnXv/6Vgw8+OKuuumqS5JRTTsnkyZOz+uqr55RTTmnUJQEAAAAAAODzGhS6VlxxxQwdOjQjRozIU089lQ8//DDt2rVLv379sv/++6d169aNvScAAAAAAADU06DQlSQtWrTIwQcfnIMPPrgx9wEAAAAAAIBF0qDQNWLEiK88Z7/99mvIpQEAAAAAAGCRNCh0nXnmmQt9vaKiIlVVVamqqhK6AAAAAAAAaFINCl1//vOfF3htxowZefbZZ3PjjTfm6quvXuLFAAAAAAAA4Ms0KHStscYaC319gw02yNy5c3PhhRfmrrvuWqLFAAAAAAAA4MtUNvYFu3btmv/85z+NfVkAAAAAAACop1FD15w5c/K73/0u7du3b8zLAgAAAAAAwAIa9OjCXXbZJRUVFfVeq6mpybRp0zJ79uycccYZjbIcAAAAAAAAfJEGha4ePXosELqSpG3bttl5552z3XbbLfFiAAAAAAAA8GUaFLouueSSxt4DAAAAAAAAFkuDQtc777yzWOd//etfb8gYAAAAAAAA+EKN9h1dX2b06NENGQMAAAAAAABfqEGh64orrsh5552XjTfeOPvuu286duyYadOm5dFHH82DDz6YH/zgB1ljjTUae1cAAAAAAACo06DQNXLkyOy8884LfFfXnnvumfbt2+f555/PD3/4w0ZZEAAAAAAAABamsiFvevLJJ7P33nsv9NiOO+6Y5557bomWAgAAAAAAgK/SoNC18sor51//+tdCjz355JPp2LHjEi0FAAAAAAAAX6VBjy488MADc+2112bmzJnZZZddssoqq2Tq1Kl56KGH8tvf/jY//vGPG3tPAAAAAAAAqKdBoev444/PJ598kttuuy0333xzkqS2tjatW7fOj370oxx66KGNuiQAAAAAAAB8XoNCV0VFRc4888wcf/zxeeGFF/LRRx9l5ZVXTvfu3dO2bdvG3hEAAAAAAAAW0KDQNV/btm3ToUOHJEn37t0zb968RlkKAAAAAAAAvkqDQ9fIkSPzy1/+Mu+9914qKioydOjQDBkyJM2bN88vf/nLtGjRojH3BAAAAAAAgHoqG/KmUaNG5Ywzzsg222yTwYMHp6amJknSs2fP/PWvf80111zTqEsCAAAAAADA5zXojq7rrrsuhx56aM4///xUV1fXvX7AAQfkgw8+yL333puTTz65sXYEAAAAAACABTTojq7x48enZ8+eCz22+eab5913312ipQAAAAAAAOCrNCh0tW/fPq+//vpCj73++utp3779Ei0FAAAAAAAAX6VBoWvPPffMVVddlYceeihz5sxJklRUVOTf//53rrnmmuy+++6NuiQAAAAAAAB8XoO+o+vkk0/Oq6++mpNPPjmVlZ+1sn79+mXGjBnZaqutctJJJzXqkgAAAAAAAPB5DQpdLVq0yE033ZQnnngiTz31VD788MO0a9cuPXr0yLe//e1UVFQ09p4AAAAAAABQT4NC1zHHHJP+/ftn++23z/bbb9/YOwEAAAAAAMBXatB3dD3//PPu2gIAAAAAAKCkGhS6dthhh9x///2ZO3duY+8DAAAAAAAAi6RBjy5s2bJl7r///jz44INZb7310qZNm3rHKyoqcvvttzfKggAAAAAAALAwDQpdkydPzhZbbFH3c21tbb3jn/8ZAAAAAAAAGtsih65HHnkk22yzTVZYYYX8+te/bsqdAAAAAAAA4Cst8nd0nXTSSZkwYUK912688ca8//77jb0TAAAAAAAAfKVFDl2ffxxhdXV1Bg8enMmTJzf6UgAAAAAAAPBVFjl0LYzv4gIAAAAAAKBUlih0AQAAAAAAQKkIXQAAAAAAABTSEoeuioqKxtgDAAAAAAAAFkuzxTn5hBNOSIsWLeq9dtxxx6V58+b1XquoqMif/vSnJd8OAAAAAAAAvsAih67evXs35R4AAAAAAACwWBY5dF188cVNuQcAAAAAAAAsliX+ji4AAAAAAAAoBaELAAAAAACAQhK6AAAAAAAAKCShC2AZU1NTs0zNAQAAAAD4Is1KvQAAjauysjKXDfpdJk6c2mQz1lpr1Zw28MAmuz4AAAAAwKIQugCWQRMnTs3rr08q2fyamppUVjb9TcNLaw4AAAAAUJ6ELgAaXWVlZS4dPCxvvtV0d5V1XnPVnH7KAU12fQAAAACg/AldADSJN9+amtfHle6uMgAAAABg2ed5TwAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBcAyp7qmZpmaAwAAAAAsXLNSLwAAja2qsjKXXDk8E996r8lmrLXmajnzpP2b7PoAAAAAwFcTugBYJk18672MHT+51GsAAAAAAE3IowsBAAAAAAAoJKELAAAAAACAQhK6AAAAAAAAKCShCwAAAAAAgEISugAAAAAAACgkoQsAAAAAAIBCEroAAAAAAAAoJKELAAAAAACAQhK6AAAAAAAAKCShCwAAAAAAgEISugAAAAAAACgkoQsAmkB1Tc0yNQcAAAAAylGzUi8AAMuiqsrKXDxkeN58e2qTzei8xqo563/3b7LrAwAAAEC5E7oAoIm8+fbUjJ0wuSSzq2tqUlXZ9DduL605AAAAALAwQhcALIOqKivz82vuy5vvNOEdZV9fNWcf37vJrg8AAAAAX0XoAoBl1JvvTM1rJbqjDAAAAACWBs8aAgAAAAAAoJCELgAAAAAAAApJ6AIAAAAAAKCQhC4AAAAAAAAKSegCAAAAAACgkIQuAAAAAAAACknoAgAAAAAAoJCELgAAAAAAAApJ6AIAAAAAAKCQhC4AAAAAAAAKSegCAAAAAACgkIQuAAAAAAAACknoAgAAAAAAoJCELgAAAAAAAApJ6AIAAAAAAKCQhC4AAAAAAAAKSegCAAAAAACgkIQuAAAAAAAACknoAgAAAAAAoJCELgAAAAAAAApJ6AIAAAAAAKCQhC4AoElU19QsU3MAAAAAKD/NSr0AALBsqqqszEXX35c33pnaZDPW/vqqOWdA7ya7PgAAAADlTegCAJrMG+9MzWtvTC71GgAAAAAsowr16MLx48dniy22yPDhw+teGz16dA4//PB07949u+yyS+64445676mpqclVV12VHXbYId27d8+xxx6biRMnLu3VAQAAAAAAaGSFCV1z587NwIEDM2PGjLrXpk2blqOOOiqdO3fOsGHDcsIJJ2TQoEEZNmxY3TnXXHNN7rrrrlx44YW5++67U1NTk/79+2fOnDml+BgAwFLiO8IAAAAAln2FeXThkCFD0rZt23qv3XvvvWnevHkuuOCCNGvWLOutt17eeOON3HDDDTnggAMyZ86c3HLLLRk4cGB22mmnJMnll1+eHXbYIY888kj23nvvEnwSAGBpqKqszIU33Jc3JjXhd4Stvmp+/H3fEQYAAABQKoUIXc8880zuueeejBgxoi5YJcmzzz6bHj16pFmz//sY22yzTa6//vpMnTo177zzTj799NNsu+22dcdXWGGFdOvWLc8884zQBQDLuDcmTc1rb/qOMAAAAIBlVdmHro8//jinn356zj333Ky++ur1jk2ePDkbbrhhvdc6dOiQJJk0aVImT/7sX2x9/n0dOnSoO9ZQtbW1mTFjRioqKtK6deslutbimDlzZmpra+u9VuodSj2/HHYo9fxy2KHU88thh1LPt0N5zC+HHUo9vxx2KPV8AAAAAL5cbW1tKioqlvg6ZR+6zj///GyxxRbZZ599Fjg2a9astGjRot5rLVu2TJLMnj07M2fOTJKFnvPRRx8t0V5z587N6NGj07p163Tr1m2JrrU4xo8fX/e55iv1DqWeXw47lHp+OexQ6vnlsEOp59uhPOaXww6lnl8OO5R6PgAAAABf7fP9piHKOnSNGDEizz77bH7/+98v9HirVq0yZ86ceq/Nnj07SdKmTZu0atUqSTJnzpy6P55/zpL+V97NmzfP+uuv3yi1cXF06dJlof/VfCl3KPX8ctih1PPLYYdSzy+HHUo93w7lMb8cdij1/HLYodTzAQAAAPhyY8eObZTrlHXoGjZsWN5///1638uVJOedd15GjRqVTp06ZcqUKfWOzf+5Y8eOmTdvXt1rnTt3rndO165dl2i3ioqKtGnTZomu0RBL8zFM5bpDqeeXww6lnl8OO5R6fjnsUOr5diiP+eWwQ6nnl8MOpZ4PAAAAUDSN9R8ql3XoGjRoUGbNmlXvtV69euXEE0/Mvvvum5EjR+buu+9OdXV1qqqqkiRPPfVUunTpkvbt26ddu3Zp27Ztnn766brQ9fHHH+fll1/O4YcfvtQ/DwAAAAAAAI2nrENXx44dF/p6+/bt07FjxxxwwAG56aabcs4556R///558cUXc9ttt+WnP/1pks+e7Xj44Ydn0KBBWWWVVbLGGmvksssuS6dOndKrV6+l+VEAAAAAAABoZGUdur5K+/btc9NNN+Wiiy5K7969s9pqq+X0009P796968458cQTM2/evJx77rmZNWtWtt5669x8881p3rx5CTcHAJYH1TU1qaqsXGbmAAAAAJSbwoWuV155pd7Pm222We65554vPL+qqiqnnXZaTjvttKZeDQCgnqrKylxw8315Y9LUJpux9uqr5ifH9P7qEwEAAACWQYULXQAARfLGpKl5deLkUq8BAAAAsEzyjBsAAAAAAAAKSegCAAAAAACgkIQuAIBlVHVNzTI1BwAAAODzfEcXAMAyqqqyMj+99b5MmDy1yWas02nVnHdU7ya7PgAAAMCXEboAAJZhEyZPzasTJ5d6DQAAAIAm4dGFAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AADSZ6pqaZWoOAAAAUF6alXoBAACWXVWVlTn/9vsyYfLUJpuxTqdVc/4RvZvs+gAAAED5EroAAGhSEyZPzatvTS71GgAAAMAyyKMLAQBYZnl0IgAAACzb3NEFAMAyq6qyMuf9+r5MmNKEj07ssGp+2s+jEwEAAKAUhC4AAJZpE6ZMzSsenQgAAADLJI8uBAAAAAAAoJCELgAAAAAAAApJ6AIAgCZUXVOzTM0BAACAcuI7ugAAoAlVVVbmx7+5LxOmTG2yGet0WDUX9u3dZNcHAACAciV0AQBAE5swZWpeeXtyqdcAAACAZY5HFwIAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAAAAAFBIQhcAAAAAAACFJHQBAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAwDKuuqZmmZoDAAAA8zUr9QIAAEDTqqqszI9/Ozzjp0xtshldOqyaCw/bv8muDwAAAAsjdAEAwHJg/JSpeeWdyaVeAwAAABqVRxcCAAAAAABQSEIXAAAAAAAAhSR0AQAAAAAAUEhCFwAAAAAAAIUkdAEAAE2quqam5HPKYQcAAAAaX7NSLwAAACzbqiorc+69wzP+valNNqPLaqvmZwfv/6U7nP274Rn/3ntNuMNq+fmBX7wDAAAAjU/oAgAAmtz496ZmzDuTS7zDexkzqbQ7AAAA0Lg8uhAAAAAAAIBCEroAAAAAAAAoJKELAAAAAACAQhK6AAAAAAAAKCShCwAAoIlV19SUfE457AAAANDYmpV6AQAAgGVdVWVlzh4+POPee6/JZqy72mr5+f77f+kOZ40YlnHvT226Hdqvmov3O6DJrg8AAPB5QhcAAMBSMO699zJm8uTS7vD+1IyZPKmkOwAAADQmjy4EAAAAAACgkIQuAAAAAAAACknoAgAAAAAAoJCELgAAAAAAAApJ6AIAAAAAAKCQhC4AAAAAAAAKSegCAACgyVXX1CxTcwAAgPLQrNQLAAAAsOyrqqzMWb8flnHvT22yGeu2XzUX73NAk10fAAAoP0IXAAAAS8W496dmzLuTSja/uqYmVZVN/2CTpTUHAAAQugAAAFhOVFVW5qw//C7jPmjCu8pWWTUX73XgQo8JbQAA0PiELgAAAJYb4z6YmjFTSnNXWVVlZc5+qOlD2893X3hoAwCAZZHQBQAAAEvJuA+mZsx7Ht8IAACNRegCAACA5URVZWXO+ePvMn7ae002o8vKq+Winu4qAwBg6RC6AAAAYDkyftp7GTO1dHeVAQBAY/IcAQAAAGCpqa6pWabmAABQWu7oAgAAAJaaqsrK/PjRoZnQhI9PXGfl1XLhLgc12fUBACgfQhcAAACwVE2Y9l5eed/jEwEAWHIeXQgAAAAAAEAhCV0AAADAcqMcviOsHHYAAFhWeHQhAAAAsNyoqqzM+X8dmgkfTWmyGeus2CHnf/uLvyOsqrIyP3v8nrzxUdN9T9naK66Wc791SJNdHwCgXAhdAAAAwHJlwkdT8mqJvyPsjY/ey2sfvFOS2dW1NamqaPqH/CytOQDA8k3oAgAAAFiOVFVU5pIn78mbHzfdXW2dV+iQM7d1RxkA0PSELgAAAIDlzJsfT8nYaaW5owwAoDG5fxwAAAAAAIBCEroAAAAAWKpqamuWqTkAQOl4dCEAAAAAS1VlRWV++Y/fZuInTfc9YWu165BTexzWZNcHAMqD0AUAAADAUjfxkykZ96HvCQMAloxHFwIAAAAAAFBIQhcAAAAAyxXfEQYAyw6PLgQAAABguVJZUZmrnrsrb09vuu8IW6Nth5z4jT5Ndn0A4DNCFwAAAADLnbenT8n4j94u9RoAwBLy6EIAAAAAAAAKSegCAAAAAACgkIQuAAAAAFjKamprlqk5AFAqvqMLAAAAAJayyorKXPfCb/LO9HebbMbX23bMcd37LvRYTW1NKiua/r+BX1pzAFh+CV0AAAAAUALvTH83b3z8dklmV1ZU5paXfp3JnzZdaOv0tY45etN+X3hcbAOgMQhdAAAAALAcmvzpu5n4yVslm19ZUZk7X74t7346uclmdPxapxze7cgmuz4ApSd0AQAAAAAl8e6nk/P29NLFNgCKzz27AAAAAAAAFJLQBQAAAAAAQCEJXQAAAADAcqemtmaZmgOwvPIdXQAAAADAcqeyojL3jL45782Y1GQzVmuzeg75n2O+8HhNbU0qK5r+XoSlNQegFIQuAAAAAGC59N6MSXln+sSSza+sqMzwMddnahPGtlXbrJ79NxrwhcfFNqDohC4AAAAAgBKZOmNSJn/6RsnmV1ZU5oFXrs77M95pshnt23w9e3c9ocmuDyzfhC4AAAAAgOXY+zPeyZRPJ5RkdjncUVYOOwANJ3QBAAAAAFASlRWVeeTVKzNt5ltNNmPl1mum14YnfekOj702KB824Q4rtV4zO20wsMmuD8szoQsAAAAAgJKZNvOtvPfp+JLu8OHMt/L+p6+XdAegYdwnCQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAAAlUltbvUzNgaWtWakXAAAAAACA5VVFRVX+32sX56OZbzbZjBVbd852G5zVZNeHUhK6AAAAAACghD6a+WamzRhb6jWgkDy6EAAAAAAAlmMen0iRuaMLAAAAAACWYxUVVXlm7IX5ZOYbTTajXeu1s/X6P26y67P8EroAAAAAAGA598nMN/LRjFdLMru2tjoVFVXLzByWLqELAAAAAAAomYqKqrw49rxMnzmhyWa0bb1ONlv/p012fUpH6AIAAAAAAEpq+swJ+WTGKyWb766y4hK6AAAAAACA5VpFRVXGvH5uZswc32Qz2rTuko3W+1mTXX95JXQBAAAAAADLvRkzx2d6Ce8qo2EqS70AAAAAAAAANITQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIRUidH344Yf5yU9+kh133DFbbrllDjvssDz77LN1x5988snsv//+2XzzzbP77rvnD3/4Q733z549Oz/96U+z7bbbZosttsipp56aDz74YGl/DAAAAAAAABpRIULXKaeckn/+858ZPHhwhg0blv/5n//JMccck3HjxuX111/PgAEDssMOO2T48OE56KCDcvrpp+fJJ5+se//555+fxx9/PEOGDMntt9+ecePG5cQTTyzhJwIAAAAAAPhMbW31MjVnaWpW6gW+yhtvvJEnnngid911V77xjW8kSX784x/n73//e37/+9/n/fffT9euXfOjH/0oSbLeeuvl5Zdfzk033ZRtt9027777bkaMGJHrrrsuW221VZJk8ODB2X333fPPf/4zW2yxRck+GwAAAAAAQEVFVcaNOzezZo1vshmtWnXJuuv+rMmuXyplH7pWXnnl3HDDDdl0003rXquoqEhFRUU+/vjjPPvss9ltt93qvWebbbbJRRddlNra2jz33HN1r83XpUuXdOzYMc8884zQBQAAAAAAlNysWeMzY8aYks2vra1ORUVV4eaUfehaYYUV8u1vf7veaw8//HDeeOONnH322bnvvvvSqVOnesc7dOiQmTNnZtq0aXn33Xez8sorp2XLlgucM3ny5AbvVVtbmxkzZqSioiKtW7du8HUW18yZM1NbW1vvtVLvUOr55bBDqeeXww6lnl8OO5R6vh3KY3457FDq+eWwQ6nnl8MOpZ5fDjuUer4dymN+OexQ6vnlsEOp55fDDqWeb4fymF8OO5R6fjnsUOr55bBDqeeXww6lnm+H8phfDjuUen457FDq+eWwQ6nn//cO70w4L7NnTWiy2S1brZOvr/PTuh0qKiqW+JplH7o+7/nnn89ZZ52VXr16ZaeddsqsWbPSokWLeufM/3nOnDmZOXPmAseTpGXLlpk9e3aD95g7d25Gjx6d1q1bp1u3bg2+zuIaP358Zs6cWe+1Uu9Q6vnlsEOp55fDDqWeXw47lHq+HcpjfjnsUOr55bBDqeeXww6lnl8OO5R6vh3KY3457FDq+eWwQ6nnl8MOpZ5vh/KYXw47lHp+OexQ6vnlsEOp55fDDqWeb4fymF8OO5R6fjnsUOr55bBDqef/9w6zZ03I7JmvLJUd5s6du9B+s7gKFbr+9Kc/ZeDAgdlyyy0zaNCgJJ8Fqzlz5tQ7b/7PrVu3TqtWrRY4niSzZ89eokLavHnzrL/++o1SGxdHly5dFlpaS7lDqeeXww6lnl8OO5R6fjnsUOr5diiP+eWwQ6nnl8MOpZ5fDjuUen457FDq+XYoj/nlsEOp55fDDqWeXw47lHq+HcpjfjnsUOr55bBDqeeXww6lnl8OO5R6vh3KY3457FDq+eWwQ6nnl8MOpZ5fqh1ee+21RrlWYULXnXfemYsuuii77757fvGLX9RVvtVXXz1Tpkypd+6UKVPSpk2btGvXLp06dcqHH36YOXPm1CuDU6ZMSceOHRu8T0VFRdq0adPg9zfU0rx9sVx3KPX8ctih1PPLYYdSzy+HHUo93w7lMb8cdij1/HLYodTzy2GHUs8vhx1KPd8O5TG/HHYo9fxy2KHU88thh1LPt0N5zC+HHUo9vxx2KPX8ctih1PPLYYdSz7dDecwvhx1KPb8cdij1/HLYodTz5+/QWHGtslGu0sTuuuuuXHjhhenbt28GDx5cL1httdVW+cc//lHv/KeeeipbbrllKisr841vfCM1NTV57rnn6o6PHz8+7777brbeeuul9hkAAAAAAABoXGUfusaPH5+f//zn6dmzZwYMGJCpU6fmvffey3vvvZdPPvkk/fr1y4svvphBgwbl9ddfzy233JKHHnoo/fv3T5J07Ngxe+21V84999w8/fTTefHFF3PKKaekR48e6d69e2k/HAAAAAAAAA1W9o8ufPjhhzN37tz88Y9/zB//+Md6x3r37p1LLrkk11xzTS677LLcfvvtWXPNNXPZZZdl2223rTvvwgsvzM9//vP88Ic/TJLsuOOOOffcc5fq5wAAAAAAAKBxlX3oOu6443Lcccd96Tk77rhjdtxxxy883qZNm/zsZz/Lz372s8ZeDwAAAAAAgBIp+0cXAgAAAAAAwMIIXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AUAAAAAAEAhCV0AAAAAAAAUktAFAAAAAABAIQldAAAAAAAAFJLQBQAAAAAAQCEJXQAAAAAAABSS0AXw/9k777CokuzvH0wTdtLu7P5mdmdm80yDGJCoIiAZCQoiQUVQBFEQVFDEgAkDiIJZMWHAhAETKmDAhCKKYsKAIkEEBERApYHu7/sH763tFnUUusHZrc/zzON0c/tW3boVTp1UHA6Hw+FwOBwOh8PhcDgcDofD+U3CDV0cDofD4XA4HA6Hw+FwOBwOh8PhcDic3yTc0MXhcDgcDofD4XA4HA6Hw+FwOBwOh8P5TcINXRwOh8PhcDgcDofD4XA4HA6Hw+FwOJzfJNzQxeFwOBwOh8PhcDgcDofD4XA4HA6Hw/lNwg1dHA6Hw+FwOBwOh8PhcDgcDofD4XA4nN8k3NDF4XA4HA6Hw+FwOBwOh8PhcDgcDofD+U3CDV0cDofD4XA4HA6Hw+FwOBwOh8PhcDic3yTc0MXhcDgcDofD4XA4HA6Hw+FwOBwOh8P5TcINXRwOh8PhcDgcDofD4XA4HA6Hw+FwOJzfJNzQxeFwOBwOh8PhcDgcDofD4XA4HA6Hw/lNwg1dHA6Hw+FwOBwOh8PhcDgcDofD4XA4nN8k3NDF4XA4HA6Hw+FwOBwOh8PhcDgcDofD+U3CDV0cDofD4XA4HA6Hw+FwOBwOh8PhcDic3yTc0MXhcDgcDofD4XA4HA6Hw+FwOBwOh8P5TcINXRwOh8PhcDgcDofD4XA4HA6Hw+FwOJzfJNzQxeFwOBwOh8PhcDgcDofD4XA4HA6Hw/lNwg1dHA6Hw+FwOBwOh8PhcDgcDofD4XA4nN8k3NDF4XA4HA6Hw+FwOBwOh8PhcDgcDofD+U3CDV0cDofD4XA4HA6Hw+FwOBwOh8PhcDic3yTc0MXhcDgcDofD4XA4HA6Hw+FwOBwOh8P5TcINXRwOh8PhcDgcDofD4XA4HA6Hw+FwOJzfJNzQxeFwOBwOh8PhcDgcDofD4XA4HA6Hw/lNwg1dHA6Hw+FwOBwOh8PhcDgcDofD4XA4nN8k3NDF4XA4HA6Hw+FwOBwOh8PhcDgcDofD+U3yP2PokkqltGzZMjIwMCANDQ3y9vamgoKCtq4Wh8PhcDgcDofD4XA4HA6Hw+FwOBwOp5n8zxi6Vq1aRdu3b6ewsDDauXMnSaVS8vLyorq6urauGofD4XA4HA6Hw+FwOBwOh8PhcDgcDqcZ/E8Yuurq6mjjxo0UEBBAffv2JVVVVYqOjqbi4mJKTk5u6+pxOBwOh8PhcDgcDofD4XA4HA6Hw+FwmsH/hKHrzp079OLFC+rVqxf77quvvqLOnTtTRkZGG9aMw+FwOBwOh8PhcDgcDofD4XA4HA6H01xUAKCtK6FskpOTyd/fn7KysujTTz9l348bN45qa2spJibmg+6XmZlJAKhjx45ERKSiokKVZc+poV6i0HrL0qFje/rmj1/T216XiooKVZZXUUN9gxLr0IG++farN9ahsfxqkjQor/z2HTrQN99++c42eF5RrfT38PUf3lyHxvJrqEGJbdChQwf6+g9fvLsNntVQQ4MS26BDe/r692+uQ1uXz+pQ+UL5dfjmd29vg8oX1CBRYvnt314+q8PzVmiDr9+nDlIl1qHdW+ugoqJClVUvSKLE8tt3aEfffPXuNqisUn4bvK0OjeW/VHpf/Oarz9/dBtUvld4Xv/nyzXVo6/Jl61CvxPfQsf272+BZtfL7we9/pQ2e1Sj/Pfz+i3e0QU0rtMFbyv+46vCCGqRKnJPataPff/H2OenZixdUL1Fe+R3bt6Pf/+7d83Jb1oGVr8R30LHdr7dBxcsX1KDENujQvh394fO3t0HFS+X3w7eVL18HJY7Hdu3f2QbPXr1Q+rrw+89+ZSy8ekH1SmyDju3eow61ypeZf//pO95DrfL7wdvKF+pQ2Qp1+OYdbVApboXyP/mVPYO4RulzwtefvH3/WlVXo/Q2+KrTu/evVXU1JFFiHdq/ow4qKipUXVdDEiixfJX29OWvtEFNfQ1JpErUJ7XrQF90fHsbvKivVnob/K7ju/VZL+qrSQrltUE7lQ6/WoeX9VUkVWI7tFNpT593fLte8VV9ldLb4LO3lC/Uobb+udLr8GnHN+t3VVRUSFxfqfTyP+n4zTvbQFxfSVBiHVTeUQcVFRWqq3+m9PI7dfz9O9ugvuEZQVqvvDq060gdO7y5DioqKtTQ8IwAJZav0pE6vKV8oQ6SBuW/h/b/vw719fWkoqJCmpqaLbvn/4Kh68CBAxQcHEzZ2dnUrt1/gtiCg4OptLSUNm3a9EH3u3r1qpyhi8PhcDgcDofD4XA4HA6Hw+FwOBwOh/P+CIauHj16tOg+HRRUn48aIYqrrq5OLqJLLBbTZ5999sH3a2mjczgcDofD4XA4HA6Hw+FwOBwOh8PhcFrO/8QZXX/+85+JiKi0tFTu+9LSUvruu+/aokocDofD4XA4HA6Hw+FwOBwOh8PhcDicFvI/YehSVVWlL774gtLT09l3VVVVdPv2bdLR0WnDmnE4HA6Hw+FwOBwOh8PhcDgcDofD4XCay/9E6sJOnTqRm5sbLVq0iP7whz/QDz/8QJGRkfT999+ThYVFW1ePw+FwOBwOh8PhcDgcDofD4XA4HA6H0wz+JwxdREQBAQHU0NBA06dPp9raWtLR0aENGzZQx44d27pqHA6Hw+FwOBwOh8PhcDgcDofD4XA4nGagAgBtXQkOh8PhcDgcDofD4XA4HA6Hw+FwOBwO50P5nziji8PhcDgcDofD4XA4HA6Hw+FwOBwOh/PfBzd0cTgcDofD4XA4HA6Hw+FwOBwOh8PhcH6TcEMXh8PhcDgcDofD4XA4HA6Hw+FwOBwO5zcJN3RxOBwOh8PhcDgcDofD4XA4HA6Hw+FwfpNwQxeHw+FwOBwOh8PhcDgcDofD4XA4HA7nNwk3dHE4HA6Hw+FwOBwOh8PhcDgcDofD4XB+k3BDF4fD4XA4HA6Hw+FwOBwOh8PhcDgcDuc3CTd0cTi/AoC2rgKHw+FwOBwOh8PhcDgcDofD4XA4nDfADV2c90YqlbZ1FdqE8vJyIvrffP6Pwcj3v9juHA6Hw+Fw3o/XZRUuN3A4HI7y+G+bY588eUIFBQUKv+/HsI/mcIR++N82bn+r8Pfw22fWrFnk6enZ1tVQKG3VLw8ePEjXr19X+H25oesj5mMTjtq1a+wuT548IaKPd5JWZL0OHz5Mtra2dOvWLWrXrt1H+8zKQkVFRe5zW/RJod/dunWL6urqWr381xHa4GMbn6+jyL76sT/rx4Zse/G2+20jlUrZO6ysrGzbyrQBr893EomkLavTIpSxfv83j++SkpK2rsIHc/nyZSoqKmJyA4cjAOA3I7+1BOHZysrK2rgmnNeR7YO/dYQ5trS0lIg+fH392Nrh1q1bNHz4cCovL6fs7GzKzs5u8T0BsH200E7/q7ypf3xsfaAtEdri2bNnCr93RUUFJSYmklgs5rLRR4LwHo4fP64UA/v7IvS71tav/dbHvlgspr/85S/0+PFjCgwMbPZ9Xm+Htm6XttD1P3jwgNatW0cREREKWXdl4bPdR8jbNmJt3fmJiE6ePEn9+vWjkpKSj3KxlEqlrF4PHjygnJwcevDgQbPv9+WXX9LPP/9MwcHBdPv27f9JY1dMTAxFR0cTUVPDV2tx8uRJGjNmDGv7thgLQpm1tbVERPTq1atWr8OHIIyD3bt3szHQnHaTSqVy7/3Fixdyf/8Y5iWBN9WlNcerUL5se6moqLRKG7X0OZ88eUKFhYV0//59BdWobWlpm1dUVBBR4zhSUVGh8+fPk6+vL7169eqj6vPKRBj7AGjdunWUkZFBJ06coKNHj7Z11d6L18eEMmSWtloTBd7UFxXRP48dO0aurq6Un5/f4nspG0GZePnyZXJzc6NLly79z4zR1/ktPPe71iplGqNVVFTYeBX+/S2014eioqJCycnJNGrUKMrJyWnVsmXb82PcK7X1+1ZRUaGXL1+2aR0USWJiItnZ2VF9ff0Hra+y+wqpVPpRODF27tyZ/vrXv5K1tTU5ODhQfX19i+4n+4xHjx6lyMhIhSvxFEFr7U+E/pGXl0ePHj2ip0+ftrr81Nbj/12oqKjQkSNHyNXVlYqKihR674qKCtq6dSvt3r2bkpKS6MyZMwq9vzJR1jryJl1ra65ZUqmUCgsLyd/fn27dutWkLq2FiooKnT59mnbu3Kn0tamhoeG/JrLwk08+oaFDh5K7uzvduHGDJkyY8MH3kF0jysvL6eXLl22+pyRqfV3/v/71L/Lx8aF27drRggUL6Pbt2wq7dweF3YmjEIQN+8WLF+no0aP0pz/9iXr27Ena2tpM4dSWg+Cvf/0rqaqq0pUrV8ja2pokEgm1b9++zeojCwA2IKOjo+nkyZNUWlpKlpaW5OXlRX/9618/+J5GRkbUqVMnWrt2LU2YMIGio6Opc+fOckJbW5GRkUEXL16k69evU58+fahLly6kpaWllLLS09OpuLiYvv/+e6Xc/9cwMDCg9u3b0+rVq2nChAltIhyrqKhQamoq7dq1i4qLi8nQ0JBGjBhB33zzTavW5UOQSCQUHR1NlpaWNHPmzA9uN9l+vmnTJrp58yZlZGSQubk5aWpqkrW19UexKBP95x1lZGRQeno6qaio0KBBg+i7775rlfEqq2w9d+4cFRQU0O9//3vy9/enr7/+WmHl1NfXU8eOHenRo0dUU1NDUqmUunXr1qLnO378OC1ZsoQqKirIxsaGAgMD6dNPP/1o3u27ENr9/v379OTJE8rLyyNTU1P64x//SJ06dWrWPbds2UJXr14lX19f+vnnn4mI6Ny5c9SpUyf67LPPPurNsqIQxoxUKqWcnBw6fvw4LV26lH7++Wf64osv6JtvvqFevXq1dTXfiuyYP3ToEN27d4/N22ZmZvTZZ5+1uIyEhAS6desWlZSU0N/+9jeaMGFCq8pDQt+/ceMG3b17lzp16kT9+/dv8bgtLi6mI0eO0MiRI+m7775TUG2VhzDvXrlyhSZOnEj29vatVrbwDm7dukX379+nFy9ekLGxMf3lL39ptbLLy8tJIpFQQ0NDi+a91kB2XB48eJDu379PpaWl9M9//pNtdBWJ0EZXr16lCxcu0MOHD6lLly5kZWVF33//vULXOKGsmpoaqquro06dOrH/WnPP8PDhQzp06BANHTqU/v3vf7dKmcKzV1dXU7t27UgikShU7mlufe7cucMU63379qW//e1v9Omnn7ZJnbZs2ULp6emUnZ1N3bt3J2trazI1NW3zvWRL0NTUpO+//54OHTpEAwcOfK/fyO7VY2Nj6fr163T//n2ytramnj17kqampjKr/Fb+8pe/kK2tLV24cIG++OIL+v3vf9/se8mO9zNnztCBAwfowoUL1K5dO/L09CSRSKSoarcIYZxcv36dRbGZmJjQzz//TH/+858VVobQFsuWLaMjR45QTU0N+fv7k4uLi1w9FMlvbX0sKSmho0eP0ogRI+iPf/yjQu/9/fff0z/+8Q/atGkTFRYWUkREBBHRR6HLep07d+5QWVkZtWvXjjp37kzffPONwuspe7/CwkISi8X0ySeftIrcJtCuXTv68ccfadiwYRQbG0s6Ojr07bfftlr5svuH4OBgmjhxIn3++edKKSs3N5f+8Y9/UIcOjWaH8+fPU0JCAn3++eeko6NDdnZ2SilXmQCg3/3udzRgwACSSqW0efNmpid+398LfXDVqlV0+vRpqqyspNGjR1Pfvn1btP60lNbU9Qtj0dbWllRUVGjbtm0UHh5OISEh1Llz5xbf/+Oa3TikoqJCx48fp5EjR9KjR48oNjaWFi1aRIcOHWJ/by0l25s8rP7973/Tn/70J4qLiyMi+miMXET/8dDcuHEjxcfH08yZMyk6OpoGDx7cLCOX4G3Qq1cvGjlyJP35z3+mCRMmfBSRXcnJyTR27FjKz8+nv//97xQTE0OzZs2i3NzcFt33TX1LS0uLiouLmSeasp/79ait+vp66tChA7m4uFB2drZSwvrfhqwn8OnTpykgIIA0NDTIwMCA1NTUqGPHjk3q/bEgLEyBgYGUnZ3drMhGYRFevHgxrVu3jrp06UJ+fn508uRJWrx48UeV2kpFRYWSkpJo5MiRlJycTNu3bydHR0cqLCxslfEqeFH7+PhQeXk5/eEPf6Djx4+Tg4MDPX36lIia760VHx9Py5YtIyKijh07UmJiInl6etLo0aPJz8+Phg4d2uzUB6dPn6aJEyfS0KFDafHixTRixAj67LPPPqp3+zYEQT05OZl8fX0pOjqa4uPjqV+/frRly5Zme6d16NCBLly4QFu3bqU7d+6w7wUF2X+LR9q7EMZ+VFQUBQUF0ZMnT0gikVB2djZduXKFVq1aRadOnWrjWr4dof6RkZEUERFBd+7coeLiYpo0aRLNnj2bCgsLW3T/yMhIioqKIhUVFfrXv/5F69evp4CAgFaL9BX6/rFjx2j48OEUExNDwcHBNH36dGpoaGj2fSsqKsjY2JjS09PpH//4B33yyScKrLVyePnyJUVFRVF0dDTl5ua26rgU5p8RI0ZQQkICbd68mW7cuNGid/A+CO//5MmT5O3tTcOGDSMHBwcKCQmhixcvKrXsliA7LhcuXEg1NTX0ySefUHR0NPn6+io8taDwfsaMGUPZ2dn0zTffUHh4OE2bNo0eP36skDKI/vM+Tp06RaNHj6ZBgwbR0KFDaebMma2aSjM3N5dGjRpFt2/fZk4aykbWEczX15ccHR3JysqKIiMj5dbP1kSQB319fWn9+vV08uRJGjBgAMXExFB1dXWr10eQobt3705hYWGUmppKa9euZemBfgu8Pq9KpVL65ptv6Mcff6TU1NT3+r2sB/vSpUspJiaGfvjhB+ratSsdOHCAIiMj3+teikZ4tq+//ppCQ0Ope/fuNHjw4GZHYAnjPSIigqZPn07ffvstGRkZ0YkTJ2jTpk0K9VhvCcI48fPzo6SkJCouLqZRo0bRwoUL2b5FEWUQNb7vHTt20NSpUykiIoL69etHUqmUnj17pnDd1m9tfbx79y6ZmprS7du3SVVVVaHGOKlUSl988QWZm5vTkydP6Pvvv6eKigqqq6trc13W60RFRdGkSZMoNDSUFi1aRP369aO8vDyFrp+yBoYVK1aQn58fjRw5kgYMGEDTp09n0VWK5nWdqpAG3sDAgMRiMdPftVZ6eBUVFbp58ybFx8eTiYkJOTk5KaUv7N+/n8aPH0/Hjh0jokbDv7e3N9XW1lJaWhqtW7eO1q9fr/BylYXQRioqKmxsDRw4kEaMGEHXr19/r8gu2XVw+fLltHnzZtLX16d///vfNG3aNNq9e3erHZXwpnfemrp+2bFtY2NDgwcPpvr6egoPD1fMOgnOR4FUKgUAFBcXY/jw4di1axcA4N69e/Dw8ICrqysOHDjQ5HplcP78ebnPWVlZqK6uZp/z8/NhZGSEhIQEpdXhfdm/fz+qqqrY59raWowdOxbr169vcu2BAwdYu/4aQvuKxWL2XVpaGtzd3WFhYYFbt24BACQSSUuq3yzy8/Nhbm6OnTt3srpqaWlh3bp1KCwsRGFhYYvLqKiokPscGhqK/v37y/UDZSP0Q6GNb9y4AQ0NDezfv1/pZWdnZ8t9fvnyJXx8fBAVFcW+E/rI7du3ce/ePaXX6dd425xw584d9O3bF/Hx8e+87m1kZWXB3NwcmZmZAICrV6+iW7duSElJwfXr1z+KZweAkpISjB49GgkJCairq0NmZiaGDBmCnj17oqCgAIByx2tBQQEsLCwQFxcHAHj8+DH09fURFRWFvLw8vHr1CsCHt39VVRXGjRsHS0tLxMbGorCwEMbGxtixYweysrJw5swZ2NrawsbGBmVlZR9URl1dHSZPnoxVq1YBAGpqarBr1y64ublBV1cX0dHRH1TXtiAzMxOampqsfxcXF0MkEmHXrl2orq6GVCpt1nq5b98+6OvrY+rUqSgtLcXWrVvh6OiInJwcuXXhv5l9+/ZBV1cX4eHh0NHRwe7du+Hv7w81NTU4OTnB29sbp06dautqvpXjx4/DyMgI165dY30gJSUF6urqmDdvXrPvm5aWBmNjYzYnHj9+HBoaGjh69GiTtUOZnD17FhoaGti1axeqqqoQFxcHkUiEWbNmtUhGPHfuHEQiEcLCwlBeXq7AGisHqVSKe/fuwdPTE3369MHdu3eVWpYsOTk5MDIyws6dOyGVSlFZWYmXL18CgNLb7uzZs+jevTs2btyIiooKrF+/HiKRCIcOHfqo56jU1FQYGxvj6tWrAICkpCRoaGggMTFR4e8uNzcXffv2ZetydXU1tLW1ERMTgydPnihUpk1NTUX37t2xevVq5ObmIiwsDCKRCImJiWhoaFBYOe8iJycHoaGhUFNTY88skUiUumcE/vPsa9euxcOHDxEZGQmRSIRTp06hvr5eqWW/iaysLOjo6DC5oLy8HCKRCNu2bUNlZWWrtIlAdnY2LCwskJ6eDqBRZhFk6GvXriE/P79V6qEorl27Jvf5xo0b6N69O44ePfre9ygoKEBwcDBSU1PZd+fOnYOnpydGjhzJZHZlI9sHZPtpcXEx3NzcoK+v3+w1PSMjA0ZGRsjKymLfJScno3///ggODlbqOvW+3LlzB/r6+ti9ezeAxjbo3LkzNm/ejNLSUoXNj6WlpXBzc8OZM2cANM5T69evh42NDfr06YOUlBSFlCPLb2l9lEgkmDZtGkQiEdatW4fa2lqFl3Hx4kUkJiZiypQpsLOzw+rVq1k7tIUu63ViY2PRs2dPXLx4EQCwfPlyiEQipKWlsXoqcs5etWoVevXqxeagqVOnokePHrh165ZC+0d4eLjc+h8XF4cLFy7g2bNn7LsRI0Zg2LBhCivzfYmKioKGhgZ0dXXZOqTovpCRkQEXFxe4ublh7969mDBhAnbs2AGgUZ85bdo02NraYu3atQotVxnIts3hw4cRGRmJgwcPQiwWQywWIy4uDiYmJhg/fvx73a+4uBgzZszApUuX2HdLly6FSCTCmjVrmuhiFY3seGoLXb9QfklJCXJyctj3R44cgaurK4YNG8b07c2FR3R9JAgpt1atWkUSiYR69+5NREQ///wzhYSE0CeffELbt2+nw4cPs+uVwerVqyk0NJR2795NREQnTpwgT09PGjx4MJ06dYoKCgrop59+Ii0tLbpx4wYRtV3O4/Xr19PBgwflQm3FYjFdu3ZNzhIukUhIIpHQ5cuX6eTJk1RfX//OOkMmBdrixYspOjqaioqKqFevXuTn50fff/99m0Z21dXV0e9+9ztycXGhR48ekZGREZmbm5ObmxstWrSITpw40aL7b968mXx9fSkhIYGdx+Ti4kIdO3Zk71wZzyx7z0uXLpGnpyf179+fYmJiqLi4mLp06UJeXl4UHx+vVC/I2NhYmjdvnpzX56tXr+jevXv0pz/9iYj+c6B0fX09bdmyhWJiYuRyD7cFwpywZcsWloauvr6eRCIROTo60rp166ioqOhX547X321dXR19+umn1KNHDzpy5AiNGDGCJk2aREZGRrRkyRI6ffq00p7pfcnOzqaZM2dSZWUlaWlpUceOHalHjx4UEhJC//jHP8jJyUnpkV3CWHF1daXi4mIaPHgwmZiY0JgxY2jjxo20dOlSIvrwufvLL7+koKAg0tXVpYMHD1JERASJRCJycHCgbt26kYGBAa1bt44kEglNnjz5g8oAQI8ePaJHjx7RlStXyM3NjXbu3ElffvklDRs2jNasWUPXr1//oPq2Ng8ePKC+ffuSk5MT5eXlkaurKzk7O5ORkRHNmzePSkpKPqjNhUgMOzs7Gj9+PKWmplJMTAxdvnyZbt68SR4eHjR48GAKCAigLVu20LFjxxSeT/9j4f79+2RoaEjPnz8nMzMzGjRoEIWGhpKJiQllZ2fT48ePae3atXT+/Pm2rioRNZ27CgoK6Oeff6bu3buzv5uZmVFYWBht27aNrl692qxyioqK6P/+7/+oR48elJKSQhMnTqTJkyeTvr4+RUREMPlJmUgkEkpKSqJhw4aRs7Mz1dfX0+HDh6lv37504MABmjFjRrM9Q/X19WnDhg0UFxdHBw4coKqqKgXXvmUI62xVVRU9e/aMnj17Rj///DPNmjWLvvvuO/L19VXK4d6RkZF08uRJue9yc3OZt7SKigp9/fXX9Nlnn1FBQQHNmjVLKWckSSQSAkCJiYk0aNAgGjFiBNXW1tKuXbvI3d2d1NTUKCEh4aM492bixIl09uxZIvrPe3v8+DH9+OOPpKGhQcnJyTR58mSaPHky6enp0eLFi5nnryKoqqqiP/3pTyzq2dramqysrMjd3Z3Cw8PpwIEDLS5DOGNo9+7d5OHhQaNHj6avv/6aRROoqanRoUOHlPI+Xpc5//Wvf5G/vz8NGDCAwsLCKDk5WenRZA0NDbR3715yd3cnb29v+uyzzyglJYWGDx9OP/74I9uTKEs+3rx5Mx05ckTuu4KCAtLT02NywcCBA8nZ2ZksLCxozpw59PDhw1ZLzVxdXU0dOnQgXV1dSklJIU9PTwoODiYzMzNavHgxxcfHt0o9FMHRo0fJ29ubXFxc6MyZM2xvZm1tTVeuXKH6+vom6/DYsWNp5cqV7HNKSgqZmZlRSkqKXN/U19cnd3d3unbtmlLm79cR9vrnzp2jKVOmkL29PU2ZMoV27dpF3333HUVGRtK///1v8vLyoszMTNq/fz9dvnz5ve8vnFv2xz/+ka3F5ubm5OvrS4cOHaLY2Ng2i3gUqKiooH/+8580aNAgys3NJVNTUxowYADZ29vTnDlzKCsrq1n3fX2s19bW0t27d6moqIj279/PIsg0NTVJR0eH5syZozA5Qyj7yJEjH+36KNRROPO7Xbt2NHfuXHJwcKDly5fTiRMnWhzZI5SRl5dH9+7do59++omsra1p8uTJJBKJ6MiRIxQbG8siu9oKAFRXV0eZmZnk6+tLenp6dOrUKdqwYQOFh4fTl19+SZGRkS0+vwgymThevnxJGRkZFBwcTEZGRnT8+HFKSkqi0NBQev78eZP1pLncuXOHduzYwaKlqqqqKCEhgYYPH05TpkyhLVu2EFHjHAmg1fUpEyZMoHHjxlHHjh1p2bJlLPpckWu1trY2TZ06laRSKe3fv5/u3bvH9mQ//fQT+fj4ULdu3ejAgQO0YcMGhZWraCATCRgREUEzZsyg06dP06RJk2jhwoVUXV1NTk5O5OnpSTdv3qSgoKB33i85OZlF+cr264CAAPL19aUlS5bQ7t272XnhikY2qmznzp0UFBRErq6urabrF9Zfwc4wdOhQGjlyJBUVFVG/fv3I3d2dRXa15GxLbuj6iHj58iUlJibSpUuX6N69e+x7VVVVmjJlCv3ud7+j1atXK/UgeAsLC/r3v/9Nu3fvpv3795OxsTFFRkbSL7/8QiEhITRp0iTav38/WVhY0M6dO+n69ettdo6Ll5cXxcTEUPv27SkzM5PKy8vpq6++IkNDQ7p27RoTINu3b0/t27enb7/9lhoaGqhjx45vrbMw8I4dO0ZeXl6UlZVFGzZsoLFjx9LVq1dJV1eXGbuCg4Pp+vXrrS4glJeXU0FBAV27do28vLyYQvfTTz+lqqqqDw7Lf31TIuQpnjZtGvn6+tKaNWvo559/pq+++op27txJRKTwZ25oaGD3TE5Opq+//pqSk5Opc+fOlJKSQv3796dNmzZR+/bt6csvv2QpFZRhtLC2tqbZs2fTl19+SWVlZURE9Ic//IH+9re/0ZUrV6impoYdat6xY0dq164d1dTUUIcOHdpkLMguPmKxmG7dukWbNm0ib29vWrBgAZWXl5OpqSn99a9/ZSH5bxOgZfNW37p1i+rq6ujFixf05MkT2r17N82YMYMmTpxIbm5u1LFjR6qtraX8/HzlP+SvcPv2bSopKaHs7Gy5s3e6du1KU6dOpZ9//pnMzMzo8ePHCuu7QrsLZ8OIxWL63e9+R2fPniVXV1cyMjKiWbNmUceOHSk/P79ZxhAAJJFI6KeffiJnZ2dSVVWlzMxMKiwsZCnFGhoa6Pvvv6cxY8ZQQUHBBxmBO3XqREOHDqWUlBTy8vKi77//nsaPH0+rVq0iKysr6ty5M3311VcfXO/W5O7du1RaWkplZWU0fPhwMjAwoDlz5tBnn31GJ0+epOTk5A+6X4cOHejIkSNkbGxMlpaWNGnSJEpOTqa0tDTq27cvRUdHk4GBAZWWllJsbCyFhoZ+VCl8m4vsJlCgtraWcnJyqLKykikFfv/735OlpSXV19dTXl4eZWZm0qZNm9rc2CW7CTl9+jSVlJRQdXU15eXlUVVVldzcrKGhQV988QWVl5c3q6z27dvT7373O9q7dy8FBwfT5MmTydXVlcRiMT169KhVDEMSiYQyMzPZ57Vr19LPP/9MERER5OXlRbt376axY8fStWvXmnV/fX19WrduHUVGRtK+ffs+GmMXZFISBQQEkIODA3l4eNC8efPop59+oqioKPrqq69o5MiRCleWVlVV0Q8//MDqQdT4HiorK5ukeZJIJJSSkkKPHj1SWPmyyjEVFRV69OgR9ejRg8RiMTk7O1PPnj1p6tSp9OjRI4qMjGxzA3xVVRWVlZXRhAkT6NKlS2wM1tXV0VdffUXHjh1jRi5XV1dqaGiga9euNXtcCsjKRDU1NVRSUkLnzp0jDw8P6tu3L82aNYs+/fRTKi8vb7axW5Z27dpRp06dqKysjHr16kVlZWXUv39/6t27NwUFBbH0PIoeQ8JYyMzMpG3bttH06dNp79691KlTJ5oxYwY5ODhQQEAAHT9+XKlp7yUSCeXm5lLPnj3p5cuX5OTkRHp6ehQSEkI3b96ksLAwKisrU8oZPKWlpXThwgVSU1OT+9uDBw/oyZMnVFRURMOHDydDQ0OaM2cOff7553Tp0iU6fvy4QuvyJgQFlbA3W758OYWEhFBwcDANHTqUiBpTUT9//lzpdWkur++xtLW1KTIykj777DOaPXs2eXt7U3JyMv3zn/+kY8eONTm8vqamhkxMTMjb25t9Z25uToMHD6aXL1+y9KHCnsTIyIi+/fZbunv3rtKfTTgqIiAggL755hvy8PCgvLw8CgsLo6ysLPr+++8pIiKCfv75Z3J3d6ewsDD6v//7vzfe60170VevXlFpaSm9evWK2rdvz2QoMzMz+v777+nMmTO0a9cuKi0tVepzyiK7bhE1nk9UWFhIeXl5NHLkSKZP+Oqrr+jhw4fNSk8tq0B9/vw5VVdX008//USOjo4UHh5OM2fOpL59+1JwcDDNmTOHevfuTT///LNCzk2Vfc68vLyPcn2UNbCOHz+exo8fz1KELViwgCwtLWnatGmUkpLSImOXkJZyyJAh5OnpSc7Ozky/EhoaSqqqqnTkyBFauXKlQpykW1LP9u3bU3l5Of3xj3+kU6dOUWBgIE2aNIns7e3pzp07lJSU1CK5QLZPCo4H2dnZ1KVLF7p8+TJNmjSJgoKCyMHBgW7dukVRUVEKmZf/+c9/0sqVK6mqqooGDRpEX375Je3Zs4eWLVtGf/jDHyg6Opo8PDzo1KlTJJFI6P79+y0u823IGj7v3LlDycnJJJFIaPjw4eTp6Um3bt1ijuWKkhcEp/Bu3bpRUFAQ1dfXU05Ojlx6yJ9++olGjx5NmpqatGnTJmb8+9gQ+s+GDRvo0KFDtH79ejp06BC5u7vTrl27aPXq1Uz+GTFiBJ04cYIdOSGL0K7Gxsbk6OhIZWVllJubS/X19eyagIAA8vPzo6ioKDpz5ozCn0VW17ds2TK6ePEijR49mtTU1FpN1y+sv+PHjycDAwOaPn063b17l8LCwqiwsJAZuwDQ1KlTmy8TtCgejKNwLl26BENDQ4wcORJXrlyR+9vt27cxZswYpYX0C6G6xcXF8PHxgZOTEw4dOsT+npqaiqioKHTt2hVjx45F9+7dMWfOHNTV1bV62LNsWLFsupBXr17hzJkzMDY2xtSpU3H79m0AjelKvL29MWvWrF+9d0ZGBnR0dLB3714AwK1btyASiTBkyBCWguDSpUtwcHCAo6MjxGKx0lNgFBQU4OrVq8jOzsazZ88wcuRIiEQiTJgwAcB/wmk9PT2xZMmS976v7Ht7+PAhnj9/zkKsb968ienTp8PY2BiOjo6YP38+tLS0kJaWprDnEtIvCnXJyMhA165dUVJSAqAxrLWgoABLly7FoEGD4OTkBJFIhDFjxiisDrLIhpdfuXIFAwcORGJiIgBg48aNMDExwfr161FTU8Oumz17NqZPn476+vpWS4UiIPv+Vq9ejZMnTwJoDAOeN28e7O3toauri9WrV8PCwgI+Pj7vda+lS5fC0NCQpQX19PSESCRCTEwMu+bFixdwcHBAbGysgp/qw6mvr8exY8dgZGQER0dHuZQAQGOqFS8vLzx8+FCh5V68eBHdunXDiRMnUFZWBmNjY4hEIoSEhMhd5+/vj/DwcADNS71w7NgxzJo1C5cvX8a0adOgq6uLTZs2yV0jpIMqKir64Ps/evQI9+/fl/suOjpaLh3ix4DQdq9evcLz588BND63vb09dHR0MHXqVHbdkydPYGlpKZca530oKirC+PHjsWnTJpY+5NChQ9DU1IS9vb1catjKykqlpxZoDWTHvpBic9++fThw4ACMjY0xYcIEdO7cGTdv3gQAXLhwASNHjoSjoyO6du0KR0dHTJo0iaVsa21kx1RMTAzMzMzw4MEDHDp0CL169UJcXBzrL0BjSgZbW1tkZGS8dxlZWVnIyMhAVlYW8vLy0LVrV4hEIrn5r6qqCg4ODkpJ9fCmeePgwYNISUnBlStXMGbMGJb+Z+PGjbCxsUH//v1bnBbrzJkz6Nq1K9asWSOXJrotSU1NRdeuXbF8+XLExcWx9CsBAQEAGt+vk5MTdHV1lSIvnz17FseOHQPQmIJJS0sLCxYsQGVlJbvm1atXGDJkCM6dO9eisl5/74mJiXB3d0d9fT0mT56M/v37w8jICHPmzGFy8blz52BmZtastUDRlJaWYty4cdDU1GQpia5evQqRSMRSzAqUl5fDwcGBte2HIrSVMA/V1taitLQUTk5O6N69O5OXBdzd3bFixYpmlfUmHBwcMGbMGJiammLmzJnsfRw5cgRmZmYoLS1VWFkCSUlJ0NHRQVBQEEaOHAlTU1NYW1tDLBajqKgIkydPhrq6OpNjlYWPjw9GjRoFIyMjzJo1iz37gQMHYGFhITf/Khphnb569Sqbey9fvgwbGxtoa2szeUwikaC8vBy2trYflGavOaSmpsLJyQkPHz5EfX09vLy8oK6ujvnz57Nr6uvrMXDgQDm5+mNCdu45d+4cTp48ydKNAsDJkycxf/58aGtrY8qUKRCJRJg5cybq6ureeL/NmzfLpXQKDg6GpqamXNqmZ8+etcr7kUqlKCsrg6OjI5Ola2troa+vjxUrVuDhw4fsWWtra3Hq1Km3rqWy8lNhYSEeP37MPru5ucHKygrFxcXsu/Lycvj6+iI6OhoaGhrNnu/eF+F9CO/z1KlTmDdvHqRSKXJzc2Fvb4+uXbsiODgYQOM+uLa2Fk5OTti+ffsHlSXbZ1auXAl3d3cYGhpiy5YtKC8vx40bN/DkyRO533h6emL8+PEK3z8HBQV9tOvjsWPH0LVrV4wbNw5DhgyBpaWl3DwwadIkaGtr48CBA81Oe3vv3j1oa2sjLi4OBw8eRHBwMEQiERtbz58/R3BwMGxtbdGtW7cWpwhrCQ0NDRg1ahQsLCygpaUl1+9OnDgBW1tbuTH0vkilUrnxuXDhQgQHB0MsFsPHxwcuLi7o3r079uzZw65Zv349XFxcWpxuWDYVanJyMvT09ODm5sbqU1NTg7y8PEycOBG+vr4QiUTQ0NDA9evXW1Tum5BN3W5lZQVbW1toamrC2tqarZkrV65Ev379MHv2bIUcgSKUWV9fz9ri5s2bGDx4MFxcXJCUlCR3/aNHjxAWFvZRp/IVi8UYNWoUtm7dCqBRT9ivXz+EhoaydO9lZWVoaGhAcnIy60Pv0pEHBgZCQ0MDx48fb3JdfHy8UlM/p6enw8HBATk5Oex9nT17tlV0/cXFxbC1tWVtWVlZCQMDA6irq8PFxYXt3Q4fPgxPT89m90lu6GojZM/3SUxMxOrVq1keaCGvs5+fn5xQCUBpeYVlBYzk5GS2OTIzM2M5zgUeP36MpUuXwsXFBT179mxT5ceuXbuQn5+PmTNnwtjYmOV4TUxMhLW1NczNzTF06FA4OTnB1ta2icD3JlavXs2E8ZKSEnh6eiI0NBQmJiZwcHBgxq7r168rZDH4NZKSkmBiYsLKz8jIwN69e9G/f3+4uLjg+vXryMjIQFRUFHR1dfHgwYP3uq9sG0RHR8PY2JgZCPPy8gA0KgwqKioQFhaG4cOHQyQSYfHixU1+3xySk5Ohrq4uZ3w8c+YMdHV15QxuAvfv30dqaiqGDBkCCwsLpqRUlnGpqKgIlpaWcHZ2xunTpwEAM2fOhIWFBcaMGYOYmBiW07ktzqmSXXBu3rzJjFEnTpwA0Li5EYvFWLVqFQIDA2FgYACRSITk5OR33mvevHkQiURQV1dnc9LJkyfh7OwMY2NjJCQkYMeOHfDy8kL//v1b/fwF4X3fv38fp0+fRkJCAsvte/z4cdjY2GDo0KFySkdA8XPn/fv3ERISIneO1dWrV6GpqQkfHx8cP34cV69eRXh4OLS1td97XAoIz5mTk4N+/fph48aNABrn36lTp8LNzQ1btmwB0GjIDw8Ph4ODQ5Pnfl+qq6uxcOFCBAYGIiAgALq6um268XkdoT1OnjwJDw8PmJiYICwsDPfu3cPw4cPRu3dvpjStqqrCsmXLYGpq+t6bWWHTLxKJoKWl1eTsqQMHDkBfXx+zZs1SykakrZCdP7ds2QI/Pz8EBQWha9eucHBwgI+PD4yMjGBpaQktLS0cPXoU7u7uGD9+PAYNGgRNTU2sXLkSIpGoVc+nehOnT5+Gu7u7nJIsKCgIWlpaWLVqFW7cuIF79+5h5MiRcHV1fW+hfdGiRTA1NYWxsTGGDRuGyspK7N+/HyKRCLNnz0ZycjIyMjIwYsQI2NvbK/w8HuEdpaenIyoqCjt27GDKtPr6eoSHh8PJyYldP3v2bKxZs0Zhc96JEyegp6fXxIGgtZFKpXjx4gX8/PzYuYJA49x+/PhxdO/eHYsWLQLQOD97eHjg0aNHCq9HUFAQRCIR26jv3bsXIpEIc+fORVZWFkpKShAVFYU+ffo0Ueo1B9kzfD08PLB9+3aIxWKcOnUK/fr1g7m5OV68eMGuj4iIwMCBA5VqXPg1ZOeVkpISBAQEoEePHsxRKi4uDurq6li8eDEuXLiArKwsjBw5Eg4ODs0aP0J5qampGDVqFOzt7ZlxZ/PmzdDR0UFwcDCuXLmCe/fuITIyEj179kRubm6zy8rOzsb58+fZWX1JSUno2bMnbGxs5K6fM2cOhg4dKucg1Vxkz5zMycmBsbExcxgrLi6GtrY2lixZgidPnkAsFqOsrAz+/v7Q0dFBTU1Ni+Vl2b3r2bNn2XlN8fHx0NXVhYODg9y8M2/ePIU9+9uQSCSoqanBsGHDYGdnh2PHjqGhoQGBgYHQ0dFBbGws6urqUFFRgWXLlsHY2Fipe7cjR44gMDAQIpEIPj4+KC0tRVZWFvr37w8HBwesXbsWO3fuxPDhw2FnZ9cmZ5i9i/DwcDlnjXnz5kFXVxfa2tro27dvE8NcZmYmYmJiYGtrC3Nzc3bOh7C+SqVSvHr1CsuWLYO+vj5CQ0PZbwMDA9GjRw9ERERgw4YN8Pb2xoABA1qlTQSjWnFxMfLz89GnTx9MmTIFEokEYWFhCAkJ+aB6CPtoExMT+Pv7A2h0srO3t4ehoSEOHTqE/fv3w9PTk63Xw4cPl2sPRbNt2zZs2LCBjT+JRIJhw4Zh4cKFABr3iYsWLYKxsTFmzJiB8vJyPHr0CEuXLoW+vj7TBXwoy5Ytg56eHhITE7Fu3To5B9nS0lIEBgZixowZGDx48HvrZt6G8Js7d+4gNTWV6axSU1M/yvXx5s2bMDAwYPW8fv06unfvDlNTUyxfvpxd5+vrCwMDg2adk5adnY1ly5YhLCyMfVdYWMgM0oKM/PLlS9y7dw9Pnz5t4VN9OMeOHcPy5cuxefNmAI2GDnNzc9jY2KC8vBwvXrxAdXU1PD09MXr06BavXenp6Rg0aBBu3ryJhoYGxMbGQl9fH56enuya+vp6eHp6YuLEiS0qS5bly5fD09MTRkZGEIlEcHBwkNt7iMViPH36FBs3boSVlRU2bNgAQDFnZcm2WXp6OjQ0NBAfHw+JRILs7GyIRCLs2bOHyVyrVq2Cvr4+FixY0KJ9jFDuuXPnMGPGDDg6OrL94dWrVzFkyBAMHTq0ibHrY1sLX+9zZWVl6NWrFxITE1FeXo6QkBAsW7YMQOO+S11dHSNGjJA7l1HW8WPXrl0ICQnBqFGjMH/+fIjFYiaraGpq4sSJE29878pol2PHjkFPTw/Dhw/HixcvmpShbF3/3bt3YWpqys7KnTx5MubPn4+8vDzo6urC19eXrRstkR+5oasNSUpKQu/evWFrawt9fX106dIFixcvRn19PTN2BQQEfJDXcUuJjo6Gjo4ONm3ahE2bNmHgwIFwcXFp4tXT0NAAsVgMJycnFqnQGshOANu3b0fnzp3ZhBIaGgoDAwOsW7cOQONCHx8fj7CwMGzevJkN4rdNGMIG0tfXl3l+RkdHY8qUKQAaPQRFIhHs7OyaRFMoi6tXr0JbWxvbt29HUVERMjMzWf137NgBHx8fiEQimJubo3///iyC7deQnby3bt0KXV1d7N+/H7Nnz8bAgQPh4+PTxKuirKwMcXFx0NDQaBL90RzKysoQExMDY2NjTJ8+HUDjO7Ozs5N7z69P+tXV1Rg0aBAiIiJaXAdZhDYRlGlAo7Fr4MCBcHBwwPnz5wE0bhz8/f0xYMAA+Pv7486dOwqtx4eycOFCWFlZwd3dHdra2uzwc1lKSkqQnp6Ofv36Ydq0aW+91/z586Gnp4eLFy/CzMwMZ8+eBdDYJpcuXUJAQAA0NTXh4OCAcePGsQW8tQ5aFzh27Bh69+4NOzs7qKmpwdTUlBlgU1JSYGtrC3d3d6UoZiUSCV68eMEMv6NHj5b7e0ZGBkxNTdGzZ0+YmprC3t7+vcfl62RlZcHf3x8uLi5ym7K8vDxMnToVurq66NevH3x8fGBmZsYibppDbW0t9uzZg2HDhmHu3LlyB4N+LJw+fRrdu3fH8uXLsWfPHqbgq6iogJubGywsLKCrqwsXFxf07t27WYa6JUuWQCQSITQ0tMnmLyEhAerq6ggLC/voDrNuDrJznhAVIwjcJiYm6N27N1xcXDBx4kSYmZmxKAx1dXWYm5vDysoKNjY2OHHiBAYMGPDBxlxFcv36dTg5OaFLly5NjPnTp0+HhYUFRCIRBgwYABcXFzZ3/dpmMi4uDr1792ZGMlnFT0JCAvr27QsNDQ3Y2dnB09NTaXPi8ePH0a1bN/Tr1w/6+vrw9vZm6/Dy5cvh5OSEhIQELFy4EL169VLIGi2LrKKotRH6qUQigVgshrW1NZPzBMRiMebOnYtBgwahuroaUqlUqWM0ODhYzhv/4MGD6NWrF3r37g1ra2uYmJi0yFEgJiYGcXFx7HNWVhb09PTkPB3r6uoQExMDKysr9OvXD1OmTMHo0aOhra3dZkbn1z2oBcrLy+Hn54cePXogPT0dQKMspa2tDW1tbVhbW8PDw+ODx4/sdcnJyejatSuio6MRHR0tZ+Tcs2cP7OzsIBKJ0K9fP1hZWbXo/SQlJaF79+7Q19dH9+7dWQaIpUuXQkNDAz4+PliwYAEmTpwILS2tFr+P1atXM+ODMB4uXrwIOzs7AI1RjH379sW0adNQWVmJ0NBQVqeCggKWJUERHDt2DFpaWtDU1ISVlRXzyF2wYAHMzMzg5uaGRYsWYfz48dDU1FRKX3yT0vPGjRvw9PSEo6MjUlNTIRaL4e/vz+ZoR0dH9OnTR6kOPOHh4ejbty9mzZrF5LKRI0fi6dOnuH79OkJCQqCpqQkXFxeMHz++zWTot5GTkwMXFxc4ODjgxIkTSE9Ph6mpKbKysnDx4kXMnTsX+vr6zKlUltraWhgbG2Pp0qVv3Gc/f/4cGzZsgKGhodw+ZOrUqRCJRHBxccGKFSvY/KEM5Z6s8S0vLw/a2trYs2cPzMzMWGYOoNG497rR9nVk35mwj961axeioqKgr6+PESNGAAByc3Mxfvx49OzZE7a2tvDx8WGR856enkrNijFixAgYGxtj+/btzGDi7u7O9ktA43sLDw+HpaUlRCIRrK2tYWpq+t7jJDs7W248FhcXw9nZuYkSG2jcn6WmpmLp0qUYPXo0IiIiflU38y6Eco8dOwZ9fX2YmZlh7NixqKqqglgsxsaNG2FhYQErK6uPYn0EGp0CBg8eDOA/0X0hISGYOXMm9PX15fpDc6KYysvLWZRIUFCQ3N8KCgowZcoUqKur4+DBgy16jpYQHh6Onj17YtiwYQgJCWF98/Tp0+jduzeMjY1hZ2cHJycn9O/f/73ldYHQ0FC5bB5HjhxhSn1BaV5fX4958+bBwsIC/fr1Q0BAABwdHVtseJVl69at0NbWxoULF3Dnzh0kJibC0tIS/fv3Z88iO4+sXr0apqamLZZdU1NTmQ5PKGfNmjUsavPhw4cwMzNDaGgo8vLysGDBAnbdunXrmh1VJdteSUlJ6NatG6ZMmYKZM2fK6cpu3bqFwYMHw93dHYcPH25WWcpGtq89f/6c9dHDhw8jMzMThw8fho+PDy5fvgwALItSWFjYG9fzyMhI9OrVC6GhocyZ2MHBgcmpwndHjhxRenYoqVSK1NRUDB48GJqammxfK/Q7of7K1PXn5+dj4MCBTFc/ceJEXL16FXV1dbC3t4dIJMLgwYNb7JDADV1txI0bN9C7d2/s3bsX5eXlAP6zQRI8Os6ePQsNDQ1MmjSJpWZQFlKpFI8fP8aAAQPklEQFBQUIDg7GwIEDsW/fvia/mzlzZpM0Xa3Bzp07ERoaiv3798t9L2vsetPgeJ/NRHZ2Ng4dOsQ8gg8ePAiJRIKTJ0/C1tYWkydPVnporTDJxcTENFGkA43vJTw8HOXl5bh69SoKCgpYP/oQbt26hYkTJ+LIkSPsux07dsDR0RE+Pj5MoSIbau3i4tLiNCiCQPvixQusWbMGZmZmLDpDCP/duHEjrl+//sa2jomJweDBg9lmoaXIhuyGhITAxsaGpdN48uQJBg4cCHt7exbZBTQa3Npa2X348GHo6uri8uXLePHiBXJzc7FgwQKIRCK5dBhCe2dmZkJLSwv37t3D9OnT5SLRpkyZAh0dHWYsMTc3f2PapcrKSrx8+VIuLF3ZyI7brKws9O7dG/Hx8SgvL8fjx48RHh4OY2NjNnceOXIEffv2xahRoxSeVlUYZw8ePMDo0aOhr6+Pbdu2yV3z7NkzZGdn4/79+x9sbJMVcDIyMjBgwACIRKImzgaFhYUIDQ2Frq4u5s+frzBFlkQiafUUnL+GRCLBq1ev4Ovri8jIyCZ/Ly0txfHjx3Hu3DksX74chw8ffq+UZcJzVldXy3lNRkVFQSQSYc2aNU3e38GDBxWeArMtkB1TeXl5GDp0KHMaqaiogIODA8zMzKCnp4fBgwcjNzcXKSkpWLFiBfbv34/Dhw8zI/usWbNga2vbrDWoubypj8bHx8PY2BjW1tZNIjXu37+PtLQ03Lx584MUaSEhIZgzZ06T73ft2oU9e/bg5cuXuH//PnJzc5U2J9bX1yMsLIx5AO/duxcuLi4YMWIEHj16hJs3b8LR0REmJiawsbFptmH9Y+b48eNYtWoVioqKYG1tzTzSZef3NWvWwNbWVqEpNGW9xU+dOiWX4mbSpEnQ0NBg3tH5+fnIyMjA+fPnmz0fCym1QkND5ZwN8vPzMWTIEKiqqsrJIWKxGKmpqQgJCYGXlxfCwsI+GieFa9eusTEHNHqP+/n5yaUxzM/Px/Xr13Hnzp0PGpeyadUB4OnTp3B0dGTr5MuXL3H27FlMmzYNEyZMwNOnTyEWi3Hp0iVkZ2e3aK4SUpTGx8fj4sWLTOY6cOAAgEalq4uLC4YOHYpJkya12Oj86tUrjB8/HiKRSE5WP3z4MFOUGBkZMYcxACydjqKprKyEi4sLdu/ezVIpyxq79u3bBy8vL7i4uCAkJEQp2Q5kZRQhGkd4n48ePYKHhwcGDhyI1NRUSCQSZGVlYcOGDTh+/LhcWjlFc+XKFZiamsplYjl69ChGjhwJLy8vprR++vSp3Bz1sXmxC6lwnZ2d4efnJ5e1ID8/HwsWLGhi7BKeYfbs2XI6gUOHDmHx4sVISEjA8+fPUVtbi3Xr1jUxdoWGhkJDQ4P1b0XLoML9BAW28O/MmTNZ5J0sgYGBb43oen1PeuHCBcydO5fVva6uDsePH0evXr3g4eHBrisqKkJ5eTnbOy5ZsgS9evVqVlTpryGkMQaA8ePHw9zcnDlOTJ06lc0NwpxbV1eHp0+f4siRI7hy5cp7G1j8/f3h7+8v975ycnLQrVs3uTo0NDSgvLwcbm5uWL9+PQD5ft8SQ296ejq0tLSQkJCAiooKlJWV4fnz58jKykJ1dTVOnz79UayPQhtt3LgRI0eORGlpKdasWYMpU6agqqoKjx49QufOnSESieRSfDaH1NRUeHp6olu3bnLRJUDj3jEgIEBhUb4fSnx8PAwNDZmxsaqqCjk5OTh48CBu376NyspKrFy5EtHR0di+ffsHG0Lz8/Mxffp0uUiatLQ0uLi4yCn1hXseO3YMoaGhCAkJwYoVK1pkeJVFIpFg6tSpck7ZEokE169fh5mZGVxcXOTGHwCcP38e/fr1a1HEcWZmJvT19TFlyhS23kkkEvj5+WHGjBmor6+HoaEhmwOKi4vRuXPnFqVQvXz5styalpubC0tLS+acIzz3okWLEBsbi6dPn+Lu3bvM8K/MiO/m8HoKVg8PD/Tt2xdxcXFM1vDx8cGMGTMAND7fqFGj2P6gpqZGbm+Snp4OMzMzZhQDGvek/fr1g6urK/tuxIgRchGGiuJNejCpVIrMzExYW1vDzMyM6UDe1O9bqusX2vPmzZtISEjA1q1bmewmkUgwevRolqWjvr4eQUFBSElJUUhGDG7oagW2bNnSxMP4wIED8PT0hFgslutUUVFR6N69O/OMvnDhglKEoDfx9OlTGBoaMuOR0DFLS0thYmICa2trOU+TiooKDBs2DG5ubq1yTpUs/fv3Z2dUvW7smDFjBoyNjREVFfXOUEvZ9COHDx/GunXr5KLndu7cCVNTU/Y5MjIS06dPb9UJOTw8HP3792cLiDBZxcfHQ0dHp1nePgKpqamwsbGBrq5uk3NsduzYgUGDBmH06NFyXrGPHz+GgYEBC61uDrL9JCEhAXv27MGaNWtYakY1NTUMHDgQxsbG6NatG3R0dGBubs6i6J48eQJnZ2cMGTJEoYYmwRt4ypQpWLhwoZxyoqSkBE5OTk3OrWtrli9f3sQQ+uzZM0yfPh0ikYgpxKRSKRoaGpCRkQELCwtcuHABbm5uTLiqrq6Gv7+/XEo2BwcHOY9yiUSCLVu2yKWCU/aYX7p0aZNzLTZv3gxPT0/U19ezzVFJSQnmzJkDKysrPH78GPX19Th69KjCDdJ37txBly5dWHrI3NxcjBw5EoMGDZJTgLaUCxcusHcheD4NHDiwiSAq5LRuyTzwW0EqlcLR0ZGdQSiVStnaOWLECPj6+n7w/YDGedDNzQ1ubm6YN28e+/uiRYvYuXRtnbJNkbi7uzP5QiKRICYmBi4uLjA3N8eAAQPYdY8fP4a9vT3Mzc2hpaUFNzc3AI1KsMmTJ2Pw4MHo2rUrhg8fDl1d3VY1rrye9kN2jjhy5Aj69+8Pb2/vd6bd+TUDuBA91L9/fzkFsvC79evXw9jYuEmqUEUZ1oX+ee/ePaSmpsLFxUVunU5ISICzszNGjBiBkpISdiZPaxoblY2skUlPT4/JHRs2bICqqmoTT9CZM2di/PjxCnMMe5u3uGykZ1BQELp164akpCSFrIeyTkBAo7ODIPsUFBTA1dUVRkZGH40xS2DRokVy8sL8+fNhbGwMLS0tGBsbw9PTEy9evMCLFy/g6+sLTU1NXLhwocl93mf8XLx4EdbW1nJGi4cPH8Lc3ByXL19GYWEhRo0ahf79+6Nfv36ws7ODg4NDi2R34d0WFRUhOzsbwcHBzJmuuLgY8+fPh0gkwu7du+V+11Jl2a1btyAWi1FeXs7OgRAczYqLi6GlpQWRSCS3djU0NMDT05OlO1ZUusLS0lJcu3YNPj4+zJBbVFSE0NBQWFpayu0Pa2trFR6ltGnTJjmlbXJyMszNzWFkZAQNDQ2Eh4ejuLgYhYWF8PDwgKOjo9LPepLl7Nmzb0z3lpCQAE1NTYwaNYo5ychGU38svO5k5evrC3V1dbn1D2hUJIeHh8PAwEDOCDZq1Cj07t0b7u7uqKurQ0REBIt2Fs6uLSgoYMYuIyMjOWNsSEgItLW1sX//foX2HeG5zp8/j5CQEAwZMgTDhg3D5cuXkZ6ejrFjx0JLSws7d+7E3r172XnUbzLS+vj4yKWXy8zMhJ2dHTQ0NFjWD6BRLklJSYG+vj6TnYDGlJ8WFhZwcHCAsbGxUqILr1y5Am1tbTllub+/P0tz6urqCk1NTTg6OiI0NBQ7duzAlStX8Pjx4w/eU8s6fBYVFbFz8BwcHBAdHd0k7Z67u/sbHYdawoYNG1g/qqqqwvLly1mfc3Z2blbqP0XxpvFdWFiIM2fOoKioCB4eHtizZw8kEgnu37+PwYMHY9euXR+Uclkoo7a2Vk4evX37Ntzc3GBmZtbE2PX48WOFRvl+CIsXL2aZkjIyMjBx4kTo6elBTU3trZkh3nc+eL299+zZw3SaV69ehY2NjZxS/20oav4ZMWKEnLFbQEj3bmpqKudw6efnB11d3RbL8StXroStrS2mT5/O9CDx8fEwNzeHrq4uOzJEIpHg7t27LcoIs3v3bgwYMEDuvOr79+9j0KBBuHXrFsrKyjBhwgRYWlpCV1eXpUYEGh2XW+MImOYipGA9dOgQYmJi5FKwhoWFoU+fPti9ezfc3d3ZUR6urq5Nzmneu3cv7OzsmjjhXblyBZqamiyQpL6+XuHO2bL3O3HiBLZs2YJly5ax4xmysrJgbW0NCwuLNxq7FKXrF86TdXd3h7m5OZKSkiAWi/Hs2TP07t2b7XOioqJgbGyssPmpHXGUBgB68uQJnT59mn7++We5v927d4/u3r1LnTp1og4dOlBdXR0REY0aNYo6depEly5dIiKinj170t///nel1E32XyKihoYG6tSpE924cYPQaAQlAPSnP/2J1NXV6eXLl1RaWsp+U1FRQT/99BNNmzaNOnXqRCoqKgqv5+t1FDhw4AAZGhpSamoqnTx5krUfEdHs2bOpe/fu9ODBA/riiy/eel8VFRVKTk4mX19f2rp1K505c4bc3NxoxYoV1NDQQP/3f/9HT58+pQULFlBoaCjt2rWLhg4dSr/73e+U8pxv4scff6TS0lK6cuUK1dfXU7t2jUNWU1OTvvvuO6qtrX3ve0mlUrnPRkZGZGBgQPX19XTw4EGqrKxkf3N1dSVnZ2e6e/cu7dq1i4iIXrx4QTdv3qR27dqRkZFRs54HAOsnu3fvpoiICNLW1iZHR0dycXGh6upq+vnnnykuLo5OnjxJq1atoqlTp1KfPn1o6NChRET07bff0o8//sj6nSIoKCigqKgomjFjBs2fP5/Gjh1L1dXVNH/+fFq1ahUREa1atYoqKytp7969VFNTo5ByW4pUKqX8/Hyqqqpi333zzTdkampKRI3zyfHjx0lFRYVevXpFJ0+epLy8PPr73/9Omzdvpo4dO9LevXvp4cOHFBUVRV27dqWGhgaSSCRERPT48WN2Xy8vLzpw4AD93//9H/tOWWOeiKioqIgyMjLo2bNncs+bk5NDL168oA4dOlC7du3YWB06dCjl5ubS7du3qUOHDmRlZUU//fSTQuv07bffkpGREQUHB9Pp06fp73//O02ZMoW++uor2rVrFyUkJLS4DLFYTDExMTRkyBC6desWde7cmYKDg+nTTz+luLg4Sk5OZtf+7W9/o8mTJ9N3333X4nI/dhoaGqhdu3Z07949Imrse8J8qK+vTzU1NVRfX/9e95JKpWz+Hzt2LP3000/0l7/8hY4dO0azZs0iIqKgoCDy8vKiZcuW0ZYtW+j58+dKea7WpKCggP75z3/Sjz/+SACoXbt2pK2tTbdv36bCwkIqKCggb29vIiL6y1/+QqtXr6avvvqKVFRUKCMjg6ysrKi4uJiIiD7//HP617/+RX/9619p27ZtpKam1irPIJVK2Xtft24djRkzhuzs7GjkyJG0bds26tevH7m7u1NFRQXNmzePCgoK2O9kEe7xNtq1a0edOnUiCwsLOnHiBJPJhN99+eWX9MMPPzSRB37tvu+LiooKpaSkkIODA82bN4+uXbtGJSUl7O/29vY0ePBgevXqFfn5+VFBQQH9+c9/pj/84Q8KKf9jQOh3W7duJX19ffL09CQioiFDhpCLiwsFBQXRnDlzaMmSJTRjxgw6ePAgjR49mj755BOFlX/p0iWaNm0aTZw4keLj42nWrFn06aef0oULF6iuro4iIyOpX79+FBAQQKmpqS0q7/nz57Ru3ToqLy+nzz//nGpqaig+Pp5iY2MpLi6OfvzxR1q8eDF999135O3tTQ8fPiSipn27tSkpKaG0tDQ6dOgQHThwgE6cOEEpKSm0cOFC2rZtGwUHB1NBQQG5u7vT559/TpGRkWRgYEDDhw+nW7duyd3rfcZP586daevWrfSXv/yF7ty5Q0RE//jHP+i7774jPz8/sra2ptraWvLw8KDDhw+To6MjffHFF/Tpp582+xlVVFQoKSmJPDw8yMvLiw4ePEgPHjwgIqLvvvuOPD09afjw4TRjxgyKjY1lv2vfvn2zy0xKSqLhw4fTnj176Msvv6Tx48fToEGDKDAwkA4fPkzfffcdTZs2jb7++muqrq6mvLw8unfvHi1btoxu3rxJxsbGrO4tQVgrXVxcaOrUqZSenk5isZiIiP785z/T6NGjSVdXl/bt20eLFy8mIqJPPvmkRc/+OjU1NZSYmEje3t507949ys3NpeDgYBoyZAhFRkZSQEAApaSkUHh4OH322Wc0c+ZM+vrrr2n58uV05MgRhdXjXTQ0NBARMVlBkKPt7Ozo22+/pQcPHtCiRYuouLiYvRNlytAfgiATCfttbW1t8vLyIj09PTp16hQdPXqUXfvTTz/R0KFDycDAgO7cuUMASCKR0LfffktlZWX0yy+/0Llz5ygtLY02bdpEBw8epMjISDp79iytXLmSSktLadiwYeTu7k579+6ltWvXEhHRvHnzqFevXrR48WJ69eqVwp5NRUWFjh8/Tn5+fvTtt9/SgAEDqKGhgby8vOjbb7+lMWPGUP/+/SkiIoLWrVtH2dnZFBcX10RvQ0Q0aNAgGjVqFBER269aW1uTiooK7d27l13XqVMnMjQ0pDlz5lBGRgbNmTOHiIjU1NTI19eXJk2aRNu3b6fOnTsr7DmJiF6+fEmampqUlJREP/zwA5OXly1bRp07d6a4uDh6+PAhWVlZUe/evamwsJAiIiLIzc2NRowY8d7tfu/ePcrPz6cvvviCOnXqRDt27CAnJyfKzMykP/zhD6Snp0fbt2+npKQkevnyJRERmzN++OEHhT5zUVERHT9+nLZt20Z2dnZ05swZ0tHRofj4eLp7965C9mXNQdB3XLlyhTZt2kSBgYF08OBBamhoIAMDA3r06BE9ePCA9PT0qF27dpSYmEidOnUic3Nz+tvf/vZBZZw+fZr8/f1p4MCBNHToUFq0aBH961//ogkTJtBf//pXmjhxIt24cYP97i9/+YvcXr416dSpE125coUCAgJo5MiR9OLFCwoJCaHDhw/To0ePWJ+V5X3XEmE+BUAVFRW0bds22rJlCx07dow0NDRo7ty51KFDB3J0dGR6HFn94YeWJ/A2GczU1JRKSkroyJEjcrrMH3/8kQwNDUlHR4f99osvviB7e3vasmVLs+V4YQ/s6+tLlpaWlJ2dTWvXrqXS0lLS1dWlb775hr788ksyMTFh1yclJVH79u2b3R8GDRpEy5Yto9///vdUVFREL168oE8++YRqa2tpxowZZGBgQKWlpeTm5kbp6emsXgCoW7duCp8Pmsvdu3flPhcXF9O5c+dozpw5ZGtrS6NGjaJevXoREdGJEyfohx9+oG7dutHmzZvp888/pz179lCHDh3I3NycrK2tiYiYjra+vp5qamqotLRUrowffviBPv/8c/beBL2WImV6QaaOjIyk2bNn08WLF+nSpUs0duxYWrx4MXXr1o1mz55NHTp0ICcnJ6qurqYOHTqw3zdH1/+63v7Bgwc0f/58CgoKok2bNlF8fDwZGBhQp06d6MWLF2RqakrLli0jOzs72rVrF61cuVJx85NCzGWcNyJYRAUvwszMTOaJd+bMGRgZGbFDpYFGD4LHjx/DxsZGzmqsaGStu4WFhXjw4AGL0khKSoKqqirWrl3LvGLFYjF8fHywZcuWJpZmZaduky3vwYMHuHv3rlzU1bBhw6Cvr48TJ040qYtsLu43cePGDejq6mLHjh0AGtM3iUQixMbGorKyEsXFxViwYAEGDBiA4cOHt0pO56tXryIuLo6lKAIADw8PGBkZITU1lXmQRkZGwtbWtok3+duQbceioiI5b6GFCxfC0tISERERTe53/PhxOc+WysrKZnmaHDhwQM6D5sSJExg2bJhcZFh5eTliYmLkvE1eR1n9rbCwEG5ubsjIyEBpaSkCAgJgZWUFY2Nj9OjRg4UnC6G2rc3bPDxSU1Ohr6+P7du3y6XqzMrKgpeXF6ZOnQpjY2Pm/b1gwQJ07doVV65cAdCYd1hVVRUDBw5s4vEVEBDAcvJ6enrC0tLyg/NktxTB+yUtLY1FLe3ZsweqqqosraJwJkh+fj4GDBjQ5Dmai+yh77KUlZUhKCgI3bt3ZxEWOTk5GDVqFCwtLRWS9zw/Px/e3t7o2bMnbty4AaBx/RgyZAg8PDw+2pzWikJo97y8PNy9e5d5QZ89exZqampNckVPmzYN48ePf6f3/P79++X6xp07d2BsbIxdu3YBaHyH2tra0NLSwqRJk9h1YWFh0NHRkfNW+28gJiYGmZmZWLJkCQYMGIBu3brBzs4O2tracqkTCgsLMXToUEycOBHTpk2TWw9aax54E8I5GDt27MCNGzdgZmYGY2Nj5h24b98+ODs7w8nJ6YMiHo8ePYqNGzciJSUFNTU1ePjwIYsOENKtVVdXY/To0QgMDFRaiqWCggI4OjoiPj4eaWlpmD59Orp06SKXDghoTKHo6emp1JRcrY3QBuXl5di5cydEIhG6dOkiJ/uJxWJs2bIFAwcOxMCBA5V2Xua7vMUHDBjA5JrXUw02h5qaGri6umLIkCHYvn07tm/fjnv37mHq1KmwtrZmh7Y/fvwYzs7OMDc3V/hZbB+K8K4ePnwILy8vDBs2DGPGjMHs2bPZNRKJBFevXkXfvn2ZN39xcTGWLFnywRFPsuMtPz8fRkZGGDduHLvn1q1bcfToUbl5KiwsDN7e3s1KaSmUd//+ffTt2xdLlixBbGwsunTpgrFjx8q98+LiYoSGhkJLSwvPnz9XSCTV6NGjYWlpiR07dqCurg7l5eWYNm0aRCIROwNnz5490NXVhba2NszMzFp8/phQtlD/W7duwcjICEuWLMGKFStgYGAAT09PuQi5oqIiBAYGwsXFRWlRpYWFhfDy8kLv3r0RExPT5LzZQ4cOwdDQkEXcXL9+HWPGjHmvNMYtqZNsBJe9vT2cnJzkvJFLSkrg6emJhQsXwsHBocWp3xXN6/vszMxMlJWVAfiPbGtvb98kOq6kpKSJnLxkyRKoqqrC399fTo4CGtdkfX19Ftn16tUrHDx4UG4OkEqlCo80qaiogJOTE4twLC4uhrGxMSIiIvDo0SO2pysqKsLLly/fGO3x+tmDsbGx8Pf3R0FBAcRiMdauXYtevXqxvaKAWCxGRkZGq6Sn3LlzJyZOnMjSPRUWFkIkEsnVKSgoiJ1BKzxPaWkpsrOz33tv29DQgNWrVyMqKgp1dXW4desWXr58ib59+8LOzo5FhgQHB0NfXx9+fn6IiIiAm5sbbG1tW9QWQl979eoVm39evHgBFxcXWFpaYsqUKezMMIlEgqFDhzaRmVqTpKQk6Onpwd/fH+PGjYOuri5cXV1RVlaG27dvQ01NDR4eHvD29n6vsxzftKacOnUKGhoaWLZsGTIzMxEYGCiX0SUzMxNeXl7Q1dVt0TnOLSE/P5/toXJzczFnzhwMHz4cu3fvZhkZamtr4ezszCJNPpQ37Udu3boFT09PODk5sXn36tWr7JzOd2V9ak65qampiIuLw9atW3HlyhW8evUKQ4YMgbOzM+Lj41kGCm9vb7nIRtk0iy1B6B8XLlzA/Pnzoa+vDzU1NYSGhuL58+fIyMiAi4sLevbsCQcHBwwdOhR6enrNkhfy8/PlfpednY2+ffuyNMapqalYtWoVduzYITenzpgxA1OmTGnzoz9kGTt2LJMjBYQUrCdPnmTfNTQ0oKysDO7u7ti4cSPq6+tRWlrK5hvZuW3VqlVYuXIlXr58iTt37kBdXR3h4eFyGWLKy8vh6OiolDlKdq44ePAg+vTpw9IqJyQkoHv37khKSmL74ytXrkBPT++NaVM/5F0tXLgQx48fl/suJSUFNjY2TWTD/Px8hISE4MiRIzh8+DBiY2PfmYmlOXBDl5KorKzE5s2bWYcWi8UYMmQI+vfvj+PHj6Ourg4+Pj4YMGAAtm7dColEgufPn2PJkiUwNTVVWioq2Y6/YsUKDBgwAAYGBtDS0kJoaChu3ryJ9evXQyQSYcSIEfD398fQoUPRr18/tnFsLeWWbF2XLVuGgQMHwtDQED179oS/vz8bMEOGDEGfPn3eaex6E4cOHWJp3/Lz82FoaIiZM2eyMFshFZNYLG6VdIVHjx5F165dYWVlBZFIhJEjR6K8vBy1tbXw9PRE7969YWFhAQ8Pj2anilqyZAksLS2hpaWFOXPmMGNmeHg4rK2t32jsAlqWfmXXrl3o378/6z+VlZUYO3Ys1NXVMXbsWLlrnz17hpiYGJiYmDRZdJTJw4cPYWpqCicnJ4hEIgwdOpSl4VmxYgVcXFxYKqHWRrYPHzp0CMuXL8f06dOZ0DZv3jxoa2tj9erVuHXrFvLz8zFy5EiMHz8e169fh5GREUu1d+7cOfj4+MDc3JwpDQsKCtCnTx84OzvLGQLmzp2LiRMnYsyYMTAzM2OCmLI3bE+ePJFL0VVRUQEXFxd0796dzYs+Pj7o2bMnzp49C6Bx0xMVFQULC4smqQ4/lNeVYWlpacwwKFBWVobAwEB0794dZ86cAdCYYkzY+H4Iwvt9vdzCwkJ4enrKGbuuXbsGW1tbjBo16qPLaa1ojh07ht69e0NfXx/6+vpMcNq0aRM6d+4Mb29vzJs3D1OmTIGWlhbu3r37xvtIpVI8f/4cIpEIrq6ubKN34sQJ2NraAmick8aNG4fp06cjNjYWPXr0wNy5c9k9/hvSwdXX1yM6OhrXrl1DVVUVnJycoKamBmdnZ6SlpeH69evo1q0bBgwYAG1tbXh7e6O6uhrPnj2Dv78/li9fLne+RVumXMrNzYWNjQ0b/1euXGFCe0ZGBlMWxMbGYtq0ae8ts4SHh0NPTw99+vSBsbExFi1ahLq6Oly5cgU+Pj5QV1eHra0tbG1t5Q7IVnRbZGRkICIiAr6+vkymqaiowPTp06Gurt5kU9SWqXmUxdGjR9GnTx9UVVUhJSUFenp6mDBhQhNFkGBQUHS6QoGwsDD06tULcXFxMDIygpOTE+bMmYOsrCxoaGhgy5YtCikXaNxEnzhxAqamphCJREwxe//+fUyePFnO2FVUVARLS0vY2dkpTEnSXIQ2y8nJgaenJ1RVVZuceQM0pjMcNmxYk7RAzZUpnj17xtJeT506lX3//PlzbN++HYmJiQgLC3svBaIsaWlpcnLw3bt3ERYWhpkzZ7LvMjIyoK6uDn9/fzljV0lJCTMSNJf58+cjKiqKffbz84OZmZmcsWvq1Klyxq6nT58iJSUFWVlZLZKBZNOvAY3przZs2MBSI4rFYqSnp0NfX7+JsevJkyctlr9+DSEtpSCnA/JpppYuXQoDAwMmrytTmRYdHQ0LCwv06NED06ZNQ3V1NbKzs2FhYQEbGxts27YNiYmJGD58OIYNGwYALF3cx8jixYthYmICTU1N6OnpITQ0FMXFxXjw4AF8fHzg4ODwxnNcJBKJ3Bq7fPlyiEQi2NnZNZGdEhISYGBggDFjxsgZtBS9r5Cdx588eYK+ffuiuLgYT58+hYGBAaZPnw6JRIKoqCiMHDkSdXV175QTZO/36NEjbNu2Dbq6upg2bRpLxxgTE8P0CG9C2XunyMhIWFhYYPbs2WyvtHnzZnTr1k0utWlgYCBMTEwQHx//3s6yrxMVFQU9PT0MGjQIxsbGABrlaBMTE/Tr148pwOPi4jBx4kSMHDkSYWFhrA2akxpOeAenTp3CyJEj4erqypxlJRIJqqur2TVisRjLly+Hvr6+Ug3d7yInJwd9+/ZljssNDQ3o1q0bNm7cyNJEJiUlwcfHByEhIW/dw8givFfhOIKamhp4enpi5cqVABplQSMjI0RHRyMnJ4cp6c+ePQt/f/8PSomoKJYuXQpra2vo6+tj6dKlcuvjy5cvkZ2djeLiYnh5eWHgwIHN6huyY/fevXu4du0aM9zm5eXBw8MDgwYNYnqTa9euQVdXt8VnockSEREBfX19ODo6ok+fPtDS0kJsbCyqq6sxatQoGBkZQVNTE3Z2dkrdP5w/fx4ikQjr16/H0aNHMW/ePNjY2CA0NBTV1dXIz8/Hnj17MG3aNGzevLnZfeL06dMICAjA48ePWbpJHx8fWFpaYteuXWztraysRFpaGlJTU7F48WJoamq+V19vTaqqqt6YgtXe3h5Lly5tssdyc3OT0xEATed3QUYT5Pi9e/cyJ4OkpCRcuXIFnp6eze7zb6OgoIDpk4RnioqKQmBgIIDGvVWPHj2wa9cu5ObmYty4cbh37x4kEglu377d4rpMnz6dyduvp39/3Rnx4cOHUFVVlTMmKhpu6FISpaWlcHZ2xrRp07Bz506cOHEC2dnZGD58OFxcXJCWloaamhqMHj0ahoaG0NTUhLOzM/T19VvF42LlypXo1asXTp48CYlEgqCgILnN4MWLFzF16lRMnjwZUVFRLRJOWsqqVaugq6uLtLQ0VFRUICIiAiKRiCl/AWDo0KEQiURyHr+vI7sZLy8vx5YtW+Di4sI8NYXNR3l5Ofr27YuYmBjlPpgM1dXV6N+/PxISElBeXo4rV66gZ8+e8PT0ZMbSxMRErF27Flu3bn1vi7fs4r927Vro6uqy/KwaGhoIDAyUM3bZ2tqyxVCRCP3m8uXLkEgkKCoqwpQpU6CpqSl3oDHQqLyIioqCn5+fUoyqsh7IqampuHbtGoBG5cb69euxd+9euc1xaGgogoOD29z7JCIiAnp6ehgzZgwsLCxgYGCAsWPHQiqVIjo6GjY2NlBVVYW1tTXs7e1Zmzs4ODBjDNCooPHx8YGJiQk7I+Px48fo3bs3nJycWHtERkZCJBLBwcGh1YxcQON70dDQwObNm5GWlobDhw8jPT0dzs7OMDQ0RHl5OQoKCjBmzBioqqrCxsYGgwYNQs+ePVvsxVxZWYmkpCS2Oa+ursa4ceOgpqYmd8A40LjhcHNzg76+PvNAe1+FY3l5uZwC4Pr16zAwMGgSEVBQUAAPDw/o6+szw/bHntNaEdy7dw/a2tqIi4vDwYMHMWnSJIhEImYATU9Ph5eXF7y8vBAYGPhOoVkY77m5uejduzeGDBmC7OxsJCYmwtPTE3l5edi4cSNCQkJQVFSEkpISdu6Jm5sbGhoaPqpzNJqDVCpFaWkpRCIRbGxskJWVhb1790JTUxO//PIL2/xlZWWhe/fucHBwgJ6eHrp16wYzMzPY2Ni0yth/X+7cuQMLCwsAjZ5iGhoazDHBx8cHkydPZtcK7+7X1pKYmBj06tWLyRA+Pj7o1asXFi9ejNraWlRXV+PkyZNYt24dEhIS2PyqjHbZsWMH1NTUoKGhgczMTPZ9eXk5pk+fDg0NjY8uKkCRFBUVYfz48di0aROTT4RogKlTp8qdnaIMmfT06dPsvKEXL17A2dkZVlZWSvUWF/rp7du3oaenByMjIwwdOpQphWSNXYLH7JMnT9pMiQfIj6nXI7vMzMxw5MgRues3bdoEFxeXZjtpCOVVVFQwBe3Lly8RGxsLIyMjBAcHA2hURHt7e8PY2Bju7u7vbeSSSqVITU1Fjx49WLu/evUKwcHB0NHRweDBg+WuF4xd48ePV5jipqGhAbt3727iyCZr7BLO7BIiuxR1buyFCxegqamJp0+fsj7u5uYGkUgEFxcXOTnw4sWL0NfXx6hRo1rd0P748WP4+/tDW1ubKdiEeWD//v2ws7NTumPa+vXroauri23btmHNmjXQ0tLChAkTUFZWhuLiYvj4+LCoAR8fHzaP+fv7y51l1pbIjt/ExETo6ekhNTUVDx8+xJo1a+Dg4AAfHx9UVFTg1q1b8PX1haGhIYtsfv0esqxZswYikQgrV65sEg2/fft2+Pj4KN1p9vLly8jNzUV1dTUcHBwQGxvL9vrCuj1z5ky4uLi88z6y9QwPD4eJiQmAxr4mG6FWW1uLtWvXwtjYWKEK9A9h1apVsLGxwYwZM5hRZPv27ejcubOcsWvcuHHQ0dFBfHz8e8u3Pj4+TGkLAAMHDoSamhqmTp3K9jOyxi7ZM59l988tkZlSU1PRuXNnTJo0CWPGjIGamhoiIiIANM7VixcvhpmZGVxdXdGnT582i2ACGuXpQYMGAWiMlDQ0NERISAiqq6sREBDAsn+IxeL3kmMSExOhpaXVJLLdwcEBN2/exJMnT9CnTx/m9LF69Wq4uLiwc+ybE9HcUmJiYqCnp4e4uDjMmDED2tramD17Nh48eICGhgaEhYXByMgI/fr1g6urK1tjmivXLV68GH379oWuri7U1dURGhqKgoICdm6js7Mzi0y9d++ewuTHAwcOwMjICFeuXIFEIkFhYSGWL18OdXV17Ny5Ew0NDcjOzsbu3btx7tw5pewfhOjaqVOnsjPQBOLi4ph+T3AwaOm+9ujRo+jXrx9zEBcMi76+vjA3N0dcXBxqa2tx6dIl2Nvbw8TEBI6Ojq16nvP7IPsONm/ejL59+zLn5nnz5kFXVxf79u1j46e2tpZFdAm8Hj0lsGDBAohEImzYsAF1dXVITExkmaLs7OwwfPjwFvf511mxYgVWrFgBAEynFBoaigULFiAtLQ0aGhrYvn07gMa9tJqaGpKTk+XuoYi6nD17ljnG5OTkQEtLCwsWLJBzrnj16hUGDx4sl6FJ0XBDl5IQi8XYuHEj88wUBNusrCy4ubkxL+r6+npcuXIFMTExOHbsWKtsWmtqauDu7o4DBw4AaExPp6WlhX379iEtLY0N0tcn4LZQdL148QKjRo1iSp2UlBRoa2tj3759SE9PZ4fXAcCsWbN+dXCmpqbCyMgIGRkZOHHiBCwsLKCrqyu3KAhGJ0WkIHsfzp07h9DQUAQGBsptCLKysqCnp4cRI0a02EP01q1b2LBhA4vsARqVOd27d5czdk2bNg1BQUEKm2xkDaRpaWkQiURYtWoVGhoa8OTJE6a4eX3jJ+uZpcjNkKx3gaGhIfr06QMvLy+58PXy8nKcPXsWSUlJWLRoEXr06KGUlEjvW1egsd+bmZnJGXK2bdsGGxsb1ncLCgpw6dIlXLlyhb3PyMhImJmZyUWIPn78GFlZWfD09HyrsSs7Oxvnzp3D5MmT2TtsrfEvFouxc+dOqKurQyQSsaiNq1evwsHBAUZGRmxTlZiYiMWLF2Pnzp0KSSlZXFwMHR0dzJs3D4mJiYiJicGjR4/g6+sLHR0dOaUz0LhJ7t69O/T19fHixYv3GjdSqRRbtmxh6XXy8/Nx8+ZNODg4wMLCgqXpE7hw4QJEIhE0NDSUcnD1x0Z2djaWLVuGsLAw9l1hYSFCQkIgEomYYlnoj79mgJZKpeyaO3fuQENDAxMmTMDJkyeRkZGB6upqDBs2jAl+xcXFGDlyJI4dO9YmaUoVyaVLl/DixQs2h27evJlFaycnJ2PWrFlQVVWFmpoai+a8ceMGfvnlF0ybNg3r16/H9u3b29TR5U3zf15eHhunWlpa7N0BwMSJE5tEA79rXEqlUlRUVMDV1ZUpjG/evAlTU1N4eXnB1NQUUVFRb/R8VlR7vKl+hw4dQs+ePTFp0iS59aeiogKBgYHo1avXf11Up1QqRW5uLkQiEbS0tJqksNm7dy/09fURGhqqtFTSYrGYOXkIcolEIkFVVVWreIsXFxcjKysLycnJGDBgAFxcXOSMXVOnTmXpitsS2XGZnp6Oo0ePMs/ghw8fwtPTE97e3jh48CAaGhpQUlICNzc35lX6vmRkZODp06fsc0pKClxdXWFubo7IyEjmGS8Yu6ZPnw6gsS8VFxc3a4wIiqD8/HxIpVIUFBQwx6z169c3qZ9IJFKoM5TQz86cOSO3Dr7J2DVjxgy5yK6W8OrVK9bXcnNz2Xf+/v4sTaygNG1oaEB6ejqLalOWM4isAfjMmTPMwfHp06cYNmwYDAwM8OjRI9Yfw8LC4OrqqtS58fr164iNjZUzcl+4cAEaGhrw9/dnCrHq6moUFRWhuroaL1++xNKlS9GzZ0/Wth8L+/btY6noZImPj4e5uTmLWk1LS0NkZOQbs7scPHgQS5culUs7v3TpUohEIqxevbqJsUsZ+7vXsbW1hZeXF4BG5atIJGqSRWTKlCmYOHHie0WpZ2VlwdfXF+np6exaYU2SNXZFR0fD19e3VVM7y8oiy5cvh7W19a8auyZPnvze0RzV1dXYtm0bm+OkUin8/f0REhICAwMDLFq0iMnLlZWVMDU1Rf/+/ZGWlibXri2ZJ4qLixETE8P648uXL9lecdGiRQAa97ELFy5EfHx8m8vviYmJ0NfXR15eHkxMTBAaGsqe38HBgTlmvC/nz5+Hp6cnLCwsmCL+5cuXMDExwezZs2FmZobQ0FD2jrZv3w4LC4s2S7uen5+PmTNnshSKALB161bo6+tj1qxZKC8vR1FREVJSUnDmzJlmGX9k+9PZs2ehq6uL8+fP4+HDh+z5x44di/LychZxbmZmJnc8TEsjyIBGg8br77O0tBRhYWGwtrZmx8PIouj9g7B2jx8/nq3Jsu0TFhaGrl27IjAwsNljIyoqimXCAhoN/4JDtKxM7uvrCwsLC3Y0wKNHj1BQUPDRHQHw+nz09OlT6OvrY8CAAcwgFxQUBH19ffj7+2PRokVNUrDK9gXhCJyAgAD23dy5c6GqqsqiT8vKynD//n08ePCA/VZR+jWxWIzJkyfD1tYWzs7OLNpWiCZTVVWVc4zKzc2FnZ1dk6xFikBIkyvIpkId5s6di6ysLJSUlCAqKgp9+vRh6XaVATd0KQGh42ZkZEBDQwMGBgYICQlhA1wwdrm4uLRJ7uDi4mL06tULeXl5SE9Pl7Purly5EsbGxqiqqmrT8zcEKioq0KtXL5w/f55Zordt2wagccGUPZND4G2LR05ODnx8fLBmzRr2nZDLeMeOHSgrK2PRREZGRq0SNSGRSLBnzx6oqalBT0+viafF9evXoa+vDxcXFzYRvK8yXSAzMxMikQidO3du4gV++vRpaGhoICgoiG1ghd8qY+MaERGBzp07Y82aNczrRZiUZY2Wb3oORXHx4kX06NEDcXFxqK6uxpMnT1BdXY07d+6gpKQEOTk5sLS0hIWFBTP6tCYzZsxg6WOEMbh+/Xq4u7ujtraWeX/U1tZi1apVMDIyYl6tQOO8ExAQAB8fH+jq6soZR06ePAl1dXU8f/4ct27dgre3dxNjV58+fWBhYYGsrCzW/q1t5E5PT4dIJIJIJMK6desANPaFa9euwcHBAQYGBkpL73rhwgV06dIFIpEICQkJAMA8dHV0dOTSOy5YsACpqakfLLwJ586MHTsWtra2ePjwIfLy8uDi4gJjY2O593n//n0EBgYiJCRE7vv/RsrLyxEYGMjmJFkKCgoQEhICdXV1OUHt1+YI4e9CGitLS0uIRCJ4eXnh1q1byM7OhoGBAS5fvgygMU2uo6Nji50L2poNGzZAJBJh//79zOM+JSUFRkZG6NKlCyZNmoTU1FTMnj0bXbp0QefOnVnfvnfvXpMx3xZGLlnF8Z07d5Cbm8vG/bRp09C1a1em2AYa50tnZ+cmCrtfo7S0FBYWFkhOTkZBQQGCgoLYpmTYsGHQ0tKCs7OzUtJyCf0zMzMTmzZtYvMd0Jj2V4hiko0YefbsmdJThLU2r5/zIqT4kDVyAI2pr9TV1REWFqYQw8KbFK7CBkzW2PXq1StERkbC3Nxcod7iQvnZ2dlITk5m3toNDQ04dOgQ7O3t4erqypw7rl+/jlmzZrWpEk/2XUVGRkJXVxe6urro1q0bix4XlEo9e/aEpaUlRowYIRcV9D7z9pUrVyASibBs2TKIxWJcunQJ3bp1w/z58xEaGgpNTU1MmjQJeXl5zNhlYmICf3//Zj2X0AcaGhqYwXXZsmVyjlk2NjZNHLMyMzNbfD4bIH8u1pMnT7B//36IRCIWsQC82dg1d+5chZ7V9uTJE4hEIqY8FtKnW1tbY8+ePWzc1dfXIyMjo4lzjqI5duwYtLS0oKmpCSsrK2ZsLCsrw7Bhw6CtrQ1HR0eEhIRAQ0NDqR7j169fZ7Lp686QQkRcQECA3LkXQ4YMgY2NTRNntY+BV69eMZlIMELLjs3AwEA4ODg0+Z2sfBAeHo5evXrB09MT8+bNk3McFNIYxsTENEljqOxI+YsXL8LW1hYZGRmorKyEubk5bG1tsXr1ahw9ehSzZs2CpqamXITwm5BKpbh48SJEIhHU1dWRnp4u93fB2DV16lQ2F7WGIU+2foC8vLR8+XL069evibGrW7duTc62+zWSk5PlooE2bNiA6Oho9nnRokXQ19fH4sWL5YxdOjo6H+zY8DZyc3NhYmKC3r17MydtoPGZt2/fDjU1NSxevFghZTUH2bPDZP/f1tYWIpEIISEhABrXloaGBri5ucmdUf6+ZGRkYNSoUTAxMWH9MC4uDhoaGix6TCA0NBReXl5Mt9OanD59mjlovp6WTDB2zZ49u4mhtbn7jK1bt2LVqlVYuHCh3PcHDx5Er1692Jp9/fp1hIWFtWg/Iztv3bhxA1KpFKNGjWJyh+y9hXaQjW5UBklJSXB0dERpaSkWLFgAY2PjJjLi/v37YWRkhPHjxzfrHMSGhgakpKTIOd5FRUVhxowZcHBwgK+vr1y0oWDs2rRpU5sd/fEuZOfmNWvWYN++fQAa9RBGRkawsbFh+r8tW7YgMDAQnp6emDNnzhuzHC1btozpiUQiEUaNGsX+Jhi7YmNjmzhNKmONGDBgANTU1OTOZ5wzZw7TA+fl5bGz4F1cXJS2TgUHB0NDQ4NFdgnjsXfv3rC2toaJiYnSZSJu6FIwshNgXl4eLl68yEJGg4KCWBq6rKwsDB8+HLa2tgrxxHsbb+u8Hh4eGDJkCDQ0NLBnzx72/Zo1azBkyJA2MXK9qUyxWAw/Pz+MGjUKmpqazDsAADZu3IiBAwe+Uwkvm7ZqzJgx0NbWbmLsGT16NPr27QsNDQ04OTmhT58+rboZaWhowP79+9G1a1c5bzhZBZi5ufkbPULehGwfFCJ7YmNj0b179yZCANDoNSps6N90j5YSFxcHPz8/9lnwlpY1dk2ZMgV6enpKTcckPFN4eDib/MvLyxETEwMHBwdoaWlhxIgRqKioQH5+PsrKypqdv7y55OTkwMXFBaampkxgkEqlmDJlCuzt7dl1woampKQEIpFILuz49OnTCAsLQ3R0dBMFRGVlJZydnVnqo4sXLzKhWUhHkp+fj1GjRrWJYlsgPz8f586dQ1xcHFRVVVn0k1QqxdWrV+Hs7Ax1dXWlKHvv3LkDkUgENTU1hIWFsT4gGLuE8+0CAwOhpaXVbO/c4OBgqKqqwtvbm3336NEjuLi4wMTEBDdu3EB5eTmWL1+OUaNGtXnqzNYiNTUVnp6e6Natm5xREWiM7AoICICOjg5qamree54SnE527tyJixcv4sKFC9DX18fIkSNx5MgR6OjowMHBAa6urtDW1m5147ayGDduHLS0tJCQkIC6ujqMGTMGurq6MDQ0hEgkgo+PDzN2de3aFb/88gtTmDY0NLRZusKYmBi5TZqgSOnZsycGDx6Mhw8foqCgAF5eXtDX10d4eDhWrFgBDw+PZh12LhaLsWTJEty+fRt79+5FYGAgS+E6ffp0uLi4YO7cuQqfE4X+e/ToUWhqasLCwoIZ1QQEY1doaOhHl/JDEbxtDAsK0tWrV8sd3gw0bpYUrVx/feP/9OlTLFq0CCKRiK2Xjx8/Rnh4OHbv3q0QQ5NshLmuri4MDAyYbAQ0jsHDhw/DwcEB9vb2CAkJwfr169tEcfUmli5dCj09PZw5cwb5+flwcXFhn4FGuVtIAbpr165mea+uWLECampqWLlyJebOnSuXLiYxMRF9+vTBxIkT8ejRI4jFYqxatQq2trYKcYSZP38+1NXVmzhmyZ6VpgyEaL5r164hPj4enTt3xoIFC9jf/fz8YGlpidjY2F89W+h9EfpiWloajh49ig0bNqBLly5M9nr16hUzdu3bt09hZ+L9GpWVlXBxccHu3btx+fJlTJs2DdbW1iy1vHBeqkgkQmJiotLPt37x4gW2bdsGDQ0NuWg7AcEgsmTJEvZdfHw8zp079957OGXypr5SXl6O4cOHw8jIqIk8u2bNmjeetyewZ88e9OnThxl6KyoqkJ2djZiYGGZAEuZywXFMmWRnZ7P1oqysDGPHjmWGHUGGNzc3h7m5+TvTmr7J4XPVqlUQiUSYN29eE0eoffv2sfXq9XsoE6GMS5cuYfny5XLz46pVq5oYu2JjY6Gnp9fEgeRtHDp0CCKRCGvXrkVFRQXq6+vZWaayc1JUVBSL7MrOzsalS5dQX1+vMJnp0aNHmD9/Prp168bGvqyBb9euXU30GK2FUA9h7zJ27FhmjN+5cyfMzc0xevRoPHnyBLdv325WZKdsX0pPT2f79mvXrkEsFjOHtdDQUKxYsQLTpk374LMpFcHrTjAikQiLFy9uIsPFxcXJnV/UEqqqquDq6gqRSIQJEyYAkD9GYPbs2bCysmqyZrU0kktIYypk8FJXV5c7UgVo1PU6Ojq+93EjzeHx48dwdXVlTnIvX76ElZUVXFxc8ODBA6Y7CA8PZ5F0zUVWTpCN7EpISMCAAQOaGLu8vb3Rv3//Vtel/Rqy7/HmzZsYOXIkRCIROwtc1tgl69D2thSswtEwp06dwqVLl7Bz50707t0bnp6e7Jr58+czOUXRyM6FRUVFGDp0KMaMGYMBAwaw87VLSkoQGhqKzp07Q09PD/369ZNzPmuJHCmUf+fOHZw6dUrOrjBp0iRoaGiwlKH5+fnIyMjA+fPnm2Vw/VC4oUuBCC/6woULmDdvHqZNm4azZ89CIpEgJiYG/fv3x8SJE9mAz8rKgo+Pj9LSFcp22qNHjyIhIYHlwdyyZQt0dXVZWD/QOOl7enrKnW/RGry+2Jw9exYJCQlsgd6zZw9TysmenePl5YWJEyf+qjCZlpaGQ4cOYdWqVTAwMICdnV0TIe/8+fPYvn07UlJSWmUzcv36dcTFxeHEiRPsmeLj46Guri53wKHwbM3ZVO7cuROhoaFMwFi7di1UVVXlBHGBa9euKUWpKaT4EaIaBQQBKCYmBhKJBPn5+SylobJZvnw5LC0tER8fDysrKzg6OmL27NnYtWsXdHV12ULXVmRkZGD06NFyHlvnz5+HmpqanLc/0GgYs7e3f6Nn+ettKZFI0NDQgClTpsidNXHx4kW2+ZM9y+tN91AWQj9/9OgRMjIyWJ9taGjA+vXroaqqynIOA41j2sfHRymexEIu7dTUVJbjW5izy8rKMGvWLNjZ2cHDw6NZmwjhPfj7+8Pf3x8ikQhRUVHMYzI3N5edOWhpaQktLa2PzgtYUcjOb7KC8O3bt+Hm5gYzM7Mmxq7Hjx9/sHC0Zs0aeHh4yH1XWFgIAwMDBAcHY/369Zg1axYWLlyoUM/4tkJ2Lg8ICICGhgZCQkLQo0cPaGhoYNq0adi6dSt69uwJPz8/ZuzS1tbGxIkT27DmjYb6vn37wtfXFxUVFUhKSkLPnj1x6tQpbNiwAe7u7rCyskJeXh6Ki4sRFRUFQ0NDeHh4YMqUKe+dZvHChQtISUlBcnKy3OZlxIgRCA8PZ59HjRrFzv96n/t+KGlpaejRowfi4+NRX1/P5J0hQ4awawTZQFFRTB8Lspvm0NBQeHt7swgdoNHIIcgJrytKFElOTg5EIhE7NF6gpKSE5diX3bgpktTUVHTv3h1xcXEoLCxkspGgKGtoaEBiYiK8vb1hZGTURJHSWshGaUilUhQWFmLQoEEsLVFGRgaMjIzg4uKCbt26sZTDDx8+xPz589l+5H0307LjbOXKlcw7XEhbJXDo0CHo6+tj8uTJTKnTnL4i9MWqqio8f/6cff8mxywhfaSQXUKR5OTkYNy4cdi9ezeARhl6x44dTYxdHh4esLe3l6trcxGe/caNG9DQ0MD+/fvx/PlzJnvJGru8vb2hr68vF1WhaIT6lJaW4tq1a/Dx8WFrflFREUJDQ2Ftbc0MwsXFxfDz81NqSsC6ujr2H9BoMFBVVZUzaAncvHnzozrTUuD1dKMXL15ksmVFRQUGDBiA/v374/79+3j+/DlevXoFNzc3lh593Lhxcvs4AFi3bh073zozMxNBQUHo1asXunTpAl1dXeYQIKxvyiQnJweqqqosNZlYLMaNGzegrq7O9nW1tbUoKyvD06dP3xplINtO9fX1ctcJRrs1a9Y0mWdSU1PbxEHw5MmTUFNTg729PctWIOgVBGPXnDlzWFaYD50zlixZAjU1NcTExLD5VUjdO3/+fHZdVFQU9PX1oaenB2trazaOm9Mmb9LrlJeXY9asWRCJRCz6QkAsFmPv3r0Kiax9X2TrePr0aaipqWHSpEkYOnQoM/oBjboYKysriEQiWFhYwMrKqsV7uqtXr7LjB27duoWGhgbExcXBwsICjo6O8Pf3V9i5kR+KrL5KkJ82b94sJ0MAjQ4+ikgbCPzn3EZdXV0mPwrXrV69Wk7XqQheT2P67NkzjBw5Erq6urhw4QKKi4vx9OlTeHp6Yvjw4UoLHrhx4wbs7OxgZmYm975v3rwJa2tr9OnTB87OzvD29ka3bt1a1Cdk9TSHDh1C9+7d5Qw5CQkJsLe3h5+fHzIyMnDp0iVIpdJWMWY0l4ULF8LKygru7u4sEkvIGFNeXg5jY2PY29vjwoUL7PljY2Px+PFjdo9Xr17Bz89PzmhbX1+PtLQ06OjowNfXl32/adMmha+Dsn3r9fEUEhICW1tbrFy5ku0dMzIykJycjLS0NIWkTpR12NPX14eZmRnGjh0rp2cPCgpCt27dkJSU1OpnnnNDl4IRDkYPCQmBj4+P3GZl3bp1sLW1ha+vL0JDQ3Hw4MFWUVqEh4dDU1MTOjo6sLS0ZBvFBQsWwMTEBHZ2dggKCsKgQYPkvKFbozOGhoYiKSmJDbYFCxZAV1cX2tra0NXVZZ60GzZsQPfu3eHk5IRRo0bB2dkZtra2v5oGJTMzU25wxcXFwcbGBmPHjm2z1D+C966RkRF69uyJ0NBQ5m0lKLRkN7TNZdasWbCwsEB4eDgTyGNiYuQ8hl+npRPwmxbzyspKbNy4EcbGxnI5jBctWsTSDci+P0VuFGRTCAikpaXBy8sL2traCA4OZp77AODo6Ngm6UQB+bbLyMiAj48PTExMmHfM3LlzoaGhgeXLl6OoqAh3796Fj48PBg8ezH4rlUrZ4iKrRJRNO1FcXAxdXV05j+SMjAw4Ozuz0PvWjOgU6pmcnAxjY2NoaWnB1NQUJ0+eZN7KgsJl4cKFWLt2LbZv366wUHjZ1FGJiYm4efMmS/WWmJgIdXV1zJgxQ25zWF9f/8EH+75utBbqL3i2RUVFyfXTffv2YefOnUr1BGtLZL0ghRSaQ4YMQWRkJMRiMa5cuQJPT0+Ym5u3OO3DzJkz4ejoyD4L7+D8+fMsn/brBrXfKm9KYzN27Fh07doVZmZmUFVVhaenJ9TV1dGlSxeoqalBS0sLMTExiIiIgL+/f5sbU7Zt24aBAwdizJgxCA4OljNAnD9/nhm7BKOkMF4Ffm0dCw8PR+/evWFmZgaRSIRhw4axzY27uzuGDx+OY8eOwcPDAw4ODmxNUoZMNHv2bBZpXVlZCTc3NwQEBMDExAQuLi7susTERKWnCGsLBJl58uTJmDBhAiwsLNCrVy+W7iY6Ohrq6upYunSpwr1Chff5+PFjTJkyBZ07d24SdXD37l10794dIpFIzuCpCMRiMQICApgTR3l5ORwdHeHq6gpVVVU5OU0qlTbp563F48ePsWvXLlZ+XV0dcnJyoK6ujgcPHqCwsBDjxo1DTEwMKisrYWtrC319fcTExMiNxZbIFcI6GRoa2sQjWVinQ0ND5Ty53xehH5w4cQKOjo5wcnJ6o2OWYOzKz89XSvrIR48ewczMDIaGhnJe0bLGLtk0hoo81+DKlSuYOHGi3N6jtra2ibHr5cuXGDt2rNLlkqSkJBgbG8Pa2hoaGhpybf348WOEhobCzs6OpVBTpsy6efNmTJo0Cfb29pgwYQKLrN28eTNUVVXfGkXyMRm7ZNtn0aJF6NWrF7S0tDBw4EDmYf7s2TPY29tDS0sLNjY28PHxgb29PcRiMRoaGrB161Z07dpVzrgRGRmJHj16ICAgAGpqavDz82PpLfX09JoYg5XZJmKxGIMGDYJIJMKAAQMwdepUXLx4ERs2bICPj897RfvJttOmTZvg4+MDOzs7+Pj4MCXxrzlgtIaxS1YWCQ4OxrZt21BTU4OsrCyWRlKYJ9esWYPevXtjwYIFH1Q32Wujo6PZHCgYu5YtW9bE2JWcnIzdu3e3SI8k/CYjIwOxsbGYOHEitm3bhpKSEtTX1zNjV2tECL6J1yOqCwsLMXPmTKavKisrw+rVq9GnTx9m7Kqvr8eJEydw586d946mA+SPsdi7dy+io6Nx/vx5iMVi3Lt3DyNGjGCRXcB/9jZtIcPv2LEDEydOhKurKwIDA9l4mzdvHjp37owtW7Y0MXYBHzZe3uTAL5y3JaSyNTAwwIMHD5ixfvjw4Qpz4H9XGtPbt29j7NixUFdXh4GBAWxtbTFw4ECFRMy8XgdZxowZA5FIhPDwcLmzKevq6hATE4Pw8HCsXLlSIfuHEydOYMCAAUhLS0NSUhL09PTknEgTEhJgZ2eHPn36QCQSKS2QQxEcPnwYurq6uHz5Ml68eIHc3FxmmD18+DCARplcXV2dyYOHDx+Gu7u7XJ8Vi8WwtrbG7Nmz5e4vlUoRFhb2xrMhFbUOyvapDRs2wNvbG+bm5kyf8fLlS2bsWr58OSorK5tkBlHEepWens6yx1RUVKCsrAzV1dXM4UQqlWLy5MkQiURNUpkqG27oUiClpaWws7NjVl2xWMw6s2BU2bx5MwYPHgxdXV2leWbKdvyCggIMHjwYt27dwu3btzFjxgxYWlqyBTklJQWBgYGYNGkSli5dyurbWgK6iYkJjI2Nce7cOSQmJsLCwgLp6ekoLS3F5MmTYWhoyM5uOnnyJDvwUXYD/ba63r59G9OnT2+SXmLTpk1wcHCAv78/Ezhaywvr3Llz0NDQYO0fEREBHR0dhIaGskgywaP7ffNNR0ZGIjMz861/s7a2xoIFC+Qiu9TV1ZWaz1qIHBSorKzE+vXrYWxsLKdAmDlzJlxcXJSiQBTuef78eYwfPx5BQUHMy7ihoYG1h2DAWLx4Mfr27dsm6UXelM89IyMDXl5eMDExwfXr19khx927d0ePHj1gYWEBV1dXOSHq2bNn2Lx5MxMuEhMTYWJiAlNTUxw4cIClEpk/fz5CQkLkhKLs7Ow2O5fv5MmT6NKlC1auXImcnBwMHDgQDg4OOHHiBBoaGiCVShEbG4uePXtCW1tb4VE3R48ehY6ODnR1dVkqNCE1iaBECwwMxJw5cxAVFfXB84Xs4fK+vr5wcXGR82wRUjRGR0fj2bNnuHr16gcb0j523jTGT506BQ0NDSxbtgyZmZksBZEQJZCZmQkvLy/o6uq26Dyc1NRUqKqqYv/+/XLfnzt3Dra2trC3t/8o0gq1lNfHryBgSqVS6Ovr45dffoGdnR3Ky8tx584dXLhwAaNGjcIvv/yC0aNHIyMjo1XPlngd2c35+vXr4ebmBnV19Sbeu+fPn8fw4cPRr18/XL16Ve5vv7aW3L17F4aGhrh27RoqKytx9+5duLq6wsnJCenp6cjIyIC+vj6L2hTmV0UfHF1QUACJRIKRI0ciJCSEpQSaMWMGysrKsHHjRohEIpiZmTV5xv8WiouLYWtrKxelIxaLMWLECLkDiufOnQtdXV2FHWQtvAPZ+z1//hwzZ85sokCrqqrC5MmTsX37doV7i1dXV8PIyIgZ0MLCwphTRWhoKEQiEebMmdOqXupv4v79+yxl16JFi7Bp0yZUVlYiPDwcd+/exaZNmxASEoK7d+9CIpHAzc0Nffv2xbBhw5o1jwjv58GDBzh9+jRLq7xp0yaIRCKsWLGiibHr2LFjLYrouXDhAjp37oy5c+ciJCQEenp6cHd3Z3+PjIyEuro6oqOjIZFIFLpHEp734cOHmDt3Ljp37szScwnIpueSPR9HEYjFYnaovGwqZeA/xq4uXbogMjJSoeW+jtAOt27dgpGREZYsWYIVK1bAwMAAnp6ecvJqUVERAgMD4ezsrNQD7iMjI9GrVy9s2rQJW7ZsgZGREXR1dZnRd9OmTVBXV8e8efOUVgdFsmTJEujq6uLs2bO4dOkSnJycYGlpyRR7FRUVGDFiBJsHhX5eV1eHhoYG7Nu3D127dpUziIaGhmL8+PFMyQU0zpuDBg3CqVOnlPYsQn+RNW5nZWXBz88PU6ZMwaxZs9CnTx8MGDAATk5ObB55H6KiotCrVy8sWbIEixYtgq2tLXr27InU1FQAjYafzp07IyoqqtUdEGTHydmzZ+Hr68vOmAUa20BPTw8jRoxg8+SGDRs+yDj9prYVUvm+buwyMDCQi4IX+NA5UlZ2S0pKgra2NiZPnszO+jE2NsarV69QWlqKWbNmoXPnznLHWbQG8+bNw9atW9m6dufOHfj6+sLMzIydrQ00Gl1WrVqFPn36tHhuEM4oHDp0KPT09GBoaAgfHx/U1NTg7t278PT0hIWFhVz5rR01sXDhQvTp0wfLli1DfHw8VFVVMWTIEGbYCgsLQ5cuXbBmzRqFOKnKOvBbWVlh7dq1AP5j7NLQ0ICFhQX8/f3fyyn+XbzpN7JpTF93mj9+/Dj27duHlJQUtm9QtE719OnTLOofAPz9/WFsbIy4uDilnYd1584d+Pn5MXldLBbj2LFjTYxdly5dwsGDB5ucv/axsXz5crn0i0Cjs8f06dMhEolw4sQJAI17A9l5UNinnjlzhsnmM2fOhIeHR5OIuY0bN2Lw4MEwMDBgkc/KQJBToqKisG3bNjx//pz1vVevXmH69OkwNzdH165dYWNjI3cerCLYsGEDe76qqiosX74cdnZ2zOlEWCNDQ0NbfT/DDV0K5P79+zA0NGQKOdlUGC4uLti7dy+ARguxstKwyG4q7927h8TERHh6erLFprCwEKGhobC0tHxrbtzWMPrI1tPZ2RmmpqaYMWNGE8+4kJAQGBoaIjY29o3nEsjWVTantlQqRUhICDp37gwrK6smSuNNmzZh0KBBGDFiRJNc28pAKpWivr4egYGBzCOzuroaLi4ucHFxgaWlJaZPn84WzISEhPeaDHx9feHg4MCe/eLFi02E7oiICFhbWyM8PJwZdaKiouDq6qqwiU72fV6+fBmamppy540BjRuo5cuXN8lt/6Zc6C1F9uyTLl26wM/PD+bm5rCwsMCePXtQW1vLoizt7e3ZoeltkSJOtu2Ki4uRnZ3N3pMgxJqYmDAPjYKCApw8eRLXr19vEnYsHKAeEhKCiIgIhIWF4dKlSwgODoaJiQnMzMywdetW7Ny5E9ra2m+MYmltBXdlZaVcfmnhcGw9PT3o6+vjxIkT7PkKCws/yBvuXQh95N69ezA3N8eOHTtQUFCA+fPnw8bGBvPnz2dzQ0pKCkxNTWFiYiJ3EOuvITs/JScno1u3boiIiEB4eDjzUBau2bx5M0ttYWFh0WYRp8pC8O6TSqVoaGhATU0NPD09sXLlSgD/UfpGR0cjJyeHef2cPXsW/v7+LRKaX716hdDQUOjo6DCjycuXL7F48WKEhoa2WaSEIpEdt9u3b0dQUBCGDh2K2bNno6KiAomJiRCJRPjll1+QmJjIPD8TEhIwbNgwjBs3rkWbwZYiW+bWrVtx+PBhbN26FcbGxnB2dm5iiExLS2Me9u/L6tWrERwcjMDAQDlBPycnB1ZWVszrs7q6GoWFhezviva+O3HiBKysrJCRkYGUlJT/x96dB9SY9v8Df4csM8yYGbN5ZjzzfOeZOVGIiPZCoUUlhLJUCMmSLZGdyhLJFipLtuxM9iWhLFmyJbKVJUtCaa/3749+537OETOWNrlef3E6nfs+nXPf93Vfn8/1+fDYsWO8cuUKhwwZIvVb3L59O+3t7dmvXz/evHmzRLZf0SQkJLBt27ZKfeFIMiMjg23atFG6MfyYvgJvcujQIdrY2NDe3p7BwcFMT09nenq6lC2+fv16JiUlcf78+ezcuXOJloh78OABk5KSmJCQwI0bN/LQoUM8fvw4hwwZIk2kzpo1i4aGhjQxMakQQfjo6Giqq6tTJpNJ2ePPnj1jTk4OLS0tpet3eno6XVxcGBcX91Fju3379tHAwICmpqa0tbWVkh/kqykCAwNL7Dtx584dLlq0SHoP2dnZ3L9/f7Fg19SpU9miRYsSCazIE3hIKgVwnj17xilTplAmk0n3jHIlWZ5Lvu2EhATGxMTQ39+fc+bMoZqamrTCR3EVemBgILW1tZmamlqq14erV68yODhYmhzOycnhqVOnqKenVyzY9fDhw1IdJ8XFxbFDhw48e/YsyaLJxRYtWnDXrl08d+6cVJJpyZIl7NmzZ7lcN/+J4j5dv36dVlZW0vu5fPkydXR02L17d1pZWUkN4589e8bOnTvTzMyM8fHxSqXITpw4IQXhFVcXkkXn6KSkJN64cYMDBw5UWg1dWmJjY2loaMj9+/czJSWFOTk50lzC48ePGRkZKZWNUyyz9Xfi4+PZsWNHxsTESI/l5eWxT58+NDQ0lM47U6dOLdH76Pexe/duNmvWjNra2m9MjL148SL19PTYpUuX9z5fvV66UXH+JCAgQCnY9fz5c6mcozyB930pjr8LCgqYmJjINm3acMOGDSSL+mW2bNmS8+fP5/379/nq1SumpaVx7Nix1NLSYnp6epl9BrNmzVKaJ7h58yaHDBnChg0bFpu/Sk1N5dKlS9m0adP3ShJQfC/Xrl2jiYkJt2zZIs2BhYWF0dramu7u7szNzeWFCxfYo0cPWltbMysrq8y/j3FxcTQ1NZVWIR89elTqyXP+/Hlp/Cwv6/gh+/dPCfyKfRufPHnCYcOGUSaTcefOndLvfcg4XnG7jx49UloV6u/vL63s/LtjrKTPgTk5OdIq89DQUOnxQYMG0czMjGvXrpWOWcVqPx8jKSmJvXv3ZuvWrZXOi9nZ2VKw613PrxVFQEAAzc3Ni43tjxw5QplMRplMJvWVGjt2LDt16iQ95+zZs2zUqBEnTpzI1NRUXrlyhZqamvTw8JDm1dLT09m/f3/6+/tz5cqVtLKyUip5WFJOnjwp9XUni1a879mzhwMGDODcuXP58uVLZmVlcdu2bQwJCSmR+9nXv0/Tpk2jjo4Ow8LCaGRkxK5du3Lq1KmMi4t7Y8nxsiQCXR/h9frD9+/fp66ubrGLfUZGBq2trd9Yy7u0+Pn5Sc2tdXR0lII59+/f58SJE2lpaVlsoFqWFA82e3t7ymQyenh4FHuep6cn27Rpw8DAwHeakJRPIOfk5NDHx4c6OjrFlvSSRWX8HB0dS7T8xz9xdHRkYGAgX716xZkzZ0rBIHl2Urdu3d654bw8gCoPGslXTM2ePbvY32nq1Kls1qwZZ8+eLQ3SSyrApPj7hw4d4u7duxkYGMh27doVW01369Yttm7dWqm2fUlmFhQUFEivFRcXRz09PWmyIDk5WcoukD92/Phx+vn5cenSpeWSfaL4vgMCAmhtbc2mTZuybdu29PT0ZHp6OhMTE+ns7My2bdu+MSPx9UHU5cuXpQkp+ZJ+smiF2IoVK6itrc2RI0dKJdtKK/vnXT1+/Jht27blmTNn+OrVK3p7e0ulMKysrNipUycGBQWVWIBL0ZUrV7hy5Up6eXkpPS5fCanYdPrp06fvfMO4b98+pf+npKTQ2tqa69evJ1lUtjA6OprTpk3jmDFjpG1ERkZy5syZlaJPlKKIiAhqaWkVK8dka2vLy5cv8+HDh9TX15c+hyVLltDe3l66sSuJ1W1Pnz7lpEmTqKamRlNTU9rY2LBVq1YftVKsIpozZw51dXU5adIkjhs3jtra2rS0tOS5c+ek8mxNmjTh8uXLeffuXbq4uEhlqcjyWcmleB7cunUrtbW1pf53GzZsoK2tLQcPHlxswl8x2P8u5DeHtra20nblwb2dO3dSU1Oz2DY+9u+xfft2pYSC+Ph4urm5SeNEeXbgokWLaGZmJj1PvrrnQ0qxfSri4+PZsmVLpfNlQUGBtNJt9OjR0uMlOXkjv/ny8fGhk5MTO3bsSF9fX758+ZLp6emcPn06ZTIZjY2N2apVqxJJgJHv/4EDB2hhYUEdHR3OnDmTDx8+ZH5+PidMmKDUR8Lb25vh4eHlurJX8W++f/9+ymQyNmrUiFOnTpXKSGZnZ7Nbt26cNGkSL1++TFdXV3bt2lUal3zI8XPx4kVqa2tz48aNfPbsGePj45XGtOvWrWPDhg05e/bsjw46JSUl0dHRkdra2kp92N42gfOxiXHx8fFKn2lkZCT79evH3r17MywsTAq4vml1YUnbu3cvW7duTVtbWxobG3PLli308vJSasquGOwqzT558m05OjpSJpMpNUnPy8vjyZMnqaenxwEDBpRZYsrRo0dpampK8n8lVsPCwpiVlUV3d3dpYjs7O7tUEvY+luKxl5OTw4SEBBoYGDA+Pp63bt2im5sbw8LCGB8fTz09PbZt21YaC6SmptLe3p7a2trSPemsWbOkqhxdu3Zlw4YNOXXqVJJFf4OZM2dSS0uLHTt2pKOjY4mvhn6TxMREDh06lCYmJhw8eDBPnz7Ny5cvU1tbW7r/efLkCYOCgt45YSQyMlIpoCWfq0hLS6Oenh79/f2l55bl5y7fRmpqKp2cnBgeHs5r167R3d2dVlZWSpPeZFFFBFNT0/eaXH3f0o05OTl89uwZN23a9MGf87p166R7o8LCQt65c4cWFhYki87PRkZG9PLy4osXLzhx4kTpuQ8fPiyV+8I3kSegKP5/+fLlLCws5P379+nh4cE2bdoUm/978uQJg4OD32m18fTp04ttZ+/evezcuTPT0tKk72F2djZDQkJoZGQkVfOJjY0tt4QY+ZhG/m9NTU2uW7eOeXl5dHZ2ZkBAgPTcDwm8vGsCv2Kw6/Hjx3R2dqaOjs57Jae+bbuLFi2iubk5LS0tOWnSJOlx+SrH0uwj+6YqG48ePZICbYqLFgYNGsSOHTsyJCSkRMeODx8+pL+/P5s0aVJsnjYnJ0caH7q5uZXYNkvK28agkZGR1NPT47p165SCXXFxcezXrx+9vLxoYmLChIQEbt++nTo6OnRxcZGet3z5choYGHDy5MnMzs7mmTNnaGhoSAsLC1pZWdHW1pYdO3YkWZQo1qFDhxI5X71+7Jw8eZI9e/ZkYmIio6Ki2KtXL7Zr1469evWimpqa0vEnVxLBrqNHj0rXnFevXrFbt27s0KEDx40bx/j4eBYWFrKgoIAODg7l1hKGFIGuDyb/osXGxnLu3Llcvnw5ExISOGjQIPbt21fKPpRzc3OTsgVLs0wbWXRhbN++PSMiIhgWFkZDQ8NimXD379/n8OHDOWrUqDIfmL/tpCO/2ZT35lE0ePBguru7/+O+yoMZ8oGoPLvL0tKS8+fPLzapX9I9H95EcZ8XL17MQ4cO8fTp0xwyZIh08K9evZpmZmb08PB45/IrGRkZHDVqFG1tbdm3b19qaWlx7NixtLS0LFZOIT09nXp6ejQ1NVUaDH/sZ6/4Wd6+fZtaWlr09PRkZGQkFy5cSBMTE6VgV0pKCj08PHj8+PESvflZsmSJlHkh36eNGzeyb9++JIsGmwMHDuSUKVPo7OxMfX19pVUN5S0oKIi6urr866+/GBsbS39/f1pYWNDFxYWZmZm8evUqXV1d2aRJE2kCWJHiyq7Tp09TJpNRTU2NY8aMKZb9e+fOHa5du1bKzpEHesvrBj0rK4suLi48c+YMIyIiOGLECKn0pbu7O5s0acI+ffqUSkNTZ2dnymQyWllZFatpPnv2bHbq1Injx49/r8mtY8eO0cLCgg8ePFBaNWZmZsaEhATev3+fgwcPppWVFU1NTdm+fXv26NFD+i6WV/nI0nTixAmpvIY8mzgzM5Nt2rThlClT2K5dO3p7e0ufwbp162hmZlbiJYlycnIYGxvLFStWcPv27SXeY6W8xcbGsl27dkoBxZSUFJqZmbFr1658+vSpNImvrq5OMzMz2tralutKLkW7d++mq6urtMpPLiwsTAp2vSkx5Z+OmYsXL/Ls2bM8ceIE16xZ88Zm5hEREezSpUuJXRMKCwv54sULymQydu/enfHx8bx79y6dnZ2lhtXk/yYBg4OD2aVLF4aEhHDGjBls3bq1VGr2Uye/4SGLxlzyAHZaWpo0ifb6ex08eLBSMkxJ7INcRESE1DuDLJrAla96l0+enD9/ngcOHCjRRKjIyEg2bdqU69at44kTJ6SJqZSUFC5YsIDOzs6Mjo6mv78/9fT0yrVk4evH1PPnz5mfn8/IyEipb2VaWhoLCgro6+tLY2NjGhgYKJVT/tAx3vr16+ns7FxsHxITEzlq1CiSRaXDWrRo8UGruhS/C8+fP6e/vz+1tbWLrQ5VnMAZNGhQsd99X3v27GGrVq2klQonT55kw4YN6e3tza5du9LU1JS+vr5Kwa6GDRuWSnmuK1euUFdXl9u2bWNqairT09OZlZXF9PT0twa7yoI8iKSrq8v169dL54r8/HyeOnWK6urq73Qv+DHkqwCio6NpZWXFdevWsVmzZly3bh3JomPDzs5OacKTLP/rpyLFfZk3bx4DAwN55swZTpkyhUlJSQwNDeWkSZOkpKqePXtK95Ly4/bp06fs06cP7969y9OnT1NXV1cqkZeZmcmIiAg2adKE06dPJ1n0d9m3bx/j4uJKpMn9372vmzdvMjo6Wlpdun//fnp7e0tlP/v3709bW1veu3ev2N/jbX8nuejoaOro6BQrBSdPWlZMDPq71y4NcXFx7NWrF/v16yfdE6WmpnLo0KG0sbEpFuz60PHMu5RubNiwIf39/ZXma973nJ+Tk8Phw4fT1taWXl5e7NChA7dv386OHTsyMTGRxsbGnDBhgvT8Tp06KfX6Lgvnzp2jpqam0n7Ie++EhoaysLCQSUlJHDlyJC0sLIr18nyXe7q0tDROnDixWFLNwoULaWRkJP1ffo+Um5vLpk2bMjg4+CPeWcmIiYlh165dGRwcTE1NTen6lp6eThsbG6kHrdyH3uO+awK/fHXj/fv3OWDAADZs2PCN8ybvs92WLVsyKCiIPj4+bN26tVLFojlz5pRJGdPX50CePHkiBdoUg129evWira3tB1chUByv5+bmSt+59PR0Llq0iFpaWsWS2LOzs3no0KEK10dY8bu2a9cuBgYGcsKECdKq9RkzZrBFixZcsmQJr1y5wqSkJLq4uHD48OG8ePEijY2NeejQIebk5LyxJ1lwcDB1dHQ4adIkZmZmMikpiTt27KCvry/DwsKk7fv6+rJXr14l+v1YtmwZN23axLt377JRo0a0tLSkTCbj2LFjpbllLy+vYoncJeFNqwoLCgr48uVLpT7hgYGB1NPTK9debSLQ9QEUy6I1bdqUnTt3llZHrF69mpaWluzTpw+XL1/OM2fOcObMmdTW1i6TFSN79+7lzJkzuWTJEpJFJyl5Jtzrwa4nT56U2LLWd6V40rl8+TIvXrzI06dPS4/Z29vT0NCQkZGRxQbI77KvWVlZXLx4MTU0NKQG3zk5OfT29paa8b2+sqs0nTlzhkuWLCk28Jk7dy779u0rvZcpU6ZIN7jvIysri23btqW6urqUyeLj48OOHTvS399fuklMSkri8OHDuWnTplKZSJ81axY9PDyoq6vLhg0b0tXVlUeOHOGiRYtoZGREDw8PHjt2jE5OTnR1dZX2oSSCXS9fvqS7u7tSk8PCwkJOnz5dChQtXryY48aNY2ZmJp88eUKZTEYTExNOmDBByiAvD4WFhUxNTWXPnj2Vltjn5+dz8+bNNDU1lT7XEydOcNasWcX+Zor7fvXqVSYkJPDChQu8evUq1dTU3hg8lX/v7OzsSrVu8Ovk242Pj+eJEyek3jPycjgeHh7STTNZtJozPDy81MqL5uXlceTIkdTW1uaqVauKBcKnTp1Ke3v7d87CiYiI4OHDh6VyOoqTt7a2tjQwMGDTpk3p6OjI8PBw5ubmcsmSJZ/ckv8PcebMGQ4YMIBt2rSRGviGhYVRU1OTXbp0UXqut7c3+/Xr98ZytcL/vH7e2rVrFy0sLKS/m/waeuPGDTZt2lQaeF+7do179uxhdHR0qdWQf1+FhYUcPXo0GzVqxE6dOhU7FteuXcuuXbuyZ8+e73U+mDt3Lk1MTKijo8Pg4GC+fPlSaqweHh7OpKQkpqSk0MXFha6uriU2FpK/zu3bt6mrq8vevXvzwIED9Pf3Z/PmzTl8+HCl5ycmJrJr1660tramtbX1O6/srsji4uKUslwPHTrEXr160dLSkosXL+arV68YFxdHDQ0Nuri4cNu2bbxw4QJ9fHzYsmXLErtpVuyR6OvrS0dHR44fP17pOfISz35+fqWSJZ6bm8uxY8dy8eLFJIsSlTZu3EhHR0fq6OjQzMyMvXr1oqGhIU1NTculjLKc4nklNDSUw4cPp7m5uZSAsmfPHqqrq9Pb21vqV3X27FkmJiaWyAS3vC+TPOgoP0cdPHiQLVq0kAKAHxPkOnPmDGfPns21a9fy8uXLXLhwIXV1daUVKnIlNYHz7Nkz5ubmctCgQTQ1NWVYWBg9PDyU7g0UA67yYNfo0aNLpTzXtm3baGtrW+ye48aNG/Ty8pImcl9fYVCS5O9HXhJKPhmZk5NDV1dXdujQgZs3b5Ym2vLy8njmzJlSnUy7ceMGtbW1uWvXLhYUFLBjx47FJhJfvXpFe3v7YkGFimj//v00MTGR7rOfPn3KnJwcqVICWfTd7Nu3LyMiIopVqpEfz3v37qWpqWmxVQI7duygTCZ7Y8Wakl7JJd+3ffv20cTEhK1bty5WleLYsWPs3r07u3TpQplMxnXr1r31uFHcv/T0dGlu4OnTp2zbti0HDhyo1HNFnrVe1n2hyP9NPu/du5fm5ubU0tJSOv89ffqUQ4cOpZ2dnXSN+VDvU7qxJHpsZ2RkSJ+XPJhkYmJCmUymdD9YWFjI/v37S9/bspq3Sk1N5ZIlS4qVU5b3NZQHm+TBLmtra6X+Se9Kfp6LjIyUVrlfunSJ6urqSslf8h7j9vb2pdoD7+/k5ORI9xkpKSls06YNZTKZ0n5mZ2ezS5cuH1y27EMT+BVXHCUlJdHd3f2DrxmRkZE0NTWVqjIcOHCAjRs3pq6urlLAdcqUKaVaxjQxMVG6Z1H06NEj+vj4FPvZhyRovT5ej4yM5OjRo9mlSxcGBgZK8zWLFi2ivr6+0rFZ0fn5+bFVq1ZSeUcDAwMOGTKEhYWFnDdvHi0sLKimpkZzc3Pa2NhI1wZbW1tGRUWR/N8qf21t7TcGu6ZMmSKtns3Pz2d8fDxXrVrF6dOns3nz5h8VbH1dVlYWPT096e7uTrIoyXX9+vVSIrGcvb19scSMD/FPqwrlY6GsrCzOnj2bpqam7N69O/X19cu9ao4IdH2gU6dOsUWLFlKpi5MnT1Imk9HLy4sbN26kh4cHjY2NpfryZTFpkZeXRzs7O8pkMqUJG3nZB319ffbv37/YjU1ZTfIrXgB8fX2lgWrjxo05cuRIafDUrVs3mpiY8OjRo8VWdr2+r2+6qGRlZXHFihVUU1NTCnZNmjSJBgYGXLp0aZkMkA4dOsSGDRtKDfnc3d2l+r7ywNvRo0c5bdo0amtrf1AfjpSUFGpra9PBwYGdO3eWgiW+vr7s2LEjx40bx6ioKPbr108pC7IkP/P169ezdevWPHfuHK9du8a4uDgaGRnR3d2dR44cYUhICI2NjWlsbMyePXtKn2lJ7kNSUpKUhSrPZHj8+DH37t3L+/fvs1evXty0aRNzc3N58eJF2tra0t/fX8r2K08PHz6krq6u1PhS8Ts/YMAAOjg4FPsd+UVY8Xs8d+5cGhoasnXr1ly6dCnJoom9hg0b0sPDQ1q9Ip88IovKJcovlGVl3759bNq0KfX09Ni0aVNpcJafn8+OHTtK5brmzp1LPT29EvuM5H+rx48f88mTJ9I5OT8/n0OGDKGZmRk3btxYLAPyXSbVCwsL+fz5c8pkMvbs2ZPXrl3jnTt3aGRkJE2o3rlzh0uXLuWOHTuUPuPJkydz8ODBSuVvKhPF93Tq1Ckp2HXhwgXm5ORwypQp1NDQoLe3NxcuXMjx48dTS0urRAeFlZ28fMmOHTuoq6tb7G+XmprKtm3bFiurUpIJB+/rTef//Px8zpkzh3p6epwxY4bSuYosKhUxbty4d752LFq0iK1bt+b58+d57do1pqWlMTMzk+fPn2dwcDDV1NSorq7OESNGKJXKKolrU2FhoTRxce3aNWpqanL06NHSamcdHZ1ik+rPnz/n8+fPS6QfVHlLSkqSJoEKCgp48uRJamhocMqUKRwxYgQ1NTXp7e3NrKwsxsXFsUuXLmzRogVNTU1LJdAXGRlJDQ0Ndu3alfr6+tTR0SlW6mfOnDnU19env7+/UhnkkpCTk0N7e3uOGTOGsbGxtLGxoa2tLV1dXblkyRI2bdqUmzdvZkJCQrn1Z3z9PODv709dXV0GBARw9uzZ3LFjh/Sz/fv3s1GjRnR1dWX//v2VJvbe53zypjHpgQMHaGxszE2bNhWbyLKwsODFixeVfvd9tyVPUrS1tZXulw4dOvTGKgQlZfXq1dy9ezfJouoVjo6ONDY2LhZI8vPzY8eOHTlr1iy+ePGCGRkZpfJ9CAoKYrt27aTJSvnfRl4VY82aNZw6dWqplVFWLOXZqVMnGhoaUl1dncOGDWNiYiJzc3M5YMAAduzYkVu3bi2z6gvp6el0dHSUJkvj4uLYrl072tnZcd26ddy2bRudnZ1pZWVV7skh/2Tbtm10cnJSmpAtKCjgvXv3aGxszNWrV/Py5cscOHAgHRwcpOP2TcdvTEwMGzVqVKx8+q1bt6ipqVmsX0xpiY6OBulyGAAAd8dJREFUlkqjvXz5kvfu3WN6ejrj4+OlsXpKSgoPHDhAFxeXN05wHz58WClItGjRIjo7O9PIyIjTpk3jlStXmJCQwMaNG7NPnz5csWIF9+/fzz59+rBTp05lOl56/RyXk5PDw4cPU19fnz179lT6WWpqKl1cXOjo6PhRZdTKunRjVlYWzczMaG1tTTs7O4aHh3Pfvn1s06YN3dzceOPGDV6+fFlaeVuWq0bk7ystLY1BQUFK93Rk0YqQ14NdAwcOpL29/QdVDLp27Rrnzp2rNJcxa9YsampqcuHChczJyWFKSgoDAgJoZGRUKj1//klQUBAHDx5MMzMzzpgxg4mJiYyPj2fDhg05aNAghoWF8dChQ9Lx8rHnyQ9N4Jf7mO2HhoayW7duJIsSifv27csVK1YwJCSEGhoanDp1qjTOL81+8/fv35dKz79ezjghIYFNmzalTCbjypUrP2g7iuP1wsJCqSfrpEmT6OHhIfVsPHToEAsKCrho0SKamJgUSxirKBQ/gwMHDrBdu3ZKyWNr166lhYUFx40bR7Jo3HP69GmePXtWGmvMmjWL7dq1U+rLlpuby/3797Nly5ZKwa6QkBAaGBhw9OjRfPjwIV+8eMF58+bRxsaGgwYN+uDymW96P3IRERFs0aKF0v3+jRs3uH37dm7ZsoUDBgygpaVliY5T/m5VoXx+4f79+/T19eWmTZsqRNUcEej6QPPmzZP6Bzx69Ih9+/bl2LFjqa2tTXd3d8bGxvL58+dMTU0ttUmLN03GyMs+GBoacsOGDdIBKy/7IJPJpP43ZUnxID1x4gT19PR45swZxsXF8eDBg2zevLnSCqeuXbtSXV1dyiD4O1FRUcUm8LKysrh8+XLKZDLp4piTk8MZM2aU2YHn4eHBdevWMT09nWfOnGHLli05aNAgpqWlMTExke3bt6eJiQnNzc0/alKnoKCAqampHDBgAG1sbLhr1y6SRUEMU1NTaUBcWuWppkyZwpEjRyo9lpycTAMDA7q6ujI2NpapqalMSEiQTrgldeJVPAYePnzIcePGUSaTSU2V5aU09PT0pOfNmzePgwcPLpfJxDcds/KykvLm2+T/Mrv8/f05cODAf7yxUpzQTUhIYGpqqtRv5MKFC1RTU6OTkxO7desmlWySryTr2rVrmU0ivHz5kra2tgwPD+fJkyelTCR5SZhly5axYcOGbNeuHfX19Ussq13+nT948CDt7e1pamrK5s2b093dnYmJiczPz6erqyvNzMwYHh7+3iuJ3rR648iRI/T392e7du2UzrkvX77k5s2beeTIEU6fPp1aWlofPQj6lJw/f57Ozs5s06YNr1y5wvz8fIaFhdHMzIx2dnZ0d3dXyqIV/t758+cpk8l47tw53rlzR1qVoBggfv78OW1tbaVyDeVN8Tx44cIFRkdHc9++fczPz2dhYSF9fX1pYWHBuXPnFkvMeddkjYyMDA4ePFi6FiQkJHDevHk0MTFhkyZNOHXqVG7evFmpXyRZctcm+X5GRERw2rRpbN++vTSp/rbSvuURcCxNR48epYaGBkNDQzl58mSlm/D169dTT0+PEyZMkMoZ3rp1i4mJiSVeUjo1NZW+vr5SUkVsbCzt7e2pp6dXLNgVEBBQamPEnTt3slmzZtTU1OTAgQOlEufXrl2jnZ1dhSr7Eh8fzw4dOiiVQZU7d+4cs7OzeeTIEdra2tLJyemDjhvFEvCBgYEMDQ2VgttDhgyhvr4+N27cKK1C8ff3Z4cOHT5oJZfc60mK8vuiYcOGScelqakpPT09P3gbr5OX57KysqKfnx/btGlDFxcXymQyBgYGFiubLA/2z5s3r9SSXy5evEg1NTWllUryfjN2dnZMSEgo9cSbEydOsFmzZly1ahUjIyOlnmE9e/ZkcnIyc3Jy2L9/f+rp6SkFWUtbTEwMmzZtKgUhb968SQcHB5qYmNDGxobDhg0rk/5T7+v1a+K6deuor6/P5s2bF7uXlpcwbteuHbt06aLUD03uzp07UlnLzMxM9u7dm87OzkpZ40+ePOHw4cN58ODBMgn8+fr60sfHh2RR8GHZsmW0tbVlq1ataG9vrzTx/6YxwtWrV6UJ4fz8fKlvcWhoKH19fdmzZ0+2a9eOZ8+e5Y0bN+js7MzWrVvTzs6OgwYNKtPPXX78nT9/noGBgdyyZYs06Xro0CHq6uoWS4RMTU1Vmph9120oKo/Sja9evZLmMezt7RkUFMR9+/bR1NSUTZs2leZKymOls/z9PX36lEFBQTQ0NHxjsEse6E1OTn6vz0C+jfT0dDZt2pTjx4+nn58fZTKZ1OZhzpw51NDQYKtWrWhubk4jI6NyWSmxaNEiamtrc8mSJfT29qadnR3btm3LixcvMi4ujg4ODtTS0mLnzp05cODAjz5eyjKB/03f4w0bNnD06NF88OABZ82axZkzZzIzM5M3btyQeqHLEwlKst+8/HUUy/e/ePHijb07X758ybFjx3LdunUfVe5acbw+btw4KWGaLBoveHp60srKivHx8UxLS+OcOXNoYWFRZn3y3sXEiROl85b8O7BixQr27t2b2dnZ0vcxOzubixcvppGRkdIigzNnznDo0KEcMGAAtbW1eeXKFcbExHDbtm0MDw+XkqwOHDhQbGVXYGCgUsUq+XfyYyvTKH6nXl9RPXDgQA4ZMkQaQ0ZFRVFPT0+aSynJ69W7rCpU7HNbUYhA1wcoLCyks7OzVPfS399f+ndkZCRlMhm7du0qTd6WBsWTeHx8POPi4qQb0r8r+yCfWCwvu3btoru7e7FyaVeuXKG6urpSptD48ePfaV/lSydfLw/46tUr6aJQEks339XVq1cZExNDNzc3pSb0Z86coZaWFocMGcLU1FTm5OTw9u3bJdbAMjk5ma6urkrBrtTUVMbHx5dKvXT5Rb1fv37s37+/9Lg8aLJr1y5pcKKYcVDS+0AWZTHExMRw4cKFUskVeX+By5cvU11dnQMGDODQoUPLbbWI4mTGmTNnePLkSWnQHhwczCZNmkglGciiv5Ojo6NSAOxN3jShO3/+fBobG7NRo0Zcv3494+Pj2bdvXw4ePFi68KWkpHDy5MmlvtpU/hk9ePCA8fHxHDNmjBRkTElJkS6Q8oFbXFwcd+/eXeKNdaOioti4cWOuXr2aycnJ3LZtG2UymVQiIj8/n4MGDaKOjs57N4B/0+qNMWPG8PDhw9KE9pQpU0gWfT7ySZMePXpU2pVL8s/94sWL3LJlC+fNm8cTJ04wJyeH169fp5OTk7Syi/zfeeP1ST/h76WmprJv376cPXs2SXLNmjVUU1Pj6NGjuXPnTp48eZJOTk60tbWtEJNyioN2f39/mpmZ0dzcnJqamrSxseGJEydYUFDAadOmSf0mX09KeJebyfT0dBobG9PLy4tr166lgYEBHRwc6Ofnx6VLl1JTU5MXL17k/PnzKZPJpAbnJenMmTNSz4KTJ08yJiaGenp6dHNzK7VJ9YomKiqKampq1NbW5qZNm5R+tnbtWurq6nLy5Mml1o8qNTWV6urqNDAwUCoPfOHCBXbr1o16enol2ofrn9y5c6fYKhl56ZTSKtH7TwYMGFDsOxgXF0c9PT1eunRJeiw3N5cPHjxQCgIoltT7kPPLvn37qK6uLq2u6tatmzTx4OHhwXbt2klVC1q3bv3RE51/l6QoD0LPmTOHnTt3LtGVVIrlueTB7WHDhrFt27YMDw8vlmwUEBDAu3fvltj23yQwMJBqampcvny5tJo0MDCQbdu2LZVVZIrfk8LCQo4bN67Y6rn4+Hhqa2tz7NixJIsmdtzd3Us1QXH//v1KK5XS09Pp5ubGqVOnKl1rUlJSmJaWpjTZWlEo7ueGDRukcf2ePXtoZmZGV1fXYhPj586dY1xcnHTcKlYakCeFtGnThuPHj+ezZ88YHR1NW1tb2tracvXq1YyIiKCzszO7dOlSan8T+eteuHCBjx49YmBgIE1MTPjXX3+xQ4cOUvn1DRs20MDAgPv37//H1zx27BjV1dUZEhJCd3d36R6ALBqvjh49mtbW1kxJSeGrV6/4+PFjqbx6abzHN1FcfdqsWTOp/4qHh4eUCHb48GHq6OgoTba+D8V5pKysLGllTGpqKtu1a1cupRuTkpI4YMAAdu/enZs2bWJ+fj63bdvGR48elfmEuvwzkAd7yaJzw5uCXfIyhq8nXb+vhQsXskePHjxx4gTHjh0rBbvIonmOsLAwRkZGlvj98bu4ffs2hw8fLs01kOTZs2fp7u5Oa2trPn36lOnp6Xz48CGfPHnyQcfL2xL4Bw8eTGNj41JL4H/9WJB/3q9evWJiYiJv375NS0tLqT3GpUuX2K9fP549e7bU7qsOHTpEGxsb2tvbMzg4WCpnPHnyZOmeJSkpifPnz2fnzp1LJHlbPl7X0tIqNqd64cIFtm/fXurB9vTp049KOippiYmJtLe3Z9u2baX5cPk4w8bGRnqefI7h0aNHlMlkStcMeZWtefPm8datW5wzZw5NTEzYvXt3du7cmU2aNGF4eDgLCwu5b98+amtrK7WeeH2MU5KWLVvGsWPHSucDsmie1draWqkHVkpKCjMyMkrsevW+qwpf/96UNxHo+kBnz57lzp07pQnkv/76iwUFBdy9ezc7dOigVCqspL0+UWRqasrWrVtTJpNx4MCBvH79OnNzc9m/f3+am5tzy5YtxW6iymPC68GDBxw2bBg1NTWVmj7LTzrz5s2jra2tUgYDWXxf5e//4cOHvH//Ps+fP8+QkJA3HmArVqygmZkZW7VqpTRQLS27d+9m8+bN2aJFC8pkMi5YsEDp57GxsWzdujUdHR1L5QIhD3bZ2dkVW8JcWiUqd+3axYYNGypNIpHkX3/9xT59+rB58+Z0cHAotUwseRaora0tjY2NuXXrVmlll3zp/6ZNm9i3b196eHiU+eqZyZMnK2VF+/r6smXLltTW1maLFi2krO7p06dLATlPT086ODjQwsLiHy9Sb5vQnT17NhctWkQNDQ0+f/5cqUlkWZcsk9f319PTo5qamlRqjfxfsEtNTe2Da3m/C29vb6kpblJSEk1NTTlt2jQmJiZK283NzeWIESPee4LpXVdv+Pr6kiwaSCcnJ5dq49qKYO/evdTS0qKDgwNbtWpFQ0NDurq6MiMjgwkJCXR2dqaZmVmxzFHhzd52Dl+wYAF1dXWl71N4eDi7dOlCDQ0N2tjY0NnZucJloIeGhkolb8mifm1qamrSuVIe7NLR0fngINTWrVupp6fH1q1bc/78+dI1KCoqit27d2daWhpfvXrFwMDAN2aqfaylS5cWm4RKTk6WjgP5pHqnTp0qVFZkSZOX9vb19S12M75hwwaqq6vT19e31ILcx48fp0wmo4+Pj9L4Mi4ujj169KC6uvp7Z2B/jPT0dKmv6dChQ6XM0fJy+vTpYvcI0dHRbNy4sXRTrTgOsbKyUloJRL7f+FJ+jn/x4gW7dOnCLVu2MCcnh8nJydTT06Otra0U+Dx79izXrl3LHTt2fHRD63dJUnRycuKCBQtKfHyuWJ5Lvrq2oKCA7u7u0kryslpZL/fq1SsuW7aM6urqbNOmDS0tLWlgYFBq30X55y5fbWxjYyOtzlFMFtq6dSubNm1a6iscCwsLmZSUxCZNmrBDhw50dXXljRs3mJ+fzwMHDlBTU/OtpcHKq6/vmyjuS0pKCps1a8bu3btLQYpt27bR0tKSQ4cOfetnq3h8r1mzhtra2ty+fTunTJlCGxsbqQrGhQsX6OnpyWbNmrFbt250dXUtlXL05P++L6dOnWKTJk0YERHBEydO0NnZmc2aNeOoUaOkZNLCwkLa2tq+c0+5qKgoymQyqqmpKQW6yKJzjqGh4RuDZmU5Po2JiaGWlhbXrl1LsmgVtIaGBkeNGiUlSxw5coQNGzbkgAED3uu1Fd/H0qVLOWDAABobG3PixInlXroxKSmJrq6ubN++PW1tbWliYlLmQeXXq4C0b9+eCxYs4MOHD5mVlfXGYNfcuXPfK2HnbavpjIyMGBUVxfT0dI4cOVIpcbe8HDp0iDKZjM2aNZPaLMjFxMTQwMBAmm9R9D7nBMXnRkVFMSIiQuoTl5mZSScnJ1pYWJR4Av/fHQvHjh2T9sfY2JgJCQnMz8/n4MGDpR5PZMnfV8XFxVFTU5M+Pj50cnJix44d6evrK1Xqka/INTY2ZqtWrUr0mi0fr8+YMaPYCqI+ffpw+PDhFer6p+jMmTMcOHCgUi/wEydOsGHDhly+fLnScxMTE2ljY/PWlZHh4eFS9TGy6B5VXV2dBw4ckBYo7N+/Xyl5qSRX9cn/xvLXmzVrFnv27El1dXWOGjVKCjhbWVkpJQwpbv9jPqfyWFVYGkSg6yOtXLmS5ubm0v/9/Pw4bdo0pZqxpWXFihXU09NjdHQ04+Pjefz4cerp6dHBwYEPHz5kdnY2XVxc2KpVq3JpWPm2sgEjRoxg8+bNiw1IFy9ezN69e//tayrWde/YsSN1dXU5c+ZMPnnyhPPmzaOamhrDwsKk582ZM4ebNm0q1ti+NKSmptLR0ZHh4eG8dOkSBw4cSGtr62IZPidPnqSJiUmpZREnJyfT3t6eXl5eZTIoT09Pp6enJ7W0tBgeHi6VTnBxcWFQUBBv375NPT09durUqcRXr1y5coW6urrctm2blHUlz8aRB7vk37Pc3NwyXy2SkJAg1TaOj49nbGwsDQ0NGRsby8jISHp6elImk0mDqd27d9PBwYHDhg2jr6/vO5d6fNuE7vHjx2lvb680aVNWN2qKq+2MjY05f/58hoaGUkNDg0OGDFG6GKakpNDb25taWlp8/vx5ifXIIYsGoPn5+bS2tmZYWBgzMzNpYGAgrSqNiYmhpqamUub6h3iX1Rvt2rWTakJXRorfrWvXrtHExIRbtmyRlu6HhYXR2tpaWlJ/4cIF9ujRg9bW1szKyhJBrnd0/PjxYpOAlpaWSoPdp0+f8tatW7x3716FzEAfM2aM1NcnIiKCWlpa3LhxI8+cOUM/Pz+SRcduaGjoR91EPn36VCm4kpOTwwEDBrBfv37S3yU9PZ1Lly4t8QH6pEmTaGdnJ/1fPpEdHR0t9e2MjIysUFmRpeX48eNUU1NjaGhosWDXpk2bSn1SW3H7iqvoY2Nj6eTkVKZlA7Ozs7l582b26tWL06dPL7cbw9DQUKUJkpCQEFpZWUn/HzJkCLW1tZX2Lz09nba2tsUSm97XsWPH6OnpycGDBysFGR8+fCgFu0pjtfk/JSmOGDGi1Hq3Kpbnsra2Vgp2dezYkatWrSrzYBdZNE7dunWr1NO2pClO/sgDiqdOnaKnpycdHR2l1Qnycd+OHTvYsWPHMrmPJouSMPfv309ra2u2bdtWKrner18/TpkypUJdN/+Or68vnZ2daWpqysaNG9Pc3JzXr18nWRTssrKy4vDhw5UqjbzuypUrHDVqlNRPjiwKsNja2nLgwIHSSr/Hjx/z1atXpT62uHDhAqdMmSK1ICCLruHya6b8ePH396eJicl7rXSRrwYJCAgoNqHbqVMnpQoz5WHKlCmcMGECyaJxjKOjI11cXKijo0N3d3dp5euxY8fe6/qleH+1ZMkSamtrc/ny5Zw5cybt7e1pYmLC06dPl2vpxuTkZM6bN48eHh7llgRy/PhxNmnShDNmzKCnpyebN29OT09P3rt3j9nZ2Vy2bBnbtGnD4cOHf/A24uLipGRXudGjR9PKyoqZmZlMSUmR+o+/axC3tEydOpUymYyLFi0qdp3q2LEjFy5c+MGvrXjvN2vWLLZo0YL6+vps1KgRt27dSrIo2NW3b19aWlqWWAL/3x0L3bt3Z9u2bRkREcGnT5+ycePGNDMzo5mZGa2srEo8wK/4N4iIiJDaTJBFfxNzc3Mp2EUWlTQ9cOBAqcwlHj9+nOrq6ty5c6fSvNmAAQOUSr1XFIqfwZkzZ+jq6so2bdpIQarp06dTU1OTgYGBfPDgARMSEujq6soePXq8MfG7sLCQkydPlu6p9+3bx2bNmnHTpk1MSEigp6cnU1JSmJOTw5MnT5b4+VDx/dy+fVv6DPLz83nw4EE6OjrS0NCQzs7OnDlzJi0tLUvlPqI8VhWWNBHo+ki7du1i06ZNuXDhQk6cOJEtW7YskxUjOTk5HDhwIFetWqX0eHx8PJs3b87JkyeTLLowzJw5s8yzuBUP0hMnTnDdunVS1r58IG1raytd4F+8eEEnJ6d3KuETGRnJpk2bSq8pH9hev36dq1evppqaGh0dHdmvXz82b95cGuiXpgsXLtDJyYmurq5S+ZlHjx7Rzc2Ntra2b+whVpoePXpULBugND19+pTTpk2juro69fT0aGZmRltbW+nmITExkW3bti3xCYRt27bR1ta22MqYGzdu0MvLSxqYlUegVy4mJoYuLi40MzOjp6cnFy1aJP0sOTlZCnbJs6ReHzS967H7tgnd/v37l1kAITo6Wqm/SkJCAqdNm8ZJkyZJj505c4bq6upSfyy5R48elXjppqioKGk1yLRp0+ji4kJ9fX1OnDhR+rseOHCAJiYmH12q531Wb5RGWaDyNH369GI3YXv37mXnzp2ZlpYmTYJkZ2czJCSERkZG0kqe2NjYcinD8amKjo6mvr4+tbW1GRISIk1aBQUF0cnJSZoAev2YrygZeAUFBczMzKSZmRm3bt3KCxcuSM3lyaLSEY0aNSqWFPExY5gHDx7Q3d2dffr0YZcuXWhtbV2sZ2VpnCMjIyOppqbG7du3Kz1+/PhxWlpaslOnTmW6kqi8RUVFsWHDhkq9mMpr+4rXqfIILpBFx0J5BffPnz9PNTU1jho1SppI3Lt3L7W1teno6EiyKAHFwcGBmpqaXLFiBVetWsX+/fvTxsbmo+8pIiMj2bBhQ6qrq0sBLflrpqSk0MjIiGZmZlICSkn/ncozSVG+YsHW1lYKKMjLy1XEiYKPoRjkioiIkPqaREVFcffu3TQ2NuacOXOUJut8fX3Zq1evUl3x/qa+G2RR0pinpyfV1dWpr69PY2PjT2K17fr169mqVSueO3eOt2/f5u3bt6UkO/k98Pbt26mrq8t58+a98TWOHj1KCwsLamtrFxvPrV+/Xuq783pQpbTOYWlpaRw4cCBlMplUjUF+jnjx4gVXrlxJCwsLurq6fnBZU3kZwx07dkjXgZcvX9LKykoq0VXW5MdM79696efnx5ycHM6aNUsKeq1bt04q86oYkHxfN2/e5KhRo5R6t166dImjRo2ihYUFHzx4wMzMzHIp3UgWfdaK5TTLUmpqKgMCAqS+W2TRfIOenh49PT2ZnJzM7OxsLliwgBYWFnz06NF7byMjI4O9evWiTCajl5eX9DnEx8fT3t5eKpOXmJjIKVOmlEtCTFpamlIPI29vb2pqavLAgQPSZ/PixQva2tqWSB/FBQsWsFWrVjx16hTv3r1LZ2dnymQypWCXs7MztbW1S3Re523HwujRo2lpaclnz57xwoULXLZsGUNDQ0u837z82IqKiqKvry8dHR2VVguSRWMUc3Nz+vn5lck16ejRo1RXV+fMmTMZGhrK6dOns3nz5hVuxc6b+jafOXOG/fr1Y5s2bXjx4kVmZ2dz3rx5bNq0KZs1a0YzMzN27979jYF7+b2nu7s7Q0NDGR0dTU1NTWkuKTo6mo0aNSrWv7Y0zosBAQE0NjZmhw4duHjxYun+Xt6Wxs3NjWZmZkoVSUrqelyeqwpLkgh0faRnz57R29ub5ubmdHBwKLV+K69PUqWnp7NVq1ZS+ZDCwkLpgA0KCqKurm6xC29ZBbsUDzI/Pz+amJhQX1+fc+bMkX529epVDhs2jOrq6uzYsSOHDRtGW1tbKWr9tgM1NzeXY8eO5eLFi0kWDRQ2bNjAXr16UVtbmwEBATx+/DidnJw4cuRIpfrSpaWgoIARERE0MzOjtra20gROSkoK3dzc2LVr12LLZstCWU5uFhQU8Pr16zxw4ABjYmKk75s8qFcaA9agoCC2a9dO2ob8e5OcnCzVy546dWqxnhhlQfF4O3HiBF1dXdmwYcNiWYLJyclS3duPHSj+3YRuaX4XCgsLGRkZyWbNmknBqqysLI4ZM4YtW7Zkjx49lJ4vD3YNHz68VI/RmTNnUktLi5mZmdyzZw9btmxJW1tbpbKyc+fOZdeuXZUmPj/E57p6Iy0tTSp3omjhwoU0MjKS/i8/t+fm5rJp06YMDg4uy938ZL3puL1+/TqDgoJobGxMa2tr+vr68ty5c1L98IrkbecdHx8ftmvXjhoaGtJNLFk02S6/sSwpOTk53L59O8ePH8/g4OASv0l9m6ysLHp7e7Nly5ZKN+pz586lt7d3pS9d+ibyXolLly4tt2CXfPsfe87/1O3bt4+GhoYcNWqUlKB35MgRtm7dWqqukJ2dzalTp9LCwoL29vYcMWLEB2X1v2lMf+LECWpqanL48OHSxI38fPHgwQO2b9/+o8sVvk15JSnKycuMm5mZ0cHBgXp6ehVuAqkkyD/33bt3UyaTMSIigv369ZOS/2bNmkVjY2N26dKFnp6edHd3Z/PmzUu1d+nrfTeaNm1aLGn05MmTnDJlCp2dnStMksjfmT59ulSGUy43N5fW1ta0traWxtmRkZHScfumY9LX15fNmjWjh4dHsf7R4eHhNDExkVZcl7b8/HxGR0ezZ8+e1NfXl5JC5J/H0aNH6ePjw6VLl/L27dsfvB15cs3IkSPp7+9PZ2dnWlpalvtKvh07djAiIoJxcXHs168f9+zZQ7Io4NK2bVt6eXl9cIuMu3fvUiaTUUNDo1iw7Ny5czQ0NORff/1V7Pcqe9WFwsJC3rp1i40aNaKurq5UNlJuy5Yt1NPT4/jx45mUlMTs7OyPGqu+fPmSUVFRUnlEBwcHRkdH09raWupTSJbO/Mk/WbhwIW1tbZXGryQ5duxYamhocPz48VKpvw89XhTPrQ8ePGCPHj0YFRVFsuh72KZNG7q4uFAmk0kJY5mZmfTx8SmxOc13ORbetIK9pOdUIyMjqaGhwa5du1JfX586OjrFkkDnzJlDfX19+vv7l0milLzst6GhIX18fMpkTvV9vF62Nz4+XkoWkrdHaNOmjZQQmpyczMOHD/PixYvS7yquWPP19aWZmRlzcnK4ePFi6XuhODd3+fJlWlpalsp4UfHz3LlzJ/X09Lhx40a6u7vTwsKCM2fOLJYQHh8fL91Pf2wSdUVaVVhSRKCrBOTn50vL+UqD4oF86NAhrlu3juHh4Rw/fjxdXV2lVTLy5y1btowODg6lsi/vY9WqVdTR0eH58+dJkk+ePGFSUhJPnDjBly9fMiUlhcOGDaO2trZSL6u/Ky+Xk5NDe3t7jhkzhrGxsbSxsZFKKsj7bNy6dYvZ2dllOjDIysri/v372apVK/bt21fpZykpKezTpw8dHR0/u4mV15cCl7SLFy9STU1NqV9EYWEh79+/Tzs7OyYkJJTLwPxNN8ZXrlyho6MjtbW1i5UOSU5O5pAhQ9i9e/eP2m55TejKyYPrSUlJLCwslIJ4zZs3l8qUyZ05c4YymYxjxoz56JKSip+x4r+vXr3KTp06SYPUxYsX09jYmHZ2dvTw8ODgwYOppaVVIpMqn/PqDfnnFxkZKfU7uHTpEtXV1ZVWMObn5zMtLY329vblusryU/F6hlpERAQjIiKk60hiYiK3bdtGY2Nj9u/fn9ra2rSysvqg7NLSoLj/MTEx3LVrF/ft28cXL14wLi6O7du3Z+fOnaVEhBcvXtDV1ZWurq6lft4uq8Sfp0+fctKkSVRTU6OpqSltbGzYqlWrt9aF/xwcOnSIrVq1KjaR+rlsv7wpjo03bNhAAwMDjho1Sgq0HD58WOolK/f48WPm5OR8UFa//HfOnTvHZcuWMTw8XLpvOXLkCJs0acLRo0dLSSBl0UO0rJIU/869e/c4b948Dhs2rFy2X1b27NlDmUzGLVu2kCS7desm9eYii1YaTZ8+nY6Ojpw2bVqpJqa9re/GoUOHio3PFMelFTXYJT+2+vXrx169ekmPy/d9165dlMlktLe3Vwoav35/rDh/4e/vTzMzM/r5+RW7Zz148GCpHZfy95KTk8OXL19K25FPLJqYmJTaPbQ8Ia1z585K905lMU6Qv+/ExESePHmS4eHhfPbsmfR4UFCQ0r2hj48PfXx8PjpRJCYmhjKZjP7+/sVKN1pbW7915V9lpTjmnDdvHmUyGSdMmFAsOXHbtm1UV1cv0bKmaWlpvHjxIp2dnens7Exzc3Np5Wt5mDdvHnV0dLhp0yZGRkbyxYsXSufDGTNmSKsKFUvZfejf48CBA1L5/1OnTvHevXscPnw4ly9fzkePHtHW1lbq86r4OZXU8flPx0JplzFNTU2lr6+vlKgYGxtLe3t76unpFQt2BQQEfHCA+0NERUVRT0+vwiXmKX4PAgICaG1tzaZNm7Jt27b09PRkeno6ExMT6ezszLZt2/LkyZPFXkPx+3Px4kW6urry1KlTLCwsZFpaGocNG0ZNTU1euXKFjx8/5tOnT+ni4kJHR8cSHxMovl5eXh6Dg4OVEnD8/PykYNfr56TExER26tRJmm//EBVxVWFJEIGuT4ifnx/19PTYo0cPdu3alZ6enjQ2NuasWbOkAfqrV6/o7Oz8TiUAS1NOTg7HjBkjHaRxcXGcOnUqdXR02KpVK9rb2/Ply5e8evUqR40aRQMDg3euP7xz5042a9aMmpqaHDhwoFT+8MaNG7S1tS2zXguJiYk8evQo9+/fL5WGOHDgAFu2bElnZ2el5z569KhCR7w/ZYGBgVRTU+Py5cv5/PlzPn/+nIGBgWzbtm25lIhTvFht2rSJPj4+HD58OB89esTTp09LNfRfD3Y9fvy4VG6my+JGTXFi6vbt25TJZFywYAHz8/P58OFDjh07lhYWFkplIMiiia+SymJ+28q1gQMHslu3btL/d+7cyRkzZrBv37709fUtse1/7qs3rl27xrlz51Imk0lNiWfNmkVNTU0uXLiQOTk5TElJYUBAAI2MjEqlF0hlNXv2bLZt25YGBgbU0dFh69atler65+XlcePGjRw8eDB79OhRIbJuFffBx8eHBgYGNDIyooGBgdTUed++fbSxsWGLFi3YqVMnWlpaltkq1LKUk5PD2NhYrlixgtu3by/Tm9SKqiz6plbk7ZcXxePS39+fEyZMYKtWrSiTyThs2DApY/fw4cPU1dVVCna96TXedXt79+6llpYW27VrRyMjI/bv3593794l+b9gl6enp9LNc1kEu0szSfFd96G8ynOVhezsbI4dO1apcfmgQYM4depUpecdP36cycnJpf6Zv63vxvXr19+6QqYiXE/l3nZN3LFjB42NjZX+zmTRcTdgwACamZmxZ8+exV5jzZo1HD58OE1NTTlu3DjGxsaSLMpst7CweGOwiyz5+wrFHm7u7u5s06aNUj+YCxcu0MrKSinY9Xr54Y915MgRpfLjZRnk2rdvH83MzGhpaUlTU1O2bNmSYWFhJIuSl5s1a8atW7fS29ubLVq0KLGWDPJePLt27ZKqUMj7MG7evLlEtlHRve37I0+eDgoKKpYUs3PnzlKba4qKiuLChQtpYGBQLvdJt27doqWlpdRu5NatW1yzZg07derE7t2788KFCySL2gE0adKE69at+6ix+qNHjyiTyThnzhyGh4czMTGR69evp6enp5QAMnjwYNra2pZKgEGuvI6F1NRUqqur08DAQGnl2IULF9itWzfq6emV+/xhWfXL/BDyKmZ//fUXY2Nj6e/vTwsLC7q4uDAzM5NXr16lq6srmzRp8taEIvmqvqZNm0ptFUhKq2nV1dVpZGRES0tLdu7cuVT7swUFBdHDw4Nt2rRhYGCg0vP8/PxoaWlJX19fpZVdd+/eZevWrYslWr+viriq8GOJQNcnYvfu3TQ0NGR8fLxSVsXKlSupoaFBMzMzOjs7087OjpaWliU+APwQnp6eNDU1ZUBAALW1tens7MzQ0FCpzrG8Lrq8JnTjxo3fOcv/zp07xbL+5s2bRwsLixLv8/Mm+/bto56eHi0sLNi0aVPq6elx2bJlJP8X7Orfv3+p74dQNGG1bNkyqqurs02bNrS0tKSBgUG514udNWsW9fX1OXLkSA4bNoz79+8nWZQ51K9fP5qZmb2xKXRlmNydOXMm1dXVuXTpUhYUFPDevXscO3Yszc3Ni5WI+RhhYWEcOnSo9P+YmBi6ubnxxo0b0kTmrVu3aGRkVKzefmlcoD/H1RuFhYVMT09n06ZNOX78ePr5+VEmk/H48ePMz8/nnDlzqKGhwVatWtHc3JxGRkaV+u9R0tauXUtdXV2eOXOGDx484PXr1zl48GBqa2tL/WsUvaleeVlTPK6ioqLYoUMHnj9/nqmpqTx37hwHDBjAli1b8t69e7x37x43btzIefPmccuWLdLkUnmXDRKEymzNmjVs2bIlT548yYSEBP711180NTXl6NGjpUnUI0eOUCaTccqUKR+1rejoaDZv3lwqA7Vs2TI2btyY/fv3lyYLIyMjKZPJ6O3tXSnGQML/vF5a3NvbmwMGDJB+7u/vT5lMVqq9Ot+174Y80FMRKR4XkZGRXLlyJUNCQnjmzBmmp6ezf//+tLe3l/pdPnr0iP369ePMmTN55coVNm/enDExMdJrzJ49mwYGBgwMDOSePXvYsGFD2tvbS6WffH19aWVlVWaJWocOHaKmpiYXLFjAQ4cOccyYMZTJZFImflxcHG1sbNi8efNS62VXmj073yY2NpbNmjWTVnPIS++Hh4czIyODt27doqurK9u1a8euXbtKPQ1Lirx046hRoxgQECCVoqvMAXg5+eccHR1Nb29v9u/fn6NHj5aSMBYuXPjWYFdp7YtceSXj3Lx5k9bW1tyzZw//+usv2tjYsFOnTvT29mbHjh2VWhHIe3aFhoZ+UDBE/p59fX3Zr18/JiQkMCcnh506deLcuXNJFgWbnJyclJLhS2uMUF7HgrxEoI+Pj1IpzLi4OPbo0YPq6uqVtiLMhyosLGRqaip79uypFCDMz8/n5s2baWpqyqCgIJJFZbJnzZr1t8kL8lV9s2fPVloxlZ+fz4iICIaHh3P//v0lfo+q+F1evHgxtbW16ebmxnbt2lFPT69YsHv27Nls3bo1V69eTbKo/Om6deuoq6vLO3fufPB+VORVhR9DBLo+EYsXL2bv3r2Zm5vLwsJC6UA7duwYZTIZQ0JCOGHCBC5fvrzMy5W97YITGxvLgQMH0tjYmMHBwVLZhJSUFFpZWUlZIWRR5sL48ePfq852eno6Z82aRQ8PDw4dOpTa2tplEtyIi4tjq1atuHbtWqkhoJ+fH9XV1aUVKwcOHKBMJuOQIUNKfX+EIgkJCdy6dSv37t1b7qtFoqOjaWJi8sYbkvv37zMmJobOzs5s1qzZJ9+XQT5QffnypdLN5+zZsymTyZSCXV5eXtTT0ytW9/xD5OTkMDAwkAYGBtLy6jVr1tDKyorNmzfnuHHjeODAAebn59PDw4OTJ09W2t/S8rmu3li4cCF79OjBEydOcOzYsVKwiyxabRsWFsbIyMhSncyqDF7/fnp6ehbL6nr58iV79epFGxubN5b9rCgTxXv27JFKhCpKTk6mo6MjnZycpElQRWVVVlAQPlceHh7FAliHDh2igYEBhw0bJo1LYmNjP/p4HD9+PGfMmEGy6Nzl4OBAZ2dndu3alf369ZPKGB47duyTHw8Jbye/tvn4+Eir7OfPn09NTU0p8bE0vE/fjYrWg+RN/Pz8qK+vz86dO9PU1JQymYxhYWG8c+cOPTw8qK2tTW1tbZqamrJTp07My8vj5cuXaWFhISWIxsXFsW3btlIJx7i4ODZu3JgHDx7k+fPnpbG8p6cnR40aVeLjZvkYpbCwkIWFhXz+/Dn79u0r9bJOT0+noaEh58+fz8TERGmS+9SpU+zZs+dHTej9k7JOEF69ejXHjBlDsiiJ18TEhN7e3rx//z4nTZokBVgePnxYan0tT5w4IZVuVBxvfg4JRwcOHKCmpibHjh3LESNG0MzMjDo6Ojx8+DDJoiRqdXV1BgQElGn7ibL+Hp49e5Zk0T2spaUlDQ0NpUQX+equ9evX09XVVSkI5+HhQV1d3XcKPr/tPcnLSZ86dYok2bNnT06ZMoXHjx+nq6sr7e3t/7a3YEkqr2Ph+PHjVFNTY2hoqFJQNTY2lk5OTmVWrepT8vDhQ+rq6vLQoUMklUvyDhgw4I1tfP5uPCsPOIaGhv7tsV4a96i3b9+mt7e3dBzGxcVJK/penzcJCwtT2ofbt29/VCD0U1hV+KFEoKuCk5/QJ02aRDs7u2KPX716lTKZrFjD5rKaKFKcUNu8eTMnT57MoUOHctGiRUqN/vLy8piWliZlnTk4OBSbjHvfPj3Z2dncvHkze/XqxenTp5f6DbL8bx4cHExXV1eln6WkpHD69Ols27Yt7969y5ycHB48eFBcmD4Tr3+XIyIi2KFDBz59+lSprN+FCxfYqlUrPnnyhKdOnSrRhqrlQX5MHDp0iHZ2dlJJVbnXg11JSUmcPHlyiQV/nj17xpCQELZr106pFM66des4bNgwamhocNq0afT29mbjxo3fuIJOeH9vutGIjo6mkZERo6KimJ6ezpEjR1Imk/HgwYPlsIefJsXzyJ07d5iVlUV7e3ulJvPy52zevJl6enoVKpCquP/5+flSfXNzc/Niz129ejXbtGlTrNa4IAilJz8/n/n5+ezbt690rc7Ly5PO6UuXLqW6ujoHDx6slHj2PuMU+Xng/v37zM7OppubG6dMmcL09HT6+vpy4sSJzMvLY0BAAGUyGY2NjaUJd6Hykn8vwsLCOHjwYC5cuJAaGhpvXJlcUsq770ZJeL1BvYGBAWNjY5mbm8sHDx5wyZIllMlkUsnsW7ducdOmTVKFFE9PT6nai7w06IkTJ2hjY0OyqLyhpqamVCqve/fuSr1VFYNSJSEtLY3btm1TWiUmX8Vx4cIF3r9/nwYGBvTy8mJhYSGXLl1KJycnvnr1igUFBW9MjvmUyP+OSUlJzM/P5+TJk+nq6spnz57RyMiI3t7eJIsmHxVXepW26OhoKWH3c1jNRRbN3VhaWkqrI8ii76KTkxP19fWlyd3p06dTW1tbabVNZXLhwgWp5QBZNL924sSJYsnnjo6O0v2I4pjgffsCb9u2jXv37lV6bNiwYVJAKzAwkIaGhmzTpg179uwpfR/Lar6kvI6FqKgoNmzYsFigRV5K8XP2pmtzeno69fT0pEQq8n9zyf7+/hw4cOB7f2cUP4PSWjn8ujt37lAmk7FZs2ZKffn+KdBUksHXyrqqsAqECk1FRQUAYGFhgcuXL2PVqlVKj+fl5aFRo0aoWrWq0u+9/v/SUqVK0Vdo9uzZmDNnDrKzs5Geno7Vq1ejS5cuSE9PR3Z2NubMmQNLS0s4Ozvj6dOnCA0NRZUqVVBYWCi9VvXq1d9r2zVq1ICdnR1WrlwJLy8v/P777yX63l736NEjAMCdO3eQnp4OANL+//jjjzA3N8fDhw+RlJSE6tWro23btvjPf/5TqvskVAzy4+DkyZPIycnBq1ev8PDhQ6iqqqJKlSrIy8tD1apVIZPJQBJXrlyBtrY2PD09UbVqVRQUFJTzO/gwKioqOHnyJNzd3dGsWTP8/vvvOHLkCPr06QMAGDVqFPr164fAwEAsWLAA//rXvzB+/Hj8+uuvH7VdkigoKMA333yD5s2bw8TEBGvXrsX06dMBAD169MD06dOxevVq3Lt3D48fP0Zubi527tz5yf6tKxIVFRVcvHgRUVFR0mM6OjrQ1tbG7NmzUbVqVYwePRp2dnZwc3PD0aNHy3FvPw0kpfPI3LlzMXPmTLx48QL169dHQkICbt++jcLCQuk5X3/9NX744Qd88cUX5bnbSuT7Fhsbi6pVq2LWrFno1q0b0tPTERwcjFevXknPbdCgAerWrVtOeyoInwfFMTZQdG9QtWpV6OjoYNeuXbhy5QqqVasm3VPUqVMH//d//4fvv/8eDRo0UPq9v7Np0yacPn0aQNF54ODBg3B1dUVycjIMDAxgYmKCW7duSf+vVq0a/v3vf6Nhw4Zo3bo1vvnmmxJ+50JFI78+fPvttzh06BBWrFiB9evXQ0NDo1S2l5SUhK5du+LkyZNQVVWFiooK6tatC2dnZ7Ro0QLdunVD165d0bdvX6SlpSEkJKTYfWl5unnzJoCi8VZubi4A4OrVq9DR0YGWlhZUVVXx888/w8HBAU5OTpg7dy5u3bqF//znP+jUqRO+/vprTJw4EcnJybhz5w78/PxQs2ZNAEWfxdOnT7F8+XJ4eXlhzJgxcHBwkH727NkzaT/kfxP5OeJjpaamYu3atdiwYQMiIiKwZ88e5OTkICsrC8eOHUPv3r1haGiIqVOnQkVFBVWrVsX9+/el8Y/8PXyK5H/Hw4cPw9XVVboXfPToETp06AB9fX1MnToVJJGRkYF69eopnYdLk46ODpYsWQJ/f38EBwdL8xyV2YsXL5CVlQUdHR0AQEFBAapXr47AwEBUr14dixcvBgCMHz8ee/bsqbTXqT///BMjR45EUFAQFi5ciBo1akBXVxe5ubmYN28e/P390bdvXzx//hyTJ08GUHRekN9Pf//99++8rWfPnmHTpk0YNmwYPDw8EB4eDgDo3r27ND8yZMgQLFu2DMuWLcOaNWugqqqK/Pz8MpvbLK9jwcDAAEFBQfD398eGDRvw4sULAEXznZ+z3NxcpfvLU6dO4erVq6hduzacnZ2xceNGLFu2DEDRXHJ+fj7OnTuHX3/99b2/MwYGBli2bBnmzp2LsLAwpfvW0vLvf/8bK1euRGZmJs6dOyddf5s2bSrNmRkbGytdlwGgWrVqJbYPenp6CA4OxqpVq7Bjxw48f/4cANCkSROMHDkS2trayMzMLLHtlZlyDbMJ76ywsJDz5s2jmpoaFy9ezJs3b/Lu3bscOHAg+/TpU65ZaCdOnGC7du14/vx5aV9Pnz5NMzMzqZF1bGwsQ0NDuX379k+yB8eePXtobGzMp0+fMiwsjBoaGlLNd8XsLCsrK7Fq5DMVExNDExMTpqSkMCsrix06dKCDg4NSNpA8e0y+PP9Td+fOHS5atEgqN5Kdnc39+/ezVatW7N27t/S8qVOnskWLFiWeDbd792526NCBQ4YMoaGhIVu0aKG0oowsyvi5c+dOmaz6/FxkZGSwV69elMlk9PLyYkREBMmiPhj29vZSyY/ExEROmTJF/N3fQ3R0NG1tbXns2DGSRcdYy5Yt6erqyqtXrzI7O5vPnz+ns7MzhwwZUuEawb6eGZqTk8MJEyawe/fuXLhwIVNSUpiUlMS+ffvS1dW1wu2/IFQWivcFUVFR3LZtGwMCAnjv3j0+fvyYbm5u1NbWZkxMDB89esSXL1+yX79+XLp06Xv1+lu4cCG1tbWl1aV3795lr169pL61ckFBQbS1tZUybqdNm0YvL68K3ehcKHn379+ntbV1mYwLyqvvRknw9fWVyuHLs/uHDx9erKIIWdRbpkmTJtLquOzsbB4+fJi9evXijBkzeOPGDW7ZsoWOjo7SSktHR0eqq6tz9uzZ0uvk5OTQ1tZW2m5Jkpc7y8rKore3N01MTCiTybhp0yaSRecHmUzGvn37Kv2et7c3Bw8e/Mmuati+fbvSvEB8fDzd3Ny4Zs0akkXHg729PQ0MDLhr1y6SRWPsBQsW0MzMrMyz6OVl5Eq7J1VFEB8fz5YtW3Lfvn3SYwUFBSwoKKCLiwtHjx4tPV7Zx6pZWVlcsWIF1dTUuHTpUpLkgwcP2KtXLzo7O9Pb27vEWqNkZ2fzzJkzUr/yLl268MCBA1LZzteV1xxneR0Ln9Mx+HcmT56stNrf19eXLVu2pLa2Nlu0aMGjR4+SLFpxqa6uzgEDBtDT05MODg60sLD4qO/pwYMH2bNnzzI97o8dO/bG8pVnzpyht7d3maxorGyrClVIsryDbcK7ycrKwsaNGxEQEIDatWvjyy+/RN26daVsB8Vs77IUHh6ODRs2YO3atahVqxaAopVmR48exYQJE+Dn5wcjIyOl3ykoKCizzIyPlZKSgpkzZ6JFixbo3r07cnNzMWTIECQmJiIoKAh//PEHqlSpgvnz5+PgwYNYu3Ytvvvuu/LebaGMFRQUoGPHjtDR0cGUKVOwd+9eBAQEoFatWvD09ERWVhY2bNiAZ8+eYd26dZ/M9/9tkpOT4eXlhevXr2PMmDGws7MDAOTk5CAyMhKTJk2Curo6goODARRlcZbkcXH37l04Ojpi4MCB6NKlCzIzM7Fz505s2LABmpqa8PHxAfBpnWs+Jenp6bhw4QIWLVqE58+fo169enBzc4Ofnx/U1NTg6+sLoOhaoKqqWs57+2nYvXs3li1bhry8PKxfvx5fffUVAOD8+fMYPHgwateujSpVquDrr79GdnY2tmzZUq7X/jfJyspCWFgYAgICMGjQILi5uSE3NxfTp0/Hvn37QBJNmjSBqqoq5s+fjxo1alSo/ReEymb27Nk4ePAgvvnmG+Tm5uLWrVvw8vJCo0aNEBwcjAMHDuD777/Hl19+CRUVFWzduvWdzys5OTkYOnQoatSogQULFiAmJgZBQUG4efMm5s+fDy0tLeka7O/vj927d2PgwIG4cuUKdu/ejXXr1pV6NQah4snJySmzLPUTJ07AxcUFnp6esLW1xddff/3G51WksWJGRgamTZuGK1euoEaNGsjIyMC+ffsQGBiI4OBgrFy5EpqamtLzL1++jIkTJ2L27NnFjqfCwkJcu3YN+/fvx9GjR/Hrr79i+vTpuHz5MmbMmIE6derAxsYGNWvWxK5du/D06VNs2bKlRLPFs7OzsW/fPmhqauLf//43jh07huHDh+OLL75Az5490bt3bxQWFmLWrFnYtGkTBgwYgFq1auHRo0fYtWsX1q1bB5lMVmL7UxZIIj09Hdra2mjWrBkmTZqEL774AlOmTMHly5cREBCA1q1bAwASExPh5eWFp0+forCwEP/6179w69YtBAcHo1GjRmW+75mZmRWqWkBJIAkVFRU8f/4cNWrUQK1atfD8+XP07t0b9evXx8iRI/HHH39Iz3dzc8Off/6JYcOGSb9bmQQFBaFatWpwcXGRHsvOzsaaNWswd+5cjB49Gi4uLsXOiyV5nszIyEBqairmzJmD/Px8XLp0CU+fPkV4eDiaNGlSItv4WOV1LFTGY/B9XL9+HePGjUNGRgYCAgLw6tUreHh4wN/fHxkZGdi7dy+2bduGFStWQF9fH3v27MHatWtRr149/Pzzzxg5ciSqVauG/Pz8D76WyY/7sjz+jx07BldXV4wdOxbW1tbFKp+UxTjl2LFjcHNzg5ubG7p37/7WMdMnofxibMKHSkpKYnR0NGNjY6Ush7LKQntTZDsoKIjt27eXsuXkz3nw4AG1tLSkuuGfotTUVKqpqVFbW5vHjx+XHo+Li6OTkxM1NDTYqVMn9ujRg61ateKVK1fKcW+FsvJ6dpE8y2LHjh3s2rUrk5KSmJOTw2PHjrFXr15s0aIFLS0t6ezsXOa1pkuS4vH//Plz+vv7U1tbmyNGjFB6Xk5ODvfv30+ZTMZBgwYV+92S2IeYmBi2adNGKdvxxYsXDAsLY8uWLenj41Mi2xP+XlpaGi9evEhnZ2c6OzvT3NycMplMqc608GavHxNJSUkcNGgQZTKZUhNkknzy5AlXr17NhQsXcvPmzRUiA/1tx7RiZujChQtJFp0Tpk+fTiMjI06ePFnqz/G+vTkFQXh3GzduZKtWrXjx4kWSZGRkJGUyGc+ePStljB46dIi7du3ivn373vu8kpOTw4kTJ9LKyore3t5UU1Ojq6sr1dTUOHz4cKU+PC9fvqS1tTU7dOhAa2trXr16tWTfrCC8RXn03fhYqamptLS0pLq6OqdNmyY93qtXLxoZGfHYsWNMTk7m48eP6ezszL59+7KgoICzZ8/muXPnpOvznDlz6OjoyEePHjEsLIzW1tZ0d3dnRkYGY2Ji6O7uTg0NDXbt2pVDhgwplXuUxMREmpmZMTAwkFu3bqWrqysPHjzIKVOm0NLSkgsWLGB2djYzMzMZFBREMzMzWltbc9CgQbx27VqJ7UdZkv/9b9++TV1dXfbu3ZsHDhygv78/mzdvzuHDhys9/8GDBzxw4ABnz57NLVu2VKj+q586xX7SPXv2pIWFBZcuXcr09HTGxcVRQ0ODLi4u3LZtGy9cuEAfHx+2bNmyUvdZ9/X1pUwmk3rzyb169YrDhg2jTCbjvHnzlH5Wmqtbzp8/z+DgYDo5OVXIXolC2YuJiaGLiwvNzMzo6emp1DsyOTmZnp6elMlkPHToEMm3z819jPJYyXns2DFqaGhw0aJFSmPoslRZVhWKQFclUFYT5oonkCdPnkgH38WLF6VSRYonhJSUFHbp0kUqwfSpkjfomzZtGp8+fSo9npWVxY0bN3Lu3LlctWqVGJR+ho4cOcKXL19KN4Y3btygkZFRsYHjzZs3+ejRozIPTJck+bF95swZzp49m2vXruXly5e5cOFC6urqcurUqUrPz87O5qFDh0rsRkG+ffnfLi4ujnp6ejxw4IDS8548eUIDAwPKZDJOmjSpRLYtvJuoqCguXLiQBgYGvH//fnnvToX2+oBc3mD96dOndHd3p4WFRbHzyOsqSrB86dKlXLFihdJjWVlZXLZsGWUyGYOCgkgWTYqPHz+elpaWXLhwIV++fFkeuysIldbr5xVfX19psioiIoLNmjXj+vXrmZCQwCFDhjAzM7PYa7zveSU3N5e2trZs2LChVHZo9uzZbNu2LefMmVPsRj0lJUUc+0KZU5w8qqjlMhVLhiYmJtLR0ZGDBg2ilZWVVCI8JSWFLi4ubNq0KXV0dNipUyfa2toyNzeXgwcPpo2NjfQ6p06dYo8ePRgZGSltQzHYJS8nfu/ePaanpxcbZ3+s/fv3S/8ODg5mq1atKJPJuGHDBpJF9wkTJkyghYUFAwMDpfKG2dnZLCwslMZFn6LCwkIpkefatWvU1NTk6NGjGRkZyYULF1JHR6fYfZNQeo4dO8bGjRtz2rRp9PDwYLNmzejt7c2srCzGxcWxS5cubNGiBU1NTSt1IsbFixd59uxZnjx5ksuXL39jsEseHHdwcCj1if63vX5Fub8Ryp7iZ3/ixAm6urqyYcOG9Pf3V3pecnIyx40bx0aNGnHHjh1lvZulqjxKJ75Ofj3+lJXcunSh3JRVqQV5CZPAwEAcOXIEGRkZGDVqFMzMzODl5QU/Pz+kp6fDxMQEtWvXRkBAAABITT4/VfIGfS4uLvjXv/6Fzp074+uvv0bNmjXRrVu38t49oZxcuXIFAwcOxG+//QZtbW30798f//3vfzFgwACEhoZCR0cH//d//wcA+M9//iMtey4sLCzRkiBlgf9/2fbevXvh6emJ//u//8PVq1dhbGyMbt26oWfPntiyZQtUVFQwYcIEAEXNU9u0aVOi2z979iyOHj2Kb775Bs2aNUO9evWwa9cu/PLLL1BTUwMAfPHFF9DQ0ECLFi1gZmZWItsX/p788zEwMICBgQGcnJw+65IL/4SkdD1dtWoVLl26hJs3b8Lc3ByWlpaYNm0aJkyYIB1TPXv2BFC8ZEF5lVl6vaTZ8+fPERoaipo1a0oN7eX/vnLlCvz9/fHq1SuMGDECEydOhI+PD8LDw1GtWjUMGDCg0pWEEYTyoHheOX/+PBo3bow7d+7ghx9+QExMDCZMmIBRo0ahe/fuSEhIQGRkJGJjY2FgYKD0Ou97XsnNzcWNGzfwxx9/4MqVK9i1axdGjhyJgoICHDp0CFWqVEH//v1Ru3ZtAMCPP/5YMm9YEN6Dvr4+5s+fj5CQEAwaNKi8d6cYxetqlSpV8Pvvv2PNmjW4d+8eFi1ahG3btqFatWro27cvVqxYgf379yMrKwt16tSBkZERMjMz8fTpU2hpaUFFRQXLli2TShHWr19f2o78Gr1lyxZMmjQJY8aMwS+//CL9nGSJ3KMcP34cc+bMgbq6OurXrw8dHR3MmjULtWvXxsOHD5GUlIQGDRrA29tbKm2cnp6OwsJCaGhowNrauszKW5aW6tWrY/fu3Th37hx+/PFH7Ny5Ey9fvkSPHj3g4OBQ7L7pY8psCW/3/PlznD59Gh4eHujbty8AYMOGDVi4cCFIYtSoUVizZg0ePnyIwsJC1KtX79Mu1/UW/v7++Ouvv5CdnY1+/fqhe/fuePXqFaZPnw4VFRV07twZ1apVw+3bt+Hk5CTdw7MUS7e9/rrybVWUMrJC2SosLFT67HV1dVG3bl28evUKGzZsQNu2baWylr/88gsGDx6M9PR0rF+/Hp06dSqv3S5xbdu2RZs2bcq8dKKiyjCPI3p0Cf9I8QBbu3YtFi9ejB49euDy5cs4ceIEJk2ahPbt2+PgwYPw9fVFYWEhfvzxR3z77bcIDg6Gqqpqhap9/qHkdVPHjBmDzp07S/1TgNIdBAgVw5v6VTx79gwhISGIjY3FtWvX0KNHD/z444+4du0aTExM0L59+0rx3QeA06dPw83NDZ6enrCzs8Pp06fRu3dvdOjQAba2trh8+TJ27NgBLS0tqT9WSXg9yPb777/jypUrsLCwwJ9//onFixdDX18f7dq1g5qaGnbu3InDhw9j9erVYkKtnIjz4dspnkf8/f0RHh4OS0tLpKenIzIyEhoaGhg1ahR++ukneHt749GjR2jfvj369etXznteRHH/L126hLy8POTl5eHSpUuYM2cOvL29pYk0AJg7dy4uXLgAkggNDYWqqipyc3Mxd+5cODo64tdffy2vtyIIlYbiOXfBggWIjIyEv78/Tpw4gdWrVyMlJQWenp7o0aMHACAuLg5jxozBokWL8N///vejt5+RkYG8vDx4enri8ePHcHFxgaWlJfz8/HD8+HG0bt0aw4cPx5dffvnR2xKEj8Fy6LvxTxSvq2vXrsWlS5dQUFCAUaNG4ccff8TNmzexYsUKXL58GTY2NnBxcUFycrLS9fPly5eYNm0abt68ia+//hqXLl2Cubk5tm7dCisrK4wfP14KNsu3s2LFClhaWmLkyJEl/p6ePXsmBQ3u3LmDBg0aICEhAceOHcPq1avRqVMndO/eHQ0aNJD6eF64cAH37t3DmjVroK6uXuL7VNZiY2PRv39/eHp64rfffpOCKpqamujatWup3TcJ//Ps2TMYGRnhm2++gbu7O7p27Sr9bN26dVi0aBHMzMzg6OhYqftFLl68GGvWrMGSJUtQq1Yt/Pjjj6hRowbi4+MRHx+PadOmQU1NDTk5OahWrZoUWK9I50mhclO8Dm7evBmJiYl49OgRxo0bh7t372Lp0qVITk7GnDlzlHq4PXnyBN99912l7PUsjr+PI9JGhL/1+uR+Xl4exowZA2trawCAj48PJk+eDJLo2rUrdHR0kJqaClVVVfz3v/9FlSpVKk2GkoGBAYKCguDm5oacnBz07NkTderUAVA8I0WoXBSPg7179+L69euoU6cOnJyc4OHhgby8PKxduxanT5/G7t278ejRI9y/fx/t27evFEEuAIiOjoaJiQns7Ozw+PFjLFmyBDY2Njhy5Aiys7PRo0cPZGdnIzo6Gk+ePMH3339fIttVUVHB6dOn4e3tDW9vb9jZ2eHUqVPo06cPateujeHDh+PAgQOYO3cuatasierVq2PevHkiyFWOxPnw7eTnkXv37iE9PR1z586Fnp4egKJkijlz5mDJkiUICAiAl5cXRo0ahVu3blWIwa7iipEPzQzNzc1F9erVMW7cuPJ8K4JQqcjPDQcPHpSCWL/99huqVauG7du3AwDq1KmDvLw86fr9888/S6vOP5Z8An3ChAmYMWMGgoODoaKigrFjxyIzMxNxcXHIyckRgS6h3FW0IBfwv3GBn58ftmzZgsaNG+PBgwfo1q0bNm/ejN9//x39+vXDihUrsHbtWsybNw+ampoICwuT3stXX32FadOmwdLSEtevX8fQoUMxYMAA1KlTBwcOHMCyZcswYMAA6Vh1cHBAvXr10K5du1J5T99++y0AICkpCd27d4e5uTkmTpyIhg0bIicnBxs3bkSVKlVgb2+PX3/9FVOnTsWjR49QrVo1fPfdd6WyT2Xt7NmzaNq0Kezt7aXHNmzYAAcHB+Tn50v3TVFRUXj69Cnq1atXjntbOX377bdYunQpXFxccO3aNTx//hx169YFAPTs2RNVq1bFtGnTULNmTYwYMQLVq1cv3x0uBa9evcKVK1cwefJkaGpq4vr161i5ciV27tyJ1NRU9O/fH2FhYdi+fTu+++47uLu7o1q1apUmUVf4NMivg7Nnz8bOnTvRqlUrkERcXBxMTU1RUFCA4OBgjB49GrNnz5aCXfL5pjclpH/qKtI45VP06UcfhFIlP2GsXLkS586dQ2xsrFJm+bhx46CiooIpU6YAADp37oyffvpJ+vmnWKbt7xgYGGD+/Pnw8vJSGrgKlZviTej27dshk8nw888/IyMjA7Vr10aNGjXg7OwMCwsLPHz4ECtWrMDVq1cREREBCwuLct77j0cSly5dko7ttWvXon79+pgxYwaOHj0KV1dX5ObmolmzZli+fLl0g1tSXg+yLV26FNbW1tizZw/09PTg5uaGBg0aQFVVFTVr1pRuYgShIkhOTkbVqlWl8kHyY+bLL79UKq9pYGCAgoICDBkyBCdPnoSOjg4CAwPxzTffVIjJOfm2Fy9ejE2bNillhlatWhUGBgaoV68epk6divDwcCkz1NDQEEDReaQyTiIIQkVw9uxZLFiwAE+fPpVu/H/55RfMnDkTkyZNwuzZszF58mTUr18fqqqq2LBhA6pUqVKikwO//vorJkyYgOnTpyM0NBQ5OTmYMmUKUlNTS3xcIAgfqiJOHq1btw67du3CypUr0ahRI6xatQo+Pj7o0qULNm7ciN9//x0DBgxAy5YtcffuXQwZMgSA8nt58eIF0tPToampiX379uHnn3/G6NGjUVhYiIMHD0JFRUWpjGj79u0BFC+LXJJq1aoFe3t77Nq1CyoqKvD29oa7uzsAIDw8HOnp6cjNzUX9+vWlxyuLhw8fIiMjQ/p/Tk4OfvnlF/j6+sLJyQnVq1eHnZ0dnJycxPmxFCm2oPj111+VqvLY29ujatWq0NLSqrTjU5K4evUq6tati9TUVCxduhQNGjRAx44dUadOHSxevBjdu3fH5MmTpTm7ypKkLnxaYmJisGfPHixbtgwNGzZU+lmDBg3g4uKC5cuXo2/fvti0aZPSKszKFuQSPp74RghvVFhYKP07MDBQ6rf18uVLHDp0COfPn5d+7unpid69e8Pb2xtRUVFKr1MZTzpt2rTB4cOHxWT6Z2bz5s3Ys2cPQkNDsXLlSowfPx4pKSnYtm0bYmNjART1ntDU1ISvry/U1dVx5syZct7rkqGiogI3Nze0bt0a165dw8WLF6Grq4vCwkJkZmbiP//5D+rWrYvOnTuX+M2aPMimqqoK4H9BNj8/P8yePRt79uxBYGAgTpw4gZ9++kkcl0KFs3HjRsydOxdA0aqtevXqoUePHnj16hXS0tIAFK10AgBjY2P89NNPSEpKAgCpHENhYWGFmJx7PTNURUUFK1euhIWFBZycnJCWloawsDBoaGjAzMxMKn9SUFBQIfZfECqL1yvP169fH2ZmZnj58iWWL18uPf7HH38gICAAc+fOxahRozBmzBiEh4dDVVUV+fn5JT5O/+WXXzBhwgTUqFED27ZtQ0ZGRqVZoSEIpaGwsBAXL15Er1690KhRI1y6dAk7d+7E0KFD8fPPP6Nnz554/Pgx/vOf/6Bz584YMWKEdPwq+vHHHxETE4MFCxagXr16CAkJwV9//YWxY8fCyMgIhw8fxrx585CVlaX0eyUV5CIpzR/k5eUhNzcX33//Pfr164cuXbpg3759mDZtGgDA3d0d9vb2uHTpEs6cOVNqK8vKk4mJCa5cuYIdO3YAgNRzrLCwEH/88Qfu3r0LNTU1EeQqA3p6eli+fDlmzZqFrVu34uXLl9LPunTpgv/85z/luHelq3bt2hg6dCiOHj2KwMBA2NnZwcvLC6NHj4aGhgYaNWqEKlWqKAW2RJBLKAuK880AkJaWhho1auCHH36QflZQUIC4uDh07twZ//3vf+Hq6opu3brht99+K4c9Fj4l4iwmvJH8xvfixYvIzMzEihUroKWlhT179iAoKAghISFwcXGBpqYmAGDMmDGoX79+sabWlVVlaNAnvJ/k5GTo6OhATU0NsbGx2LBhA06cOIEXL15ATU0NU6ZMQePGjQEUDSpbt26NsLAwvHz5Uqmf26eqefPmaN68OVatWoXHjx9LK9UuXboEPT09jBgxolTKEsmDbPfv35eCbF26dFEKsv3rX/+Syr8JQkWjq6uL/v374/Lly6hSpQrCwsLg7u6O9PR0jB8/Hr/99hsaNWoEoKhpdo0aNYpNDFeUpBGRGSoI5U9xFVZWVhYKCgrw888/o1+/fqhSpQpWrVqF6dOnY8KECQCKSrt8//33aNGihfQaBQUFpXZc/vLLL5g9ezZUVFSU+gIJglC874aKigqePHmCL7/8Eqmpqdi4cSOMjIzQr18/1KxZE7NmzYKhoSGWL1+udJ/9puO3SpUq+Pbbb+Ht7Y3p06crlRFNT0/H8+fPUbNmzRJ9PxcvXkSDBg1Qt25dqKio4OjRo4iIiMDt27dhZGQEAwMDDB48GEDRyjUA8Pb2xpAhQ9CpUyd89dVXlTJJrVWrVujatStmzJiBwsJC2NraIisrC6dOnUKzZs0wZswYcX4sQ3/XgqKys7W1haGhIVRVVaU5idzcXKxZswZfffUVvvnmm3LeQ+FzJB/Hnjx5Es2aNcOrV6/w8OFDqKqqokqVKsjLy4OqqipkMhlI4sqVKzAyMoK2tjaA0l2NLHz6xMyDILl58ya+/fZb6WIXGxuLgQMHQlVVFebm5gCAjh07oqCgACtWrMCKFSvQv39/NG3aFADg6OgIQExqCZ++N5UIq169Os6dOwd3d3dERUVBX18fY8eORbNmzWBjY4N79+5Jga4HDx7g6NGjqFmzZqU7Fr777jvcv38fixYtwuPHj7Fnzx6sWbOmVHtvlFeQTRBKgq6uLnR1dXHs2DHo6+vjyy+/RM2aNeHl5YWCggI4ODhgwIAB+OKLL3D8+HGoqqrC2Ni4vHf7jeSZoXPnzsXhw4fRvXt3mJqaolGjRjh+/LjIDBWEUqbYKy8oKAjnzp3D9evXYWhoCHNzc2lCef369ahSpQq8vLwAFJ8QKO3JAXmpVkEQ/kcxSJ2ZmYkvvvgCKioqGDp0KGrUqIHbt2/jyZMnsLGxQfXq1VG3bl1YWVnhjz/+gI6OzjtvR76ycvr06QgJCUFWVhamT58u3d+UVCnk5ORkdOvWDWPGjIGTkxNOnjwJNzc3dOnSBQ0aNMCRI0ewa9cujB07FgMHDgRQVCEjMzMTPj4+aNCgwUfvQ0VVs2ZNDBs2TDoPL1myBF9++SUePnyI4OBgEeQqB59zC4rvvvsODx8+xIQJE/Dy5Uu8evUKeXl52LRpE1RUVCpljyOh4jt58iS8vLywfv16WFlZISQkBIMHD0ZoaKhUzefFixf44YcfUKtWLaXfFUEu4e+I2QdBsn37dly4cAFr1qxBTEwMgKLaxatWrcLly5elSXxLS0uoqKggODgYs2fPxqRJk/DHH39IryMmtYRPmeJALzs7G/n5+ahduzasra2RlpaGW7duYeLEiTA0NMT333+P3Nxc/Pnnn1JJCgD44Ycf0KBBA3h4eFS61X96enro1KkTdu/ejW+++QarV6+GTCYrk22XR5BNED7E65NIjRs3hqGhIfz9/TF+/HiMHz9eyrquUaMGAgIC0Lx5c7Rr1w6Ojo6oVq1ahU0aEZmhglA+FMcnS5cuRWhoKPr374/ffvsNFy9exLFjx+Dl5SVNKG/atAnp6enw8fEREwKCUAHIj9/ly5fj0KFD+Pe//w0rKyvo6+sDAGbMmIEnT55Iqy/37t2L3377DQMGDADwfsmk8mDXqFGjcPbsWXTp0qXEJ7R//fVXLFu2DG5ubqhSpQquX78Od3d3uLq6AihKSFu3bh3mz5+P+vXro2fPnsjKysKRI0fw9OlT1KtXr0T2o6L67rvv4OXlBSsrK1y4cAH16tVD8+bN8euvv5b3rn225C0oKtv9+bv47rvv0LZtW5w5cwb/93//h969e1fo+w2h8mvZsiWqVauGxYsXY8qUKRg2bBgCAgJgb28PT09PZGVlYcOGDfjiiy+gpaVV3rsrfEJU+HqRd+GzdfbsWSnzCAB2796N9PR0BAcHIywsDL6+vrCxsZGev3nzZpw9exYzZswQGSBCpaA4Oa2YKW1gYIBOnTpJN56ZmZm4e/cuvv32W0yYMAHPnj1DeHg4qlat+llkRBUUFEg1/ssyIzEtLQ3z5s3D2bNn8c0332DChAlQU1Mrs+0LwruQl1oAgJSUFKkkT82aNXH06FEMGzYMbdu2xYQJE/DNN98gNTUVQUFB2LBhAxYvXgx9fX2l16ioHj58CB8fn2KZoaqqqp/FeVAQysutW7ewZMkSmJiYSBUXLl++jNWrVyM+Ph6BgYH4+uuvsXz5cty9exeBgYHieBSECiIkJARLly5Fx44dER0djXr16qF79+6wtrbGypUrsXbtWjRv3hz37t3Dq1evsHnz5o+ahH78+DHq1atXqueAY8eOYcCAAfjyyy8xYsQIODg4SD+Li4vD2LFj4eTkBHt7e6SmpkJFRUX0phKECkCUfxPKyuv3hvLv3s6dOxEWFoa5c+fixx9/xOnTp7Fs2TLEx8fjp59+wg8//IClS5dCVVVVfF+FdyYCXYLS5P6IESOwZ88eNGrUCFu3bgVQNJm1YsUKrF27tliwS05MagmfurdlSj958gQXL17E48eP4e7uDhsbG8yYMQMHDhxArVq1ULduXaxevVpcfMtIeQXZBOGfHD16FJqamvj6668BAAsXLsS+ffuQm5sLKysrdOnSBT/99BOioqIwbNgwmJiYYPDgwThz5gyaNGmC0NBQHD16FH5+fmjTpk05v5t/lpubiz179ojMUEEoQ0lJSTAzM4OqqipmzZqFjh07Sj87f/48hg8fjtGjR8PS0hIvXrzAV199JcoSCUI5Ujz28vPzMXv2bOjo6MDY2Bg3b97EtGnTkJ2djX79+sHAwABTp05FWloavvzyS8ycObPE7i9K+xxw6tQp9OnTB71798aIESOUykz17dsX33zzDebOnSvOQ4IgCJ+xyMhIaGlpoWbNmlBVVUViYiL69euH/v37KyVJ3Lp1C7Vr15YSNcT9pfA+RKDrM6c46H358iX27NkDVVVVLFy4EPXr10dQUBC+/PJLPHjwAMHBwVi3bh28vb3Rs2fPct5zQSgdf5cpfe3aNSxevBiFhYW4ceMGatWqhVatWqFq1ari4isIn7GVK1ciICAAI0eOhKOjI1avXo3AwEAMHz4cp06dwvXr19G6dWu4urri559/xrFjx+Dm5oaqVauiYcOGCAsLw4sXL+Dl5YUrV65g7969n2RZFRHsF4TSd/LkSfTt2xeurq4YOHCg0oSyjY0NjIyMMGLECOmxkurHIwjC+1E89jZt2oS0tDRs2bIFnp6eMDExAQAkJCTAx8cHmZmZcHNzg5GRkdJrfEr3FydOnICrqyt8fHzQvn17VK9eHQDg6uqKRo0aYdiwYeW8h4IgCEJ5uXLlCuzs7PDbb79BW1sb/fv3x6+//op169YhNDQUQUFB+L//+z8AytdPkawlvC8R6PqMKZ4wwsPDcfbsWdSrVw8ODg64f/8+xo4di/r162PZsmX44osv8OjRIwQEBODWrVtYv369uGkWKp33yZRWJCZ3BUEYOXIkLl68iO7duyMuLg5du3aFgYEBAGDRokXYs2cPtLS0MHDgQPz888+4c+cOLly4AAsLC6nc3/Pnz5GXl4cff/yxnN+NIAgVmXxC2dfXF6ampqhRowYyMjLQu3dvODg4wM7Orrx3URA+a4r32f7+/ggNDcW///1vJCYmwtraGn5+ftJzr1+/Dj8/PyQnJ8Pb21saO3yKQeqoqCgMHjwYDg4O+Pnnn3H//n1s3boV4eHh+P3338t79wRBEIQy8qYA1bNnzxASEoLY2Fhcu3YNPXr0wI8//ohr167BxMQE7du3F3NrwkcTgS4Bfn5+2LBhA7S1tXH8+HHo6OhgyJAhyM/Px9ixY/Hzzz9j2rRpOHv2LP773/+iadOmUFFR+SQH34LwT943U1oQhM9bbm6ulLU8YsQInD17FllZWVi8eDFatmwpPW/RokXYu3cvWrRoAWdnZ6Vm5J9CTy5BECqWqKgoDBo0CObm5vj1119x5coVPHjwAFu3bhXnE0GoIJKTkzF58mSMHj0a3377LY4ePYpp06bB0tISM2fOlJ539epVbN26FePGjfvkJ/hOnDgBFxcX/Pjjj+jYsSM6d+6MP//8s7x3SxAEQSgjikGuvXv34vr166hTpw6cnJxQWFiIvLw8rF27FqdPn0Z8fDwePXqEli1bYs2aNeW850JlINb/febWrl2Lv/76C+vWrUNQUBAmTZqE48ePY9GiRahRowb8/Pzw+PFjdOzYERs3bkSTJk1EkEuo1Fq3bo3g4GAEBwfj0KFDyMnJAQBkZGSgSpUqaNCgQTnvoSAIFYk8yAUA8+bNg6GhIdLT03Hy5ElkZGRIP3Nzc4O5uTn27t2L/fv3K72GmJQWBOF9GRoaYvny5di1axeOHj2Kxo0bY9euXVBVVUV+fn55754gfPbWrFkDR0dHPH/+HN988w1++OEHdOjQARMmTMBff/2F8ePHS89t1KgRJkyYgKpVq6KgoKAc9/rj6enpYfny5SgoKMCQIUNEkEsQBOEzIw9y+fn5YcqUKTh37hyuX78uzanVqFEDzs7OmDJlCgICAtCuXTvcv38fERER5bznQmUgVnR95saNG4cffvgBI0aMwLlz5zB9+nRYWFhg+fLl0NDQwNChQ1G/fn1cvHgRhoaGqFatmghyCZ8FkSktCMLfUcxUCw4ORmJiInx8fAAAo0aNwrlz5+Dk5ARbW1vUrl1b+r2tW7fC2tr6k8/YFgShYoiJiUH//v0xatQoODg4iDGKIFQQz58/R8+ePXHr1i0sXrwYRkZGqFq1KtLT07F3717MnDkT+vr6CAwMLO9dLRWvXr3Cl19+Wd67IQiCIJSDzZs3Y+HChVi6dCnU1NSQkZGBlJQUXLp0Cb/++itatGghPTcjIwPjxo3Dd999h8mTJ5ffTguVgljR9RnLzs7G5cuXpbr+27dvh76+PlxcXDBixAgcP34c3t7eOHv2LNq0aYNq1aohPz9fBLmEz4LIlBYE4W0Ug1yxsbG4d+8etm3bBn9/fwDAnDlzoKmpiZUrV2Lbtm1KK7s6d+5cKTK2BUGoGHR0dLBkyRL4+/sjODgY6enp5b1LgvDZKSwsVPp/fn4+6tati40bN6JBgwaYM2cOzp07h8LCQtSpUwcdO3bEsGHD8Pz582K/W1mIIJcgCMLnKzk5GTo6OlBTU0NsbCwmT56MXr16Yfz48Zg5cyYuXbokPbd27dpo3bo1Tp06hZcvX5bjXguVgQh0fcZq1qyJadOmoXXr1oiLi8OdO3egp6cHoCgI1rJlS5iYmKBdu3bS71SrVq28dlcQypyuri5CQ0ORkJCA2rVrIy8vD4A4DgThcycPcs2aNQseHh7IzMxEkyZNEBwcLGWh+fv7Q1NTE2FhYVi7di2ysrKUXkOs6BIEoaQYGBhg/vz5WLlypQiiC0IZe70XyYIFC+Dt7Y3t27ejTp062Lp1K/Ly8jB16lQp2FW7dm1069YNq1evRpUqVSptsEsQBEGo/N5UKK569eo4d+4c3N3d4eLigqysLIwdOxZ79uzB7du3ce/ePem5Dx48wNGjR1GzZk0x1yZ8NPEN+sw1bdoUKioq8Pb2RrVq1dCqVSsUFhYiOjoaBgYGGDBgAACgoKBATMoJnyV5prSbmxuys7Ph4OCAOnXqlPduCYJQzmJiYrBjxw4sWLAAWlpayM3NxdGjRzFq1CioqKhg0qRJmDt3LlxcXHD16lXUrFmzvHdZEIRKrE2bNjh8+DC++OKL8t4VQfisKCa/7N27FxoaGqhbty48PT2RkJCAsWPHYsuWLbCzs8OMGTMwevRo6OjoSMcqSek1BEEQBOFTopjskZ2djfz8fNSuXRvW1tZIS0vDrVu3MHHiRBgaGuL7779Hbm4u/vzzT9SoUUN6jR9++AENGjSAh4eHGMcKH0306BIAAGFhYfDz84O9vT3i4+ORnp6OrVu3ip5cgvD/HT58GF5eXti7dy/q1q1b3rsjCEI52759O4KDg7Ft2zalzLPt27fD09MTAwcOxPDhwwEAeXl5UFVVFddTQRAEQaiEDhw4gClTpmDhwoXQ1NTE0aNH4erqiqCgIPz73//Gb7/9hhcvXsDIyAjt27eHn59fee+yIAiCIHwUxXvboKAgnDt3DtevX4eBgQE6deok9eHKzMzE3bt38e2332LChAl49uwZwsPDUbVqVaVAmSCUBPFtEgAA5ubmcHR0xPXr1/Hrr79iy5YtqFatGgoKCsSknCDgf5nSIsglCJ8fxZyg3NxcAEW1xB8+fIgbN24oPbdx48ZQVVXF0qVLpYksVVVVcT0VBEEQhErq/v37aNmyJTQ1NbFv3z4MHz4cU6ZMgbq6OsaPH4/o6Gh8/fXXiI6OxsyZM8t7dwVBEAThoxQWFkr3tkuXLkVISAhatmwJMzMz3LhxA2PHjsX27dsBAPPmzcOgQYPQt29fZGRkYMOGDVLPahHkEkqaKF0oAAC+/fZbjB07Vso6B4qa6Ir6qILwP2IZtSB8nuSD+LVr1yI9PR0ODg5o1KgR/vWvf2Ht2rXo27cv/vvf/wIoar5uYGCAZs2aISAgAM2bN4epqako/ysIgiAIlcCbVmdnZ2cjKysLf/31F7y9vTFmzBjY29sjOTkZt2/fxsOHDwH8715CtAUQBEEQPmXyANWtW7dw8+ZNTJo0Cebm5gCAy5cvY/Xq1QgJCUGLFi3Qq1cvtG7dGrVq1UKrVq1QtWpVMd8slBrxrRKUyINcJMVJRxAEQRAUREdH4/Lly/jyyy/Rq1cv9O7dG4sWLcLz58/RsWNH/Pjjj1iyZAlyc3PRpUsX7NmzB0lJSeW924IgCIIglADFEksZGRmoXbs2AEAmk2HlypWIjo6Gh4cHevToAQCoWbMmvvnmG9SrV0/pdUSQSxAEQfjUJSUlwdzcHKqqqmjTpo30uIaGBnr06IHhw4fjwoULsLS0RIMGDaSfFxQUiPlmodSIb5bwRqK8kiAIgvA5e1O98EWLFmHcuHEICQkBAPTq1QtffPEFduzYgdGjR+P3339H3bp1ERISAlVVVdSuXRt16tQpj90XBEEQBKEEkZTGBSEhIThx4gS+/PJL9OjRAyYmJrC1tUVoaChyc3Nx8eJFVK9eHXPmzEHt2rWhr69fznsvCIIgCCWrQYMGWLlyJfr27Ytr167B2NgYtWrVAgA0a9YM33zzTbEy/4BI9hBKlwh0CYIgCIIgvEY+mXX16lX89ttvUrkhHx8fjBkzBsHBwQAABwcHdOzYEffv3wdJfP3111BVVcWcOXNw69Yt6OjolNt7EARBEATh4ymWK5w/fz5Wr14Na2trHD16FBMmTMDIkSMxduxYFBQUYNOmTfD394eamhq+/PJLhIWFSb1IxOSeIAiCUJm0bt0awcHBcHV1xR9//AFTU1PUqFEDGRkZqFKlitJKLkEoCypU7LAuCIIgCIIgAAD27duHiRMnYujQoejcubOUoQYAw4cPR1RUFIYNGwYrKyt8++23uHjxInx9fVFQUIAHDx4gKCgIjRo1Ksd3IAiCIAjCx1AMcj148ADe3t4YOnQomjZtCgBwcXHB/fv3MXToUJibmyM5ORnJycn49ttv8eeff6JKlSqiF4kgCIJQqUVFRWHQoEEwNzfHr7/+iitXruDBgwfYunWr1CJHEMqCCHQJgiAIgiDgzQ3mBw4ciLt376JXr16wsbGRVnY9fvwYFhYW+PbbbzFkyBBYWVnhzp07OHnyJKpXrw5tbW388ssv5fE2BEEQBEH4SN27d4eHhwe0tbUBACtXrsTatWtRp04dLFy4EPXr1wcAZGVlYciQIXjw4AFcXV1hbm6O6tWrS6/zplLIgiAIglDZREdHw9nZGerq6jAxMcGQIUMAQCR7CGVKjLgEQRAEQfjsFRYWKgW5srKyAABLly6FTCZDSEgItm/fjpycHADA8+fPYWJigu7du8Pc3BwA8Ntvv6F79+7o3LmzCHIJgiAIwifq8ePH0NHRgaampvRYx44dUVhYiKtXryIhIQHyfOFatWph8eLF+OWXX+Dr64vo6Gil1xJBLkEQBOFzoKuri9DQUCQkJKB27drIy8sDABHkEsqUWNElCIIgCMJnTTHbet26dTh37hxu3bqFli1bok+fPqhfvz48PDxw+fJlWFhYQE9PD8uXL8dXX32F2bNnAxCZaoIgCIJQGcmDWJ06dUJqairs7Ozw9ddfY/LkyWjWrJn0vOzsbMybNw9jxowRvbgEQRCEz9axY8fg5uaGwYMHw8HBAXXq1CnvXRI+IyLQJQiCIAiCAMDf3x9btmxB27ZtoaKigt27d+Pf//43Jk6ciCZNmmDs2LGIiYlBYWEh/vWvfyEsLAyqqqpvLHkoCIIgCMKnRzFxJTs7G56enti7dy8CAgLQvn17PH78GHZ2dvj+++8xceJEpVVfcgUFBSLYJQiCIHy2Dh8+DC8vL+zduxd169Yt790RPiMi0CUIgiAIwmcvNjYWnp6emDVrFpo3bw4AuHPnDvr3748ff/wRISEhqF69Oq5du4a8vDyoq6uLBvOCIAiCUIkorvA+cuQIUlNTcePGDQDAqlWrlIJdXbt2xQ8//IAxY8agZcuW5bnbgiAIglDhZGZmSv2tBaGsiILRgiAIgiB89p4+fYpatWpBXV0dAJCXl4fffvsNixYtwoULF7Bjxw4AgJqaGho3bowqVaqgoKBABLkEQRAEoZKQB7lmzZqFCRMmYMeOHTh37hxatGgBW1tbDBs2DPv27cMPP/yATZs24fLly9i2bVs577UgCIIgVDwiyCWUBzE7IwiCIAjCZ+VNpQbz8/Nx7949JCUl4Y8//kC1atVQWFiIX3/9Ff/617+QmZlZ7HVEWSJBEARBqFz27NmDiIgIBAcH4//+7/9QrVo1VKlSBa1atUK1atUwfPhwzJ8/H+3bt0d0dDS++uqr8t5lQRAEQRAEAWJFlyAIgiAIn5G8vDwpyPX06VPk5uYiPz8f6urq+OGHH7BmzRrcvn0bKioqqFKlCnJzc1GrVi388MMP5bzngiAIgiCUtjt37uC3337D77//DlVVVWnMcPLkSWRkZKBHjx4YNmwYTp06hW+++QZVq1ZFQUFBOe+1IAiCIAiCIFZ0CYIgCIJQ6UVHR0NTU1MqobB48WIcPHgQBQUFsLa2Rp8+feDi4oIFCxbg+fPnMDc3R506dRASEoIqVarAzMysnN+BIAiCIAilRb7a+9GjR3j16hVUVVWlxwHgp59+wv79+zFr1iz8+OOP0NLSkn5XrPAWBEEQBEEof2JFlyAIgiAIldqyZcswdOhQREREAABCQ0MREhICS0tL1KtXDxs3bsS8efPQtWtXjB49Gs+ePcPw4cMxd+5cAMDGjRtFxrYgCIIgVGLylVsWFha4fPkyVq1apfQ4STRq1AgtW7aEq6srqlWrhvz8/HLbX0EQBEEQBEGZWNElCIIgCEKllZKSgr59++Lq1atYtmwZXr16hTNnziAwMBA6OjpwdnbGrFmzcOjQIZDE0KFDYW1tjRs3buCrr77CDz/8ABUVFeTn56NaNTFsEgRBEITKrEWLFhg4cCB8fX2RmZmJ9u3bo1q1ali6dClq1aqFevXqSc8V4wJBEARBEISKQ4XytfiCIAiCIAiVjL+/Pxo1aoQOHTqgc+fOqFKlCu7fv49ly5ahcePG0vNmzZqFo0ePwtDQEC4uLkoTWYWFhahSRSyCFwRBEITPQVZWFjZu3IiAgADUrl0bX375JerWrYs1a9ZAVVVVjAsEQRAEQRAqIJGCJAiCIAhCpZSRkYGrV6/i2LFjiIiIQF5eHv7zn//g8uXLOHXqFP7880/UqFEDADBmzBhUqVIFW7ZsQf369dGrVy/pdcRkliAIgiB8PmrVqoW+ffuibdu2uHfvHqpXr45mzZqhSpUqYoW3IAiCIAhCBSVWdAmCIAiCUGllZGTAzs4Od+/exejRo+Hi4oJhw4YhPj4e/fv3R6dOnaRgFwCsXbsW3bt3F43lBUEQBEFQUlBQIMYHgiAIgiAIFZRIURYEQRAEodLKzc1FzZo10aJFC0RERGD37t2YP38+1NTUsGLFCuzcuRM5OTnS8x0cHFC1alUUFBSU414LgiAIglDRiCCXIAiCIAhCxSVWdAmCIAiCUOmlpqbCy8sLjx49woABA9C+fXuMHDkS169fR7du3dCzZ09Ur169vHdTEARBEARBEARBEARBeE9iRZcgCIIgCJXed999B29vb/z0009YsWIFDhw4gFmzZiEtLQ337t2Dqqpqee+iIAiCIAiCIAiCIAiC8AHEii5BEARBED4b9+7dw/Tp03Hz5k0UFBTgu+++w/r161GtWjWQhIqKSnnvoiAIgiAIgiAIgiAIgvAeRKBLEARBEITPyoMHD7B//348efIEI0aMQLVq1USDeUEQBEEQBEEQBEEQhE+UCHQJgiAIgvDZUVy9lZ+fj2rVqpXzHgmCIAiCIAiCIAiCIAgfQgS6BEEQBEEQBEEQBEEQBEEQBEEQhE9SlfLeAUEQBEEQBEEQBEEQBEEQBEEQBEH4ECLQJQiCIAiCIAiCIAiCIAiCIAiCIHySRKBLEARBEARBEARBEARBEARBEARB+CSJQJcgCIIgCIIgCIIgCIIgCIIgCILwSRKBLkEQBEEQBEEQBEEQBEEQBEEQBOGTJAJdgiAIgiAIgiAIgiAIgiAIgiAIwidJBLoEQRAEQRAEQRAEQRAEQRAEQRCET1K18t4BQRAEQRAEQRAEQZmnpye2bdv2t8/R1tbGmjVrymiPBEEQBEEQBEEQKiYVkizvnRAEQRAEQRAEQRD+JykpCc+ePZP+v3jxYly9ehULFy6UHqtduzb++9//lsfuCYIgCIIgCIIgVBhiRZcgCIIgCIIgCEIF06BBAzRo0ED6/7fffovq1atD8/+1dzchUbVhHMavEZXGMIZMHBgiml1EH0KKhDoEUUTSoloERZiViFSEpU2bVkEFQ1KLwkkZmBAXtQmibZCLJmiICNtU9km16IvZiCbOu4h3Nm3KN5z3xPVbnedwnsN9r//nfs769eUrSpIkSZL+hwy6JEmSJCmAbty4wdjYGJOTk8zNzbFy5Up6enrYtm1b6ZlHjx6RSqWYmJggEolw4MAB7t69SzQa5fz58wDcvn2bdDrNq1evqKmpobW1lf7+fhoaGsrVmiRJkiT9sopyFyBJkiRJ+j2jo6OcOXOGzZs3MzQ0RCqVorq6mpMnT/Lx40cAXrx4QWdnJwAXL17k6NGjpNNp8vl86T35fJ6BgQG2bNnCtWvXOH36NLlcjhMnTpSjLUmSJEn6bU50SZIkSVLAvH37loMHD9Lb21u6F4vF2LlzJ/l8nu3btzM0NERtbS3Dw8OEw2EA4vE4e/bsKe3J5/MsWrSI7u5uqqurAYhEIjx58oRisUgoFFrYxiRJkiTpNxl0SZIkSVLAJJNJAAqFApOTk7x+/ZoHDx4AMDMzA0Aul6O9vb0UcgE0NjYSi8VK66amJgYHB+no6GDr1q0kEglaW1tJJBIL2I0kSZIkzZ9HF0qSJElSwLx584bOzk6amprYt28fIyMjzM7OAlAsFgH48uULdXV1P+1dtmxZ6bqxsZF0Os3y5cvJZDLs3buX9vZ2rl+/vjCNSJIkSdJ/5ESXJEmSJAXI3Nwc3d3dVFVVcfPmTVatWkVlZSXPnz/n1q1bpeei0SifPn36af/nz5+Jx+OldVtbG21tbUxNTZHL5chms5w9e5Z169axdu3aBelJkiRJkubLiS5JkiRJCpCvX7/y8uVLdu/ezZo1a6is/PH94r1794AfQRj8OJZwfHyc6enp0t6nT5/y7t270vrChQvs2rWLYrFIOBxm06ZNnDp1CoD3798vVEuSJEmSNG9OdEmSJElSgNTV1RGLxRgdHSUajbJkyRLGx8fJZrMATE1NAdDT08OdO3c4dOgQXV1dFAoFLl26REVFBaFQCICWlhYymQzJZJIdO3bw/ft3hoeHiUQitLS0lK1HSZIkSfpVTnRJkiRJUsBcuXKFhoYGkskkx48f5/Hjx1y9epV4PM7Dhw8BWLFiBSMjI0xPT3Ps2DEGBwc5fPgw9fX1LF68GIBEIkEqleLZs2ccOXKEvr4+wuEw2WyWSCRSxg4lSZIk6deEiv/+qViSJEmS9Ne4f/8+VVVVbNiwoXSvUCiwceNGBgYG2L9/fxmrkyRJkqQ/w6MLJUmSJOkvNDExweXLl+nr62P16tV8+/aNTCZDbW0tHR0d5S5PkiRJkv4Igy5JkiRJ+gt1dXUxMzPD2NgYHz58oKamhubmZs6dO8fSpUvLXZ4kSZIk/REeXShJkiRJkiRJkqRAqih3AZIkSZIkSZIkSdJ8GHRJkiRJkiRJkiQpkAy6JEmSJEmSJEmSFEgGXZIkSZIkSZIkSQokgy5JkiRJkiRJkiQFkkGXJEmSJEmSJEmSAsmgS5IkSZIkSZIkSYFk0CVJkiRJkiRJkqRA+gcN1k2r/xW1XAAAAABJRU5ErkJggg==",
      "text/plain": [
       "<Figure size 2100x1000 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "tag_distribution = tags['tag'].value_counts()\n",
    "\n",
    "plt.figure(figsize=(21, 10))\n",
    "sns.barplot(x=tag_distribution.index[:50], y=tag_distribution.values[:50], palette=\"viridis\")\n",
    "plt.xticks(rotation=45)\n",
    "plt.xlabel('Tags', fontsize=12)\n",
    "plt.ylabel('Frequency', fontsize=12)\n",
    "plt.title('Top 50 Most Frequent Tags', fontsize=14)\n",
    "plt.show()\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**Semantic Clustering**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 75,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>tag</th>\n",
       "      <th>cluster</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>s</td>\n",
       "      <td>104</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>end</td>\n",
       "      <td>104</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>reverse</td>\n",
       "      <td>104</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>disaster</td>\n",
       "      <td>104</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>future</td>\n",
       "      <td>104</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2894</th>\n",
       "      <td>2894</td>\n",
       "      <td>strongman</td>\n",
       "      <td>156</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2895</th>\n",
       "      <td>2895</td>\n",
       "      <td>pacifist</td>\n",
       "      <td>126</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2896</th>\n",
       "      <td>2896</td>\n",
       "      <td>piracy</td>\n",
       "      <td>186</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2897</th>\n",
       "      <td>2897</td>\n",
       "      <td>pauli</td>\n",
       "      <td>112</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2898</th>\n",
       "      <td>2898</td>\n",
       "      <td>marine</td>\n",
       "      <td>28</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>2899 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      Unnamed: 0        tag  cluster\n",
       "0              0          s      104\n",
       "1              1        end      104\n",
       "2              2    reverse      104\n",
       "3              3   disaster      104\n",
       "4              4     future      104\n",
       "...          ...        ...      ...\n",
       "2894        2894  strongman      156\n",
       "2895        2895   pacifist      126\n",
       "2896        2896     piracy      186\n",
       "2897        2897      pauli      112\n",
       "2898        2898     marine       28\n",
       "\n",
       "[2899 rows x 3 columns]"
      ]
     },
     "execution_count": 75,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tag_clusters = pd.read_csv(\"../dataset/tag_clusters.csv\")\n",
    "tag_clusters"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Unsupervised Word Sense Disambiguation \n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "context vector from CA model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 77,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "df_cv = pd.read_json(\"../dataset/df_context_vec.json\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Joining the context vector to tags"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 78,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>movieId</th>\n",
       "      <th>imdbId</th>\n",
       "      <th>tmdbId</th>\n",
       "      <th>title</th>\n",
       "      <th>genres</th>\n",
       "      <th>imdb_syn</th>\n",
       "      <th>tmdb_syn</th>\n",
       "      <th>summarized_syn</th>\n",
       "      <th>summarized_syn_cleaned</th>\n",
       "      <th>summarized_syn_tokens</th>\n",
       "      <th>...</th>\n",
       "      <th>IMAX</th>\n",
       "      <th>Musical</th>\n",
       "      <th>Mystery</th>\n",
       "      <th>Romance</th>\n",
       "      <th>Sci-Fi</th>\n",
       "      <th>Thriller</th>\n",
       "      <th>War</th>\n",
       "      <th>Western</th>\n",
       "      <th>weighted_cbow_synopsis</th>\n",
       "      <th>final_context_vector</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>114709</td>\n",
       "      <td>862</td>\n",
       "      <td>Toy Story (1995)</td>\n",
       "      <td>[Adventure, Animation, Children, Comedy, Fantasy]</td>\n",
       "      <td>A little boy named Andy loves to be in his roo...</td>\n",
       "      <td>Led by Woody, Andy's toys live happily in his ...</td>\n",
       "      <td>a little boy name andy love to be in room play...</td>\n",
       "      <td>[little, boy, andy, love, room, play, toy, esp...</td>\n",
       "      <td>[a, little, boy, name, andy, love, to, be, in,...</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>113497</td>\n",
       "      <td>8844</td>\n",
       "      <td>Jumanji (1995)</td>\n",
       "      <td>[Adventure, Children, Fantasy]</td>\n",
       "      <td>Jumanji, one of the most unique--and dangerous...</td>\n",
       "      <td>When siblings Judy and Peter discover an encha...</td>\n",
       "      <td>jumanji one of the most uniqueand dangerousboa...</td>\n",
       "      <td>[jumanji, uniqueand, dangerousboard, game, fal...</td>\n",
       "      <td>[jumanji, one, of, the, most, uniqueand, dange...</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>4</td>\n",
       "      <td>114885</td>\n",
       "      <td>31357</td>\n",
       "      <td>Waiting to Exhale (1995)</td>\n",
       "      <td>[Comedy, Drama, Romance]</td>\n",
       "      <td>This story based on the best selling novel by ...</td>\n",
       "      <td>Cheated on, mistreated and stepped on, the wom...</td>\n",
       "      <td>this story base on the best sell novel by terr...</td>\n",
       "      <td>[story, base, best, sell, novel, terry, mcmill...</td>\n",
       "      <td>[this, story, base, on, the, best, sell, novel...</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>5</td>\n",
       "      <td>113041</td>\n",
       "      <td>11862</td>\n",
       "      <td>Father of the Bride Part II (1995)</td>\n",
       "      <td>[Comedy]</td>\n",
       "      <td>In this sequel to \"Father of the Bride\", Georg...</td>\n",
       "      <td>Just when George Banks has recovered from his ...</td>\n",
       "      <td>in this sequel to father of the bride george b...</td>\n",
       "      <td>[sequel, father, bride, george, bank, accept, ...</td>\n",
       "      <td>[in, this, sequel, to, father, of, the, bride,...</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>6</td>\n",
       "      <td>113277</td>\n",
       "      <td>949</td>\n",
       "      <td>Heat (1995)</td>\n",
       "      <td>[Action, Crime, Thriller]</td>\n",
       "      <td>Hunters and their prey--Neil and his professio...</td>\n",
       "      <td>Obsessive master thief Neil McCauley leads a t...</td>\n",
       "      <td>hunter and preyneil and professional criminal ...</td>\n",
       "      <td>[hunter, preyneil, professional, criminal, cre...</td>\n",
       "      <td>[hunter, and, preyneil, and, professional, cri...</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6178</th>\n",
       "      <td>130856</td>\n",
       "      <td>494826</td>\n",
       "      <td>48376</td>\n",
       "      <td>Severe Clear (2010)</td>\n",
       "      <td>[Comedy, Documentary]</td>\n",
       "      <td>None</td>\n",
       "      <td>Severe Clear is a film based on the memoirs of...</td>\n",
       "      <td>severe clear be a film base on the memoir of f...</td>\n",
       "      <td>[severe, clear, film, base, memoir, lieutenant...</td>\n",
       "      <td>[severe, clear, be, a, film, base, on, the, me...</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6179</th>\n",
       "      <td>130958</td>\n",
       "      <td>143338</td>\n",
       "      <td>78402</td>\n",
       "      <td>Killer Crocodile (1989)</td>\n",
       "      <td>[Horror]</td>\n",
       "      <td>None</td>\n",
       "      <td>A group of environmentalists arrives at a fara...</td>\n",
       "      <td>a group of environmentalist arrives at a faraw...</td>\n",
       "      <td>[group, environmentalist, arrives, faraway, tr...</td>\n",
       "      <td>[a, group, of, environmentalist, arrives, at, ...</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6180</th>\n",
       "      <td>130984</td>\n",
       "      <td>208423</td>\n",
       "      <td>317168</td>\n",
       "      <td>Santo vs. las lobas (1976)</td>\n",
       "      <td>[Action, Fantasy, Horror]</td>\n",
       "      <td>None</td>\n",
       "      <td>Also known as Santo vs. the She-Wolves</td>\n",
       "      <td>also know as santo v the shewolves</td>\n",
       "      <td>[know, santo, v, shewolves]</td>\n",
       "      <td>[also, know, as, santo, v, the, shewolves]</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6181</th>\n",
       "      <td>131011</td>\n",
       "      <td>69109</td>\n",
       "      <td>79572</td>\n",
       "      <td>Execution Squad (1972)</td>\n",
       "      <td>[Crime, Drama]</td>\n",
       "      <td>None</td>\n",
       "      <td>Bertone is a moderately honest homicide cop. U...</td>\n",
       "      <td>bertone be a moderately honest homicide cop be...</td>\n",
       "      <td>[bertone, moderately, honest, homicide, cop, e...</td>\n",
       "      <td>[bertone, be, a, moderately, honest, homicide,...</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6182</th>\n",
       "      <td>131015</td>\n",
       "      <td>1430116</td>\n",
       "      <td>143928</td>\n",
       "      <td>Hellgate (2011)</td>\n",
       "      <td>[Horror, Thriller]</td>\n",
       "      <td>None</td>\n",
       "      <td>A western businessman, his Thai wife and son e...</td>\n",
       "      <td>a western businessman thai wife and son experi...</td>\n",
       "      <td>[western, businessman, thai, wife, son, experi...</td>\n",
       "      <td>[a, western, businessman, thai, wife, and, son...</td>\n",
       "      <td>...</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>6183 rows × 32 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      movieId   imdbId  tmdbId                               title  \\\n",
       "0           1   114709     862                    Toy Story (1995)   \n",
       "1           2   113497    8844                      Jumanji (1995)   \n",
       "2           4   114885   31357            Waiting to Exhale (1995)   \n",
       "3           5   113041   11862  Father of the Bride Part II (1995)   \n",
       "4           6   113277     949                         Heat (1995)   \n",
       "...       ...      ...     ...                                 ...   \n",
       "6178   130856   494826   48376                 Severe Clear (2010)   \n",
       "6179   130958   143338   78402             Killer Crocodile (1989)   \n",
       "6180   130984   208423  317168          Santo vs. las lobas (1976)   \n",
       "6181   131011    69109   79572              Execution Squad (1972)   \n",
       "6182   131015  1430116  143928                     Hellgate (2011)   \n",
       "\n",
       "                                                 genres  \\\n",
       "0     [Adventure, Animation, Children, Comedy, Fantasy]   \n",
       "1                        [Adventure, Children, Fantasy]   \n",
       "2                              [Comedy, Drama, Romance]   \n",
       "3                                              [Comedy]   \n",
       "4                             [Action, Crime, Thriller]   \n",
       "...                                                 ...   \n",
       "6178                              [Comedy, Documentary]   \n",
       "6179                                           [Horror]   \n",
       "6180                          [Action, Fantasy, Horror]   \n",
       "6181                                     [Crime, Drama]   \n",
       "6182                                 [Horror, Thriller]   \n",
       "\n",
       "                                               imdb_syn  \\\n",
       "0     A little boy named Andy loves to be in his roo...   \n",
       "1     Jumanji, one of the most unique--and dangerous...   \n",
       "2     This story based on the best selling novel by ...   \n",
       "3     In this sequel to \"Father of the Bride\", Georg...   \n",
       "4     Hunters and their prey--Neil and his professio...   \n",
       "...                                                 ...   \n",
       "6178                                               None   \n",
       "6179                                               None   \n",
       "6180                                               None   \n",
       "6181                                               None   \n",
       "6182                                               None   \n",
       "\n",
       "                                               tmdb_syn  \\\n",
       "0     Led by Woody, Andy's toys live happily in his ...   \n",
       "1     When siblings Judy and Peter discover an encha...   \n",
       "2     Cheated on, mistreated and stepped on, the wom...   \n",
       "3     Just when George Banks has recovered from his ...   \n",
       "4     Obsessive master thief Neil McCauley leads a t...   \n",
       "...                                                 ...   \n",
       "6178  Severe Clear is a film based on the memoirs of...   \n",
       "6179  A group of environmentalists arrives at a fara...   \n",
       "6180             Also known as Santo vs. the She-Wolves   \n",
       "6181  Bertone is a moderately honest homicide cop. U...   \n",
       "6182  A western businessman, his Thai wife and son e...   \n",
       "\n",
       "                                         summarized_syn  \\\n",
       "0     a little boy name andy love to be in room play...   \n",
       "1     jumanji one of the most uniqueand dangerousboa...   \n",
       "2     this story base on the best sell novel by terr...   \n",
       "3     in this sequel to father of the bride george b...   \n",
       "4     hunter and preyneil and professional criminal ...   \n",
       "...                                                 ...   \n",
       "6178  severe clear be a film base on the memoir of f...   \n",
       "6179  a group of environmentalist arrives at a faraw...   \n",
       "6180                 also know as santo v the shewolves   \n",
       "6181  bertone be a moderately honest homicide cop be...   \n",
       "6182  a western businessman thai wife and son experi...   \n",
       "\n",
       "                                 summarized_syn_cleaned  \\\n",
       "0     [little, boy, andy, love, room, play, toy, esp...   \n",
       "1     [jumanji, uniqueand, dangerousboard, game, fal...   \n",
       "2     [story, base, best, sell, novel, terry, mcmill...   \n",
       "3     [sequel, father, bride, george, bank, accept, ...   \n",
       "4     [hunter, preyneil, professional, criminal, cre...   \n",
       "...                                                 ...   \n",
       "6178  [severe, clear, film, base, memoir, lieutenant...   \n",
       "6179  [group, environmentalist, arrives, faraway, tr...   \n",
       "6180                        [know, santo, v, shewolves]   \n",
       "6181  [bertone, moderately, honest, homicide, cop, e...   \n",
       "6182  [western, businessman, thai, wife, son, experi...   \n",
       "\n",
       "                                  summarized_syn_tokens  ...  IMAX  Musical  \\\n",
       "0     [a, little, boy, name, andy, love, to, be, in,...  ...     0        0   \n",
       "1     [jumanji, one, of, the, most, uniqueand, dange...  ...     0        0   \n",
       "2     [this, story, base, on, the, best, sell, novel...  ...     0        0   \n",
       "3     [in, this, sequel, to, father, of, the, bride,...  ...     0        0   \n",
       "4     [hunter, and, preyneil, and, professional, cri...  ...     0        0   \n",
       "...                                                 ...  ...   ...      ...   \n",
       "6178  [severe, clear, be, a, film, base, on, the, me...  ...     0        0   \n",
       "6179  [a, group, of, environmentalist, arrives, at, ...  ...     0        0   \n",
       "6180         [also, know, as, santo, v, the, shewolves]  ...     0        0   \n",
       "6181  [bertone, be, a, moderately, honest, homicide,...  ...     0        0   \n",
       "6182  [a, western, businessman, thai, wife, and, son...  ...     0        0   \n",
       "\n",
       "      Mystery  Romance  Sci-Fi  Thriller  War  Western  \\\n",
       "0           0        0       0         0    0        0   \n",
       "1           0        0       0         0    0        0   \n",
       "2           0        1       0         0    0        0   \n",
       "3           0        0       0         0    0        0   \n",
       "4           0        0       0         1    0        0   \n",
       "...       ...      ...     ...       ...  ...      ...   \n",
       "6178        0        0       0         0    0        0   \n",
       "6179        0        0       0         0    0        0   \n",
       "6180        0        0       0         0    0        0   \n",
       "6181        0        0       0         0    0        0   \n",
       "6182        0        0       0         1    0        0   \n",
       "\n",
       "                                 weighted_cbow_synopsis  \\\n",
       "0     [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "1     [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "2     [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "3     [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "4     [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "...                                                 ...   \n",
       "6178  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "6179  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "6180  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "6181  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "6182  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "\n",
       "                                   final_context_vector  \n",
       "0     [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "1     [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "2     [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "3     [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "4     [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "...                                                 ...  \n",
       "6178  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "6179  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "6180  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "6181  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "6182  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "\n",
       "[6183 rows x 32 columns]"
      ]
     },
     "execution_count": 78,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_cv"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 79,
   "metadata": {},
   "outputs": [],
   "source": [
    "# joining on movieId\n",
    "\n",
    "\n",
    "tag_cv = tags.merge(df_cv[['movieId', 'final_context_vector']], on='movieId', how='inner')\n",
    "\n",
    "# Now, 'tag_cv' will contain all columns from 'tags' and 'final_context_vector' from 'df_cv',\n",
    "# joined on 'movieId'.\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 80,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0.2</th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>Unnamed: 0.1</th>\n",
       "      <th>userId</th>\n",
       "      <th>movieId</th>\n",
       "      <th>tag</th>\n",
       "      <th>timestamp</th>\n",
       "      <th>un-lemmatised</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>has_glove_vec</th>\n",
       "      <th>final_context_vector</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>7</td>\n",
       "      <td>266</td>\n",
       "      <td>318</td>\n",
       "      <td>260</td>\n",
       "      <td>s</td>\n",
       "      <td>2015-02-20 22:42:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[ 0.18209    0.88297   -0.49805    0.53137   -...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>52</td>\n",
       "      <td>98</td>\n",
       "      <td>1584</td>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>2010-05-30 03:36:40</td>\n",
       "      <td>action</td>\n",
       "      <td>[ 2.0240e-02  8.4992e-01 -7.8150e-01 -8.2769e-...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>53</td>\n",
       "      <td>99</td>\n",
       "      <td>1585</td>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>adventure</td>\n",
       "      <td>2010-05-30 03:36:37</td>\n",
       "      <td>adventure</td>\n",
       "      <td>[ 0.094151   0.49795   -0.87618   -0.66309    ...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>54</td>\n",
       "      <td>100</td>\n",
       "      <td>1586</td>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>atmospheric</td>\n",
       "      <td>2010-05-30 03:36:38</td>\n",
       "      <td>atmospheric</td>\n",
       "      <td>[ 0.13512   -0.23763   -0.1364    -0.25487    ...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>55</td>\n",
       "      <td>104</td>\n",
       "      <td>1590</td>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>stylize</td>\n",
       "      <td>2010-05-30 03:36:32</td>\n",
       "      <td>stylized</td>\n",
       "      <td>[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. ...</td>\n",
       "      <td>False</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49912</th>\n",
       "      <td>50146</td>\n",
       "      <td>109241</td>\n",
       "      <td>390890</td>\n",
       "      <td>138280</td>\n",
       "      <td>108981</td>\n",
       "      <td>sexuality</td>\n",
       "      <td>2014-02-14 21:49:07</td>\n",
       "      <td>sexuality</td>\n",
       "      <td>[ 2.7006e-01  3.4214e-01  4.9813e-01 -4.3149e-...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49913</th>\n",
       "      <td>50176</td>\n",
       "      <td>109289</td>\n",
       "      <td>390938</td>\n",
       "      <td>138280</td>\n",
       "      <td>112940</td>\n",
       "      <td>counterespionage</td>\n",
       "      <td>2014-12-27 18:19:58</td>\n",
       "      <td>counterespionage</td>\n",
       "      <td>[ 0.11309   -0.8528    -0.25529    0.02635   -...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49914</th>\n",
       "      <td>50177</td>\n",
       "      <td>109290</td>\n",
       "      <td>390939</td>\n",
       "      <td>138280</td>\n",
       "      <td>112940</td>\n",
       "      <td>slow</td>\n",
       "      <td>2014-12-27 18:20:04</td>\n",
       "      <td>slow</td>\n",
       "      <td>[ 0.37381    0.017462  -0.77856    0.35216   -...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49915</th>\n",
       "      <td>50189</td>\n",
       "      <td>109310</td>\n",
       "      <td>390959</td>\n",
       "      <td>138280</td>\n",
       "      <td>117871</td>\n",
       "      <td>image</td>\n",
       "      <td>2015-01-30 23:09:16</td>\n",
       "      <td>image</td>\n",
       "      <td>[ 1.1091e-02  4.8461e-01  1.9142e-02  8.3725e-...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49916</th>\n",
       "      <td>50190</td>\n",
       "      <td>109311</td>\n",
       "      <td>390960</td>\n",
       "      <td>138280</td>\n",
       "      <td>117871</td>\n",
       "      <td>story</td>\n",
       "      <td>2015-01-30 23:09:25</td>\n",
       "      <td>story</td>\n",
       "      <td>[-0.35058    0.58245   -0.065584  -0.41768    ...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>49917 rows × 11 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "       Unnamed: 0.2  Unnamed: 0  Unnamed: 0.1  userId  movieId  \\\n",
       "0                 0           7           266     318      260   \n",
       "1                52          98          1584     964      260   \n",
       "2                53          99          1585     964      260   \n",
       "3                54         100          1586     964      260   \n",
       "4                55         104          1590     964      260   \n",
       "...             ...         ...           ...     ...      ...   \n",
       "49912         50146      109241        390890  138280   108981   \n",
       "49913         50176      109289        390938  138280   112940   \n",
       "49914         50177      109290        390939  138280   112940   \n",
       "49915         50189      109310        390959  138280   117871   \n",
       "49916         50190      109311        390960  138280   117871   \n",
       "\n",
       "                    tag            timestamp     un-lemmatised  \\\n",
       "0                     s  2015-02-20 22:42:49               NaN   \n",
       "1                action  2010-05-30 03:36:40            action   \n",
       "2             adventure  2010-05-30 03:36:37         adventure   \n",
       "3           atmospheric  2010-05-30 03:36:38       atmospheric   \n",
       "4               stylize  2010-05-30 03:36:32          stylized   \n",
       "...                 ...                  ...               ...   \n",
       "49912         sexuality  2014-02-14 21:49:07         sexuality   \n",
       "49913  counterespionage  2014-12-27 18:19:58  counterespionage   \n",
       "49914              slow  2014-12-27 18:20:04              slow   \n",
       "49915             image  2015-01-30 23:09:16             image   \n",
       "49916             story  2015-01-30 23:09:25             story   \n",
       "\n",
       "                                               glove_vec  has_glove_vec  \\\n",
       "0      [ 0.18209    0.88297   -0.49805    0.53137   -...           True   \n",
       "1      [ 2.0240e-02  8.4992e-01 -7.8150e-01 -8.2769e-...           True   \n",
       "2      [ 0.094151   0.49795   -0.87618   -0.66309    ...           True   \n",
       "3      [ 0.13512   -0.23763   -0.1364    -0.25487    ...           True   \n",
       "4      [0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. ...          False   \n",
       "...                                                  ...            ...   \n",
       "49912  [ 2.7006e-01  3.4214e-01  4.9813e-01 -4.3149e-...           True   \n",
       "49913  [ 0.11309   -0.8528    -0.25529    0.02635   -...           True   \n",
       "49914  [ 0.37381    0.017462  -0.77856    0.35216   -...           True   \n",
       "49915  [ 1.1091e-02  4.8461e-01  1.9142e-02  8.3725e-...           True   \n",
       "49916  [-0.35058    0.58245   -0.065584  -0.41768    ...           True   \n",
       "\n",
       "                                    final_context_vector  \n",
       "0      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "1      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "2      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "3      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "4      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "...                                                  ...  \n",
       "49912  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "49913  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "49914  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "49915  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "49916  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "\n",
       "[49917 rows x 11 columns]"
      ]
     },
     "execution_count": 80,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tag_cv"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 81,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Index(['Unnamed: 0.2', 'Unnamed: 0', 'Unnamed: 0.1', 'userId', 'movieId',\n",
       "       'tag', 'timestamp', 'un-lemmatised', 'glove_vec', 'has_glove_vec',\n",
       "       'final_context_vector'],\n",
       "      dtype='object')"
      ]
     },
     "execution_count": 81,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tag_cv.columns"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Result from the join = 47942 rows\n",
    "Previous rows in tags = 48220\n",
    "\n",
    "- The movies that didn't exist after applying the tmdb API is the cause of this result\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Performing Unsupervised WSD"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 83,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "\n",
    "def get_glove(file_path):\n",
    "    embeddings_index = {}\n",
    "    with open(file_path, 'r', encoding='utf-8') as f:\n",
    "        for line in f:\n",
    "            word, coefs = line.split(maxsplit=1)\n",
    "            coefs = np.fromstring(coefs, \"f\", sep=\" \")\n",
    "            embeddings_index[word] = coefs\n",
    "    return embeddings_index\n",
    "\n",
    "path_to_glove_file = \"../pretrain_model/glove.6B/glove.6B.200d.txt\"\n",
    "glove_vec = get_glove(path_to_glove_file)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 84,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "       Unnamed: 0.2  Unnamed: 0  Unnamed: 0.1  userId  movieId  \\\n",
      "0                 0           7           266     318      260   \n",
      "1                52          98          1584     964      260   \n",
      "2                53          99          1585     964      260   \n",
      "3                54         100          1586     964      260   \n",
      "4                55         104          1590     964      260   \n",
      "...             ...         ...           ...     ...      ...   \n",
      "49912         50146      109241        390890  138280   108981   \n",
      "49913         50176      109289        390938  138280   112940   \n",
      "49914         50177      109290        390939  138280   112940   \n",
      "49915         50189      109310        390959  138280   117871   \n",
      "49916         50190      109311        390960  138280   117871   \n",
      "\n",
      "                    tag            timestamp     un-lemmatised  \\\n",
      "0                     s  2015-02-20 22:42:49               NaN   \n",
      "1                action  2010-05-30 03:36:40            action   \n",
      "2             adventure  2010-05-30 03:36:37         adventure   \n",
      "3           atmospheric  2010-05-30 03:36:38       atmospheric   \n",
      "4               stylize  2010-05-30 03:36:32          stylized   \n",
      "...                 ...                  ...               ...   \n",
      "49912         sexuality  2014-02-14 21:49:07         sexuality   \n",
      "49913  counterespionage  2014-12-27 18:19:58  counterespionage   \n",
      "49914              slow  2014-12-27 18:20:04              slow   \n",
      "49915             image  2015-01-30 23:09:16             image   \n",
      "49916             story  2015-01-30 23:09:25             story   \n",
      "\n",
      "                                               glove_vec  has_glove_vec  \\\n",
      "0      [ 0.18209    0.88297   -0.49805    0.53137   -...           True   \n",
      "1      [ 2.0240e-02  8.4992e-01 -7.8150e-01 -8.2769e-...           True   \n",
      "2      [ 0.094151   0.49795   -0.87618   -0.66309    ...           True   \n",
      "3      [ 0.13512   -0.23763   -0.1364    -0.25487    ...           True   \n",
      "4      [0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. ...          False   \n",
      "...                                                  ...            ...   \n",
      "49912  [ 2.7006e-01  3.4214e-01  4.9813e-01 -4.3149e-...           True   \n",
      "49913  [ 0.11309   -0.8528    -0.25529    0.02635   -...           True   \n",
      "49914  [ 0.37381    0.017462  -0.77856    0.35216   -...           True   \n",
      "49915  [ 1.1091e-02  4.8461e-01  1.9142e-02  8.3725e-...           True   \n",
      "49916  [-0.35058    0.58245   -0.065584  -0.41768    ...           True   \n",
      "\n",
      "                                    final_context_vector  \n",
      "0      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
      "1      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
      "2      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
      "3      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
      "4      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
      "...                                                  ...  \n",
      "49912  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
      "49913  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
      "49914  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
      "49915  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
      "49916  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
      "\n",
      "[49917 rows x 11 columns]\n"
     ]
    }
   ],
   "source": [
    "import ast\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "\n",
    "def safe_literal_eval(x):\n",
    "    try:\n",
    "        return np.array(ast.literal_eval(x))\n",
    "    except (ValueError, SyntaxError):\n",
    "        print(f\"Failed to evaluate: {x}\")\n",
    "        return np.array([])  # or however you want to handle failures\n",
    "\n",
    "# Assuming tag_cv is your DataFrae\n",
    "\n",
    "tag_cv['final_context_vector'] = tag_cv['final_context_vector'].apply(\n",
    "    lambda x: safe_literal_eval(x) if isinstance(x, str) else x\n",
    ")\n",
    "\n",
    "print(tag_cv)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 85,
   "metadata": {},
   "outputs": [],
   "source": [
    "import ast\n",
    "\n",
    "tag_cv['final_context_vector'] = tag_cv['final_context_vector'].apply(lambda x: np.array(ast.literal_eval(x)) if isinstance(x, str) else x)\n",
    "\n",
    "# removing nan values in the tag_cv\n",
    "\n",
    "tag_cv = tag_cv.dropna(subset=['tag'])\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 86,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0.2</th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>Unnamed: 0.1</th>\n",
       "      <th>userId</th>\n",
       "      <th>movieId</th>\n",
       "      <th>tag</th>\n",
       "      <th>timestamp</th>\n",
       "      <th>un-lemmatised</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>has_glove_vec</th>\n",
       "      <th>final_context_vector</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>7</td>\n",
       "      <td>266</td>\n",
       "      <td>318</td>\n",
       "      <td>260</td>\n",
       "      <td>s</td>\n",
       "      <td>2015-02-20 22:42:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[ 0.18209    0.88297   -0.49805    0.53137   -...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>52</td>\n",
       "      <td>98</td>\n",
       "      <td>1584</td>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>2010-05-30 03:36:40</td>\n",
       "      <td>action</td>\n",
       "      <td>[ 2.0240e-02  8.4992e-01 -7.8150e-01 -8.2769e-...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>53</td>\n",
       "      <td>99</td>\n",
       "      <td>1585</td>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>adventure</td>\n",
       "      <td>2010-05-30 03:36:37</td>\n",
       "      <td>adventure</td>\n",
       "      <td>[ 0.094151   0.49795   -0.87618   -0.66309    ...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>54</td>\n",
       "      <td>100</td>\n",
       "      <td>1586</td>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>atmospheric</td>\n",
       "      <td>2010-05-30 03:36:38</td>\n",
       "      <td>atmospheric</td>\n",
       "      <td>[ 0.13512   -0.23763   -0.1364    -0.25487    ...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>55</td>\n",
       "      <td>104</td>\n",
       "      <td>1590</td>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>stylize</td>\n",
       "      <td>2010-05-30 03:36:32</td>\n",
       "      <td>stylized</td>\n",
       "      <td>[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. ...</td>\n",
       "      <td>False</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49912</th>\n",
       "      <td>50146</td>\n",
       "      <td>109241</td>\n",
       "      <td>390890</td>\n",
       "      <td>138280</td>\n",
       "      <td>108981</td>\n",
       "      <td>sexuality</td>\n",
       "      <td>2014-02-14 21:49:07</td>\n",
       "      <td>sexuality</td>\n",
       "      <td>[ 2.7006e-01  3.4214e-01  4.9813e-01 -4.3149e-...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49913</th>\n",
       "      <td>50176</td>\n",
       "      <td>109289</td>\n",
       "      <td>390938</td>\n",
       "      <td>138280</td>\n",
       "      <td>112940</td>\n",
       "      <td>counterespionage</td>\n",
       "      <td>2014-12-27 18:19:58</td>\n",
       "      <td>counterespionage</td>\n",
       "      <td>[ 0.11309   -0.8528    -0.25529    0.02635   -...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49914</th>\n",
       "      <td>50177</td>\n",
       "      <td>109290</td>\n",
       "      <td>390939</td>\n",
       "      <td>138280</td>\n",
       "      <td>112940</td>\n",
       "      <td>slow</td>\n",
       "      <td>2014-12-27 18:20:04</td>\n",
       "      <td>slow</td>\n",
       "      <td>[ 0.37381    0.017462  -0.77856    0.35216   -...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49915</th>\n",
       "      <td>50189</td>\n",
       "      <td>109310</td>\n",
       "      <td>390959</td>\n",
       "      <td>138280</td>\n",
       "      <td>117871</td>\n",
       "      <td>image</td>\n",
       "      <td>2015-01-30 23:09:16</td>\n",
       "      <td>image</td>\n",
       "      <td>[ 1.1091e-02  4.8461e-01  1.9142e-02  8.3725e-...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49916</th>\n",
       "      <td>50190</td>\n",
       "      <td>109311</td>\n",
       "      <td>390960</td>\n",
       "      <td>138280</td>\n",
       "      <td>117871</td>\n",
       "      <td>story</td>\n",
       "      <td>2015-01-30 23:09:25</td>\n",
       "      <td>story</td>\n",
       "      <td>[-0.35058    0.58245   -0.065584  -0.41768    ...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>49630 rows × 11 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "       Unnamed: 0.2  Unnamed: 0  Unnamed: 0.1  userId  movieId  \\\n",
       "0                 0           7           266     318      260   \n",
       "1                52          98          1584     964      260   \n",
       "2                53          99          1585     964      260   \n",
       "3                54         100          1586     964      260   \n",
       "4                55         104          1590     964      260   \n",
       "...             ...         ...           ...     ...      ...   \n",
       "49912         50146      109241        390890  138280   108981   \n",
       "49913         50176      109289        390938  138280   112940   \n",
       "49914         50177      109290        390939  138280   112940   \n",
       "49915         50189      109310        390959  138280   117871   \n",
       "49916         50190      109311        390960  138280   117871   \n",
       "\n",
       "                    tag            timestamp     un-lemmatised  \\\n",
       "0                     s  2015-02-20 22:42:49               NaN   \n",
       "1                action  2010-05-30 03:36:40            action   \n",
       "2             adventure  2010-05-30 03:36:37         adventure   \n",
       "3           atmospheric  2010-05-30 03:36:38       atmospheric   \n",
       "4               stylize  2010-05-30 03:36:32          stylized   \n",
       "...                 ...                  ...               ...   \n",
       "49912         sexuality  2014-02-14 21:49:07         sexuality   \n",
       "49913  counterespionage  2014-12-27 18:19:58  counterespionage   \n",
       "49914              slow  2014-12-27 18:20:04              slow   \n",
       "49915             image  2015-01-30 23:09:16             image   \n",
       "49916             story  2015-01-30 23:09:25             story   \n",
       "\n",
       "                                               glove_vec  has_glove_vec  \\\n",
       "0      [ 0.18209    0.88297   -0.49805    0.53137   -...           True   \n",
       "1      [ 2.0240e-02  8.4992e-01 -7.8150e-01 -8.2769e-...           True   \n",
       "2      [ 0.094151   0.49795   -0.87618   -0.66309    ...           True   \n",
       "3      [ 0.13512   -0.23763   -0.1364    -0.25487    ...           True   \n",
       "4      [0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. ...          False   \n",
       "...                                                  ...            ...   \n",
       "49912  [ 2.7006e-01  3.4214e-01  4.9813e-01 -4.3149e-...           True   \n",
       "49913  [ 0.11309   -0.8528    -0.25529    0.02635   -...           True   \n",
       "49914  [ 0.37381    0.017462  -0.77856    0.35216   -...           True   \n",
       "49915  [ 1.1091e-02  4.8461e-01  1.9142e-02  8.3725e-...           True   \n",
       "49916  [-0.35058    0.58245   -0.065584  -0.41768    ...           True   \n",
       "\n",
       "                                    final_context_vector  \n",
       "0      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "1      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "2      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "3      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "4      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "...                                                  ...  \n",
       "49912  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "49913  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "49914  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "49915  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "49916  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...  \n",
       "\n",
       "[49630 rows x 11 columns]"
      ]
     },
     "execution_count": 86,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tag_cv"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Reading the genre glove vec into a dictionary"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 87,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pickle\n",
    "\n",
    "# Reading from file\n",
    "with open('../pretrain_model/genre_glove_vec.pkl', 'rb') as f:\n",
    "    genre_glove_vec = pickle.load(f)\n",
    "\n",
    "# loaded_genre_glove_vec now contains your original dictionary\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 88,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>movieId</th>\n",
       "      <th>genres</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>['Adventure', 'Animation', 'Children', 'Comedy...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>['Adventure', 'Children', 'Fantasy']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>4</td>\n",
       "      <td>['Comedy', 'Drama', 'Romance']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>5</td>\n",
       "      <td>['Comedy']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>6</td>\n",
       "      <td>['Action', 'Crime', 'Thriller']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6178</th>\n",
       "      <td>130856</td>\n",
       "      <td>['Comedy', 'Documentary']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6179</th>\n",
       "      <td>130958</td>\n",
       "      <td>['Horror']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6180</th>\n",
       "      <td>130984</td>\n",
       "      <td>['Action', 'Fantasy', 'Horror']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6181</th>\n",
       "      <td>131011</td>\n",
       "      <td>['Crime', 'Drama']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6182</th>\n",
       "      <td>131015</td>\n",
       "      <td>['Horror', 'Thriller']</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>6183 rows × 2 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      movieId                                             genres\n",
       "0           1  ['Adventure', 'Animation', 'Children', 'Comedy...\n",
       "1           2               ['Adventure', 'Children', 'Fantasy']\n",
       "2           4                     ['Comedy', 'Drama', 'Romance']\n",
       "3           5                                         ['Comedy']\n",
       "4           6                    ['Action', 'Crime', 'Thriller']\n",
       "...       ...                                                ...\n",
       "6178   130856                          ['Comedy', 'Documentary']\n",
       "6179   130958                                         ['Horror']\n",
       "6180   130984                    ['Action', 'Fantasy', 'Horror']\n",
       "6181   131011                                 ['Crime', 'Drama']\n",
       "6182   131015                             ['Horror', 'Thriller']\n",
       "\n",
       "[6183 rows x 2 columns]"
      ]
     },
     "execution_count": 88,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# loading in the movie and genre df\n",
    "df_mg = pd.read_csv(\"../dataset/movie_genre.csv\")\n",
    "df_mg"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 89,
   "metadata": {},
   "outputs": [],
   "source": [
    "# join to main df 'tag_cv'\n",
    "\n",
    "tag_cv = pd.merge(tag_cv, df_mg, on='movieId')\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 90,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0.2</th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>Unnamed: 0.1</th>\n",
       "      <th>userId</th>\n",
       "      <th>movieId</th>\n",
       "      <th>tag</th>\n",
       "      <th>timestamp</th>\n",
       "      <th>un-lemmatised</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>has_glove_vec</th>\n",
       "      <th>final_context_vector</th>\n",
       "      <th>genres</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>7</td>\n",
       "      <td>266</td>\n",
       "      <td>318</td>\n",
       "      <td>260</td>\n",
       "      <td>s</td>\n",
       "      <td>2015-02-20 22:42:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[ 0.18209    0.88297   -0.49805    0.53137   -...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Action', 'Adventure', 'Sci-Fi']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>52</td>\n",
       "      <td>98</td>\n",
       "      <td>1584</td>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>2010-05-30 03:36:40</td>\n",
       "      <td>action</td>\n",
       "      <td>[ 2.0240e-02  8.4992e-01 -7.8150e-01 -8.2769e-...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Action', 'Adventure', 'Sci-Fi']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>53</td>\n",
       "      <td>99</td>\n",
       "      <td>1585</td>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>adventure</td>\n",
       "      <td>2010-05-30 03:36:37</td>\n",
       "      <td>adventure</td>\n",
       "      <td>[ 0.094151   0.49795   -0.87618   -0.66309    ...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Action', 'Adventure', 'Sci-Fi']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>54</td>\n",
       "      <td>100</td>\n",
       "      <td>1586</td>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>atmospheric</td>\n",
       "      <td>2010-05-30 03:36:38</td>\n",
       "      <td>atmospheric</td>\n",
       "      <td>[ 0.13512   -0.23763   -0.1364    -0.25487    ...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Action', 'Adventure', 'Sci-Fi']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>55</td>\n",
       "      <td>104</td>\n",
       "      <td>1590</td>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>stylize</td>\n",
       "      <td>2010-05-30 03:36:32</td>\n",
       "      <td>stylized</td>\n",
       "      <td>[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. ...</td>\n",
       "      <td>False</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Action', 'Adventure', 'Sci-Fi']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49625</th>\n",
       "      <td>50146</td>\n",
       "      <td>109241</td>\n",
       "      <td>390890</td>\n",
       "      <td>138280</td>\n",
       "      <td>108981</td>\n",
       "      <td>sexuality</td>\n",
       "      <td>2014-02-14 21:49:07</td>\n",
       "      <td>sexuality</td>\n",
       "      <td>[ 2.7006e-01  3.4214e-01  4.9813e-01 -4.3149e-...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Drama', 'Mystery']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49626</th>\n",
       "      <td>50176</td>\n",
       "      <td>109289</td>\n",
       "      <td>390938</td>\n",
       "      <td>138280</td>\n",
       "      <td>112940</td>\n",
       "      <td>counterespionage</td>\n",
       "      <td>2014-12-27 18:19:58</td>\n",
       "      <td>counterespionage</td>\n",
       "      <td>[ 0.11309   -0.8528    -0.25529    0.02635   -...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Thriller']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49627</th>\n",
       "      <td>50177</td>\n",
       "      <td>109290</td>\n",
       "      <td>390939</td>\n",
       "      <td>138280</td>\n",
       "      <td>112940</td>\n",
       "      <td>slow</td>\n",
       "      <td>2014-12-27 18:20:04</td>\n",
       "      <td>slow</td>\n",
       "      <td>[ 0.37381    0.017462  -0.77856    0.35216   -...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Thriller']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49628</th>\n",
       "      <td>50189</td>\n",
       "      <td>109310</td>\n",
       "      <td>390959</td>\n",
       "      <td>138280</td>\n",
       "      <td>117871</td>\n",
       "      <td>image</td>\n",
       "      <td>2015-01-30 23:09:16</td>\n",
       "      <td>image</td>\n",
       "      <td>[ 1.1091e-02  4.8461e-01  1.9142e-02  8.3725e-...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Action', 'Drama', 'War']</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49629</th>\n",
       "      <td>50190</td>\n",
       "      <td>109311</td>\n",
       "      <td>390960</td>\n",
       "      <td>138280</td>\n",
       "      <td>117871</td>\n",
       "      <td>story</td>\n",
       "      <td>2015-01-30 23:09:25</td>\n",
       "      <td>story</td>\n",
       "      <td>[-0.35058    0.58245   -0.065584  -0.41768    ...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Action', 'Drama', 'War']</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>49630 rows × 12 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "       Unnamed: 0.2  Unnamed: 0  Unnamed: 0.1  userId  movieId  \\\n",
       "0                 0           7           266     318      260   \n",
       "1                52          98          1584     964      260   \n",
       "2                53          99          1585     964      260   \n",
       "3                54         100          1586     964      260   \n",
       "4                55         104          1590     964      260   \n",
       "...             ...         ...           ...     ...      ...   \n",
       "49625         50146      109241        390890  138280   108981   \n",
       "49626         50176      109289        390938  138280   112940   \n",
       "49627         50177      109290        390939  138280   112940   \n",
       "49628         50189      109310        390959  138280   117871   \n",
       "49629         50190      109311        390960  138280   117871   \n",
       "\n",
       "                    tag            timestamp     un-lemmatised  \\\n",
       "0                     s  2015-02-20 22:42:49               NaN   \n",
       "1                action  2010-05-30 03:36:40            action   \n",
       "2             adventure  2010-05-30 03:36:37         adventure   \n",
       "3           atmospheric  2010-05-30 03:36:38       atmospheric   \n",
       "4               stylize  2010-05-30 03:36:32          stylized   \n",
       "...                 ...                  ...               ...   \n",
       "49625         sexuality  2014-02-14 21:49:07         sexuality   \n",
       "49626  counterespionage  2014-12-27 18:19:58  counterespionage   \n",
       "49627              slow  2014-12-27 18:20:04              slow   \n",
       "49628             image  2015-01-30 23:09:16             image   \n",
       "49629             story  2015-01-30 23:09:25             story   \n",
       "\n",
       "                                               glove_vec  has_glove_vec  \\\n",
       "0      [ 0.18209    0.88297   -0.49805    0.53137   -...           True   \n",
       "1      [ 2.0240e-02  8.4992e-01 -7.8150e-01 -8.2769e-...           True   \n",
       "2      [ 0.094151   0.49795   -0.87618   -0.66309    ...           True   \n",
       "3      [ 0.13512   -0.23763   -0.1364    -0.25487    ...           True   \n",
       "4      [0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. ...          False   \n",
       "...                                                  ...            ...   \n",
       "49625  [ 2.7006e-01  3.4214e-01  4.9813e-01 -4.3149e-...           True   \n",
       "49626  [ 0.11309   -0.8528    -0.25529    0.02635   -...           True   \n",
       "49627  [ 0.37381    0.017462  -0.77856    0.35216   -...           True   \n",
       "49628  [ 1.1091e-02  4.8461e-01  1.9142e-02  8.3725e-...           True   \n",
       "49629  [-0.35058    0.58245   -0.065584  -0.41768    ...           True   \n",
       "\n",
       "                                    final_context_vector  \\\n",
       "0      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "1      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "2      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "3      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "4      [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "...                                                  ...   \n",
       "49625  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "49626  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "49627  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "49628  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "49629  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "\n",
       "                                  genres  \n",
       "0      ['Action', 'Adventure', 'Sci-Fi']  \n",
       "1      ['Action', 'Adventure', 'Sci-Fi']  \n",
       "2      ['Action', 'Adventure', 'Sci-Fi']  \n",
       "3      ['Action', 'Adventure', 'Sci-Fi']  \n",
       "4      ['Action', 'Adventure', 'Sci-Fi']  \n",
       "...                                  ...  \n",
       "49625               ['Drama', 'Mystery']  \n",
       "49626                       ['Thriller']  \n",
       "49627                       ['Thriller']  \n",
       "49628         ['Action', 'Drama', 'War']  \n",
       "49629         ['Action', 'Drama', 'War']  \n",
       "\n",
       "[49630 rows x 12 columns]"
      ]
     },
     "execution_count": 90,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tag_cv"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### WSD using the Context Vector of Movie Synopsis and Genre GloVe vectors "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 91,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "from sklearn.neighbors import KernelDensity\n",
    "from sklearn.metrics.pairwise import cosine_similarity\n",
    "from nltk.corpus import wordnet as wn\n",
    "import pandas as pd\n",
    "\n",
    "def get_word_senses(word):\n",
    "    \"\"\"Retrieve all possible senses of a word from WordNet.\"\"\"\n",
    "    return wn.synsets(word)\n",
    "\n",
    "def compute_kde(x, y):\n",
    "    \"\"\"Compute the KDE score between two vectors.\"\"\"\n",
    "    kde = KernelDensity()\n",
    "    kde.fit(x.reshape(-1, 1))\n",
    "    log_dens = kde.score_samples(y.reshape(-1, 1))\n",
    "    return np.exp(log_dens).mean()\n",
    "\n",
    "def convert_synset_to_vector(synset, glove_vec):\n",
    "    \"\"\"Convert WordNet synset to GloVe vector by averaging lemma vectors.\"\"\"\n",
    "    lemma_names = synset.lemma_names()\n",
    "    vectors = [glove_vec.get(lemma, np.zeros((200,))) for lemma in lemma_names]\n",
    "    if len(vectors) == 0:\n",
    "        return np.zeros((200,))\n",
    "    return np.mean(vectors, axis=0)\n",
    "\n",
    "def get_max_similarity_genre(genres, sense_vector, genre_glove_vec):\n",
    "    \"\"\"Find the genre with the maximum similarity.\"\"\"\n",
    "    max_similarity = float('-inf')\n",
    "    max_genre = None\n",
    "    \n",
    "    for genre in genres:\n",
    "        genre_vec = np.array(genre_glove_vec.get(genre, np.zeros((200,))))\n",
    "        similarity = cosine_similarity(sense_vector.reshape(1, -1), genre_vec.reshape(1, -1))\n",
    "        \n",
    "        if similarity > max_similarity:\n",
    "            max_similarity = similarity\n",
    "            max_genre = genre\n",
    "\n",
    "    return max_genre, max_similarity\n",
    "\n",
    "def disambiguate_word_sense(row, glove_vec, genre_glove_vec):\n",
    "    \"\"\"Disambiguate the sense of a word using the context vector and genre.\"\"\"\n",
    "    word = row['tag']\n",
    "    context_vector = np.array(row['final_context_vector'])\n",
    "    genres = row['genres']\n",
    "    \n",
    "    expected_shape = 200\n",
    "    if context_vector.shape != (expected_shape,):\n",
    "        raise ValueError(f\"Invalid shape for context_vector: {context_vector.shape}\")\n",
    "\n",
    "    senses = get_word_senses(word)\n",
    "    if not senses:\n",
    "        return word, 0.0\n",
    "    \n",
    "    max_prob = float('-inf')\n",
    "    best_sense = None\n",
    "    \n",
    "    for sense in senses:\n",
    "        sense_vector = convert_synset_to_vector(sense, glove_vec)\n",
    "        \n",
    "        if sense_vector.shape != (expected_shape,):\n",
    "            raise ValueError(f\"Invalid shape for sense_vector: {sense_vector.shape}\")\n",
    "\n",
    "        prob_density_context = compute_kde(sense_vector.reshape(-1, 1), context_vector.reshape(-1, 1))\n",
    "        max_genre, prob_density_genre = get_max_similarity_genre(genres, sense_vector, genre_glove_vec)\n",
    "        \n",
    "        prob_density = max(prob_density_context, prob_density_genre)\n",
    "        \n",
    "        if prob_density > max_prob:\n",
    "            max_prob = prob_density\n",
    "            best_sense = sense.name()\n",
    "    \n",
    "    return best_sense, max_prob\n",
    "\n",
    "# Assuming tag_cv, glove_vec, and genre_glove_vec are available\n",
    "tag_cv['disambiguated_sense'], tag_cv['confidence'] = zip(*tag_cv.apply(lambda row: disambiguate_word_sense(row, glove_vec, genre_glove_vec), axis=1))\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 96,
   "metadata": {},
   "outputs": [],
   "source": [
    "# tag_cv.drop(columns=['Unnamed: 0','Unnamed: 0.1','Unnamed: 0.2'], inplace=True)\n",
    "tag_cv.to_csv(\"../dataset/tag_cv.csv\",index=False)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Output of the WSD\n",
    "- 2 additional columns: disambiguated_sense and confidence \n",
    "\n",
    "disambiguated_sense: This column will contain the WordNet synset that has the highest Kernel Density Estimation (KDE) score when compared to the final_context_vector for each row. The synset is a specific sense or meaning of the word (tag) in the same row.\n",
    "\n",
    "confidence: This column will contain the KDE score for the chosen disambiguated_sense, which gives an idea of how well the sense matches the context. The higher the KDE score, the more \"confident\" the model is that the chosen sense is correct."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 97,
   "metadata": {},
   "outputs": [],
   "source": [
    "tag_cv"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 93,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0\n",
      "[<class 'list'>]\n"
     ]
    }
   ],
   "source": [
    "print(tag_cv['final_context_vector'].isna().sum())  # Count NaN values\n",
    "print(tag_cv['final_context_vector'].apply(type).unique())  # Check types\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 103,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>userId</th>\n",
       "      <th>movieId</th>\n",
       "      <th>tag</th>\n",
       "      <th>disambiguated_sense</th>\n",
       "      <th>confidence</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>318</td>\n",
       "      <td>260</td>\n",
       "      <td>s</td>\n",
       "      <td>mho.n.01</td>\n",
       "      <td>0.396197</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>legal_action.n.01</td>\n",
       "      <td>0.395202</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>adventure</td>\n",
       "      <td>adventure.n.01</td>\n",
       "      <td>0.394330</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>atmospheric</td>\n",
       "      <td>atmospheric.a.01</td>\n",
       "      <td>0.388486</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>stylize</td>\n",
       "      <td>stylize.v.01</td>\n",
       "      <td>0.398942</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49625</th>\n",
       "      <td>138280</td>\n",
       "      <td>108981</td>\n",
       "      <td>sexuality</td>\n",
       "      <td>sex.n.04</td>\n",
       "      <td>0.370642</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49626</th>\n",
       "      <td>138280</td>\n",
       "      <td>112940</td>\n",
       "      <td>counterespionage</td>\n",
       "      <td>counterespionage.n.01</td>\n",
       "      <td>0.367513</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49627</th>\n",
       "      <td>138280</td>\n",
       "      <td>112940</td>\n",
       "      <td>slow</td>\n",
       "      <td>slow.v.03</td>\n",
       "      <td>0.395033</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49628</th>\n",
       "      <td>138280</td>\n",
       "      <td>117871</td>\n",
       "      <td>image</td>\n",
       "      <td>trope.n.01</td>\n",
       "      <td>0.390764</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49629</th>\n",
       "      <td>138280</td>\n",
       "      <td>117871</td>\n",
       "      <td>story</td>\n",
       "      <td>fib.n.01</td>\n",
       "      <td>0.393206</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>49630 rows × 5 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "       userId  movieId               tag    disambiguated_sense  confidence\n",
       "0         318      260                 s               mho.n.01    0.396197\n",
       "1         964      260            action      legal_action.n.01    0.395202\n",
       "2         964      260         adventure         adventure.n.01    0.394330\n",
       "3         964      260       atmospheric       atmospheric.a.01    0.388486\n",
       "4         964      260           stylize           stylize.v.01    0.398942\n",
       "...       ...      ...               ...                    ...         ...\n",
       "49625  138280   108981         sexuality               sex.n.04    0.370642\n",
       "49626  138280   112940  counterespionage  counterespionage.n.01    0.367513\n",
       "49627  138280   112940              slow              slow.v.03    0.395033\n",
       "49628  138280   117871             image             trope.n.01    0.390764\n",
       "49629  138280   117871             story               fib.n.01    0.393206\n",
       "\n",
       "[49630 rows x 5 columns]"
      ]
     },
     "execution_count": 103,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_wsd = tag_cv[['userId','movieId','tag','disambiguated_sense','confidence']]\n",
    "df_wsd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 104,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "             tag           disambiguated_sense  confidence\n",
      "20064      death                    death.n.06    0.398942\n",
      "33324  holocaust                holocaust.n.02    0.398942\n",
      "33330       john                     john.n.02    0.398942\n",
      "5290         elf  extremely_low_frequency.n.01    0.398942\n",
      "5289   christmas                christmas.n.01    0.398942\n",
      "20434  australia                australia.n.01    0.398942\n",
      "40031    british                  british.n.01    0.398942\n",
      "20433      china                    china.n.01    0.398942\n",
      "5280      gothic                   gothic.n.01    0.398942\n",
      "28583     greece                   greece.n.01    0.398942\n",
      "33327       goth                     goth.n.02    0.398942\n",
      "40044       gore                     gore.n.01    0.398942\n",
      "28582    stylize                  stylize.v.01    0.398942\n",
      "33315     circus                   circus.n.06    0.398942\n"
     ]
    }
   ],
   "source": [
    "sorted_df = df_wsd[[\"tag\", \"disambiguated_sense\", \"confidence\"]].sort_values(by=\"confidence\", ascending=False).head(20)\n",
    "\n",
    "distinct_tags_df = sorted_df.drop_duplicates(subset=[\"tag\"]).copy()\n",
    "print(distinct_tags_df[[\"tag\", \"disambiguated_sense\", \"confidence\"]])\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 105,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>userId</th>\n",
       "      <th>movieId</th>\n",
       "      <th>tag</th>\n",
       "      <th>disambiguated_sense</th>\n",
       "      <th>confidence</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "Empty DataFrame\n",
       "Columns: [userId, movieId, tag, disambiguated_sense, confidence]\n",
       "Index: []"
      ]
     },
     "execution_count": 105,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_wsd[df_wsd['tag'] == '']"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Tag Recommendation\n",
    "Cascading effect by using the output of the CF model as a starting point for recommendation\n",
    "\n",
    "1. Take in the recommendations from the CF model k x (movieId, sentiment)\n",
    "2. We will use these recommendations as a lookup table on userId. \n",
    "3. The (movieId, sentiment) serves as a preliminary filter for the CB filtering process\n",
    "4. For each movieId in the list of k recommendations, filter on the tags that have been applied to that movieId by other users. \n",
    "5. Compute similarity scores between the tags that have been applied to the movie with the tag of a user.\n",
    "    - Done using the CB features we calculated\n",
    "6. (Assuming the sentiment feature has been brought in already): use the sentiment part of the CF recommendation to refine the similar tags from step 5 -> making sure the sentiment of the tag is the same as the sentiment given from the CF movie. \n",
    "7. Tag recommendation "
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### get the recommendations (movieId, sentiment) from CF model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 106,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>userId</th>\n",
       "      <th>recommendations</th>\n",
       "      <th>tags_movies</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>318</td>\n",
       "      <td>[[260, 0.1389], [780, 0.1588], [1196, 0.294600...</td>\n",
       "      <td>[[260, [action, space, luke, sequel, robot, he...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2274</td>\n",
       "      <td>[[2762, 0.1212], [2959, 0.1212], [3996, 0.2166...</td>\n",
       "      <td>[[2762, [nan, enigmatic, thriller, unpredictab...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3031</td>\n",
       "      <td>[[70, -0.49810000000000004], [353, 0.25], [805...</td>\n",
       "      <td>[[70, [gore, brother, vampire, intense, nan, s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4087</td>\n",
       "      <td>[[296, 0.0051], [805, 0.2713], [1136, 0.205000...</td>\n",
       "      <td>[[296, [action, rivet, masterpiece, drug, dial...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4450</td>\n",
       "      <td>[[1994, 0.1524], [4995, 0.20500000000000002], ...</td>\n",
       "      <td>[[1994, [thriller, ghost]], [4995, [education,...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1547</th>\n",
       "      <td>117265</td>\n",
       "      <td>[[47, 0.176], [50, 0.1822], [356, 0.1751], [10...</td>\n",
       "      <td>[[47, [overrate, investigation, philosophical,...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1548</th>\n",
       "      <td>117607</td>\n",
       "      <td>[[1257, 0.1369], [1748, 0.1617], [2916, -0.027...</td>\n",
       "      <td>[[1257, [imagination, goofy, silly, skiing, qu...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1549</th>\n",
       "      <td>123915</td>\n",
       "      <td>[[1, 0.1628], [22, -0.2524], [70, 0.1625], [11...</td>\n",
       "      <td>[[1, [woody, adventure, watch, buy, comedy, fa...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1550</th>\n",
       "      <td>127468</td>\n",
       "      <td>[[12, 0.1932], [21, 0.16040000000000001], [26,...</td>\n",
       "      <td>[[12, [vampire, gothic]], [21, [mafia, hollywo...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1551</th>\n",
       "      <td>136810</td>\n",
       "      <td>[[32, 0.13140000000000002], [436, 0.1314000000...</td>\n",
       "      <td>[[32, [interest, british, genetics, original, ...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>1552 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      userId                                    recommendations  \\\n",
       "0        318  [[260, 0.1389], [780, 0.1588], [1196, 0.294600...   \n",
       "1       2274  [[2762, 0.1212], [2959, 0.1212], [3996, 0.2166...   \n",
       "2       3031  [[70, -0.49810000000000004], [353, 0.25], [805...   \n",
       "3       4087  [[296, 0.0051], [805, 0.2713], [1136, 0.205000...   \n",
       "4       4450  [[1994, 0.1524], [4995, 0.20500000000000002], ...   \n",
       "...      ...                                                ...   \n",
       "1547  117265  [[47, 0.176], [50, 0.1822], [356, 0.1751], [10...   \n",
       "1548  117607  [[1257, 0.1369], [1748, 0.1617], [2916, -0.027...   \n",
       "1549  123915  [[1, 0.1628], [22, -0.2524], [70, 0.1625], [11...   \n",
       "1550  127468  [[12, 0.1932], [21, 0.16040000000000001], [26,...   \n",
       "1551  136810  [[32, 0.13140000000000002], [436, 0.1314000000...   \n",
       "\n",
       "                                            tags_movies  \n",
       "0     [[260, [action, space, luke, sequel, robot, he...  \n",
       "1     [[2762, [nan, enigmatic, thriller, unpredictab...  \n",
       "2     [[70, [gore, brother, vampire, intense, nan, s...  \n",
       "3     [[296, [action, rivet, masterpiece, drug, dial...  \n",
       "4     [[1994, [thriller, ghost]], [4995, [education,...  \n",
       "...                                                 ...  \n",
       "1547  [[47, [overrate, investigation, philosophical,...  \n",
       "1548  [[1257, [imagination, goofy, silly, skiing, qu...  \n",
       "1549  [[1, [woody, adventure, watch, buy, comedy, fa...  \n",
       "1550  [[12, [vampire, gothic]], [21, [mafia, hollywo...  \n",
       "1551  [[32, [interest, british, genetics, original, ...  \n",
       "\n",
       "[1552 rows x 3 columns]"
      ]
     },
     "execution_count": 106,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_rec = pd.read_json('../dataset/df_rec.json', orient='split')\n",
    "df_rec\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 107,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>userId</th>\n",
       "      <th>recommendations</th>\n",
       "      <th>tags_movies</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>318</td>\n",
       "      <td>[(260, 0.1389), (780, 0.1588), (1196, 0.2946),...</td>\n",
       "      <td>[[260, [action, space, luke, sequel, robot, he...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2274</td>\n",
       "      <td>[(2762, 0.1212), (2959, 0.1212), (3996, 0.2166...</td>\n",
       "      <td>[[2762, [nan, enigmatic, thriller, unpredictab...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3031</td>\n",
       "      <td>[(70, -0.4981), (353, 0.25), (805, 0.25), (487...</td>\n",
       "      <td>[[70, [gore, brother, vampire, intense, nan, s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4087</td>\n",
       "      <td>[(296, 0.0051), (805, 0.2713), (1136, 0.205), ...</td>\n",
       "      <td>[[296, [action, rivet, masterpiece, drug, dial...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4450</td>\n",
       "      <td>[(1994, 0.1524), (4995, 0.205), (4226, 0.145),...</td>\n",
       "      <td>[[1994, [thriller, ghost]], [4995, [education,...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1547</th>\n",
       "      <td>117265</td>\n",
       "      <td>[(47, 0.176), (50, 0.1822), (356, 0.1751), (10...</td>\n",
       "      <td>[[47, [overrate, investigation, philosophical,...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1548</th>\n",
       "      <td>117607</td>\n",
       "      <td>[(1257, 0.1369), (1748, 0.1617), (2916, -0.027...</td>\n",
       "      <td>[[1257, [imagination, goofy, silly, skiing, qu...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1549</th>\n",
       "      <td>123915</td>\n",
       "      <td>[(1, 0.1628), (22, -0.2524), (70, 0.1625), (11...</td>\n",
       "      <td>[[1, [woody, adventure, watch, buy, comedy, fa...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1550</th>\n",
       "      <td>127468</td>\n",
       "      <td>[(12, 0.1932), (21, 0.1604), (26, 0.1674), (32...</td>\n",
       "      <td>[[12, [vampire, gothic]], [21, [mafia, hollywo...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1551</th>\n",
       "      <td>136810</td>\n",
       "      <td>[(32, 0.1314), (436, 0.1314), (593, 0.1314), (...</td>\n",
       "      <td>[[32, [interest, british, genetics, original, ...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>1552 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      userId                                    recommendations  \\\n",
       "0        318  [(260, 0.1389), (780, 0.1588), (1196, 0.2946),...   \n",
       "1       2274  [(2762, 0.1212), (2959, 0.1212), (3996, 0.2166...   \n",
       "2       3031  [(70, -0.4981), (353, 0.25), (805, 0.25), (487...   \n",
       "3       4087  [(296, 0.0051), (805, 0.2713), (1136, 0.205), ...   \n",
       "4       4450  [(1994, 0.1524), (4995, 0.205), (4226, 0.145),...   \n",
       "...      ...                                                ...   \n",
       "1547  117265  [(47, 0.176), (50, 0.1822), (356, 0.1751), (10...   \n",
       "1548  117607  [(1257, 0.1369), (1748, 0.1617), (2916, -0.027...   \n",
       "1549  123915  [(1, 0.1628), (22, -0.2524), (70, 0.1625), (11...   \n",
       "1550  127468  [(12, 0.1932), (21, 0.1604), (26, 0.1674), (32...   \n",
       "1551  136810  [(32, 0.1314), (436, 0.1314), (593, 0.1314), (...   \n",
       "\n",
       "                                            tags_movies  \n",
       "0     [[260, [action, space, luke, sequel, robot, he...  \n",
       "1     [[2762, [nan, enigmatic, thriller, unpredictab...  \n",
       "2     [[70, [gore, brother, vampire, intense, nan, s...  \n",
       "3     [[296, [action, rivet, masterpiece, drug, dial...  \n",
       "4     [[1994, [thriller, ghost]], [4995, [education,...  \n",
       "...                                                 ...  \n",
       "1547  [[47, [overrate, investigation, philosophical,...  \n",
       "1548  [[1257, [imagination, goofy, silly, skiing, qu...  \n",
       "1549  [[1, [woody, adventure, watch, buy, comedy, fa...  \n",
       "1550  [[12, [vampire, gothic]], [21, [mafia, hollywo...  \n",
       "1551  [[32, [interest, british, genetics, original, ...  \n",
       "\n",
       "[1552 rows x 3 columns]"
      ]
     },
     "execution_count": 107,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_rec['recommendations'] = df_rec['recommendations'].apply(lambda x: [(int(a), round(b, 4)) for a, b in x])\n",
    "df_rec"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### The (movieId, sentiment) serves as a preliminary filter for the CB filtering process \n",
    "\n",
    "- Provides a set of preliminary tags that the CB model can look at to refine and produce similar recommendationn\n",
    "\n",
    "For each movieId in the list of k recommendations, filter on the tags that have been applied to that movieId by other users. \n",
    "- So for each movieId - get the tags that have been applied by other users"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 108,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>userId</th>\n",
       "      <th>movieId</th>\n",
       "      <th>tag</th>\n",
       "      <th>timestamp</th>\n",
       "      <th>un-lemmatised</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>has_glove_vec</th>\n",
       "      <th>final_context_vector</th>\n",
       "      <th>genres</th>\n",
       "      <th>disambiguated_sense</th>\n",
       "      <th>confidence</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>318</td>\n",
       "      <td>260</td>\n",
       "      <td>s</td>\n",
       "      <td>2015-02-20 22:42:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>[ 0.18209    0.88297   -0.49805    0.53137   -...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Action', 'Adventure', 'Sci-Fi']</td>\n",
       "      <td>mho.n.01</td>\n",
       "      <td>0.396197</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>2010-05-30 03:36:40</td>\n",
       "      <td>action</td>\n",
       "      <td>[ 2.0240e-02  8.4992e-01 -7.8150e-01 -8.2769e-...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Action', 'Adventure', 'Sci-Fi']</td>\n",
       "      <td>legal_action.n.01</td>\n",
       "      <td>0.395202</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>adventure</td>\n",
       "      <td>2010-05-30 03:36:37</td>\n",
       "      <td>adventure</td>\n",
       "      <td>[ 0.094151   0.49795   -0.87618   -0.66309    ...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Action', 'Adventure', 'Sci-Fi']</td>\n",
       "      <td>adventure.n.01</td>\n",
       "      <td>0.394330</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>atmospheric</td>\n",
       "      <td>2010-05-30 03:36:38</td>\n",
       "      <td>atmospheric</td>\n",
       "      <td>[ 0.13512   -0.23763   -0.1364    -0.25487    ...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Action', 'Adventure', 'Sci-Fi']</td>\n",
       "      <td>atmospheric.a.01</td>\n",
       "      <td>0.388486</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>stylize</td>\n",
       "      <td>2010-05-30 03:36:32</td>\n",
       "      <td>stylized</td>\n",
       "      <td>[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. ...</td>\n",
       "      <td>False</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Action', 'Adventure', 'Sci-Fi']</td>\n",
       "      <td>stylize.v.01</td>\n",
       "      <td>0.398942</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49625</th>\n",
       "      <td>138280</td>\n",
       "      <td>108981</td>\n",
       "      <td>sexuality</td>\n",
       "      <td>2014-02-14 21:49:07</td>\n",
       "      <td>sexuality</td>\n",
       "      <td>[ 2.7006e-01  3.4214e-01  4.9813e-01 -4.3149e-...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Drama', 'Mystery']</td>\n",
       "      <td>sex.n.04</td>\n",
       "      <td>0.370642</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49626</th>\n",
       "      <td>138280</td>\n",
       "      <td>112940</td>\n",
       "      <td>counterespionage</td>\n",
       "      <td>2014-12-27 18:19:58</td>\n",
       "      <td>counterespionage</td>\n",
       "      <td>[ 0.11309   -0.8528    -0.25529    0.02635   -...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Thriller']</td>\n",
       "      <td>counterespionage.n.01</td>\n",
       "      <td>0.367513</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49627</th>\n",
       "      <td>138280</td>\n",
       "      <td>112940</td>\n",
       "      <td>slow</td>\n",
       "      <td>2014-12-27 18:20:04</td>\n",
       "      <td>slow</td>\n",
       "      <td>[ 0.37381    0.017462  -0.77856    0.35216   -...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Thriller']</td>\n",
       "      <td>slow.v.03</td>\n",
       "      <td>0.395033</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49628</th>\n",
       "      <td>138280</td>\n",
       "      <td>117871</td>\n",
       "      <td>image</td>\n",
       "      <td>2015-01-30 23:09:16</td>\n",
       "      <td>image</td>\n",
       "      <td>[ 1.1091e-02  4.8461e-01  1.9142e-02  8.3725e-...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Action', 'Drama', 'War']</td>\n",
       "      <td>trope.n.01</td>\n",
       "      <td>0.390764</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49629</th>\n",
       "      <td>138280</td>\n",
       "      <td>117871</td>\n",
       "      <td>story</td>\n",
       "      <td>2015-01-30 23:09:25</td>\n",
       "      <td>story</td>\n",
       "      <td>[-0.35058    0.58245   -0.065584  -0.41768    ...</td>\n",
       "      <td>True</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>['Action', 'Drama', 'War']</td>\n",
       "      <td>fib.n.01</td>\n",
       "      <td>0.393206</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>49630 rows × 11 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "       userId  movieId               tag            timestamp  \\\n",
       "0         318      260                 s  2015-02-20 22:42:49   \n",
       "1         964      260            action  2010-05-30 03:36:40   \n",
       "2         964      260         adventure  2010-05-30 03:36:37   \n",
       "3         964      260       atmospheric  2010-05-30 03:36:38   \n",
       "4         964      260           stylize  2010-05-30 03:36:32   \n",
       "...       ...      ...               ...                  ...   \n",
       "49625  138280   108981         sexuality  2014-02-14 21:49:07   \n",
       "49626  138280   112940  counterespionage  2014-12-27 18:19:58   \n",
       "49627  138280   112940              slow  2014-12-27 18:20:04   \n",
       "49628  138280   117871             image  2015-01-30 23:09:16   \n",
       "49629  138280   117871             story  2015-01-30 23:09:25   \n",
       "\n",
       "          un-lemmatised                                          glove_vec  \\\n",
       "0                   NaN  [ 0.18209    0.88297   -0.49805    0.53137   -...   \n",
       "1                action  [ 2.0240e-02  8.4992e-01 -7.8150e-01 -8.2769e-...   \n",
       "2             adventure  [ 0.094151   0.49795   -0.87618   -0.66309    ...   \n",
       "3           atmospheric  [ 0.13512   -0.23763   -0.1364    -0.25487    ...   \n",
       "4              stylized  [0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. ...   \n",
       "...                 ...                                                ...   \n",
       "49625         sexuality  [ 2.7006e-01  3.4214e-01  4.9813e-01 -4.3149e-...   \n",
       "49626  counterespionage  [ 0.11309   -0.8528    -0.25529    0.02635   -...   \n",
       "49627              slow  [ 0.37381    0.017462  -0.77856    0.35216   -...   \n",
       "49628             image  [ 1.1091e-02  4.8461e-01  1.9142e-02  8.3725e-...   \n",
       "49629             story  [-0.35058    0.58245   -0.065584  -0.41768    ...   \n",
       "\n",
       "       has_glove_vec                               final_context_vector  \\\n",
       "0               True  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "1               True  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "2               True  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "3               True  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "4              False  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "...              ...                                                ...   \n",
       "49625           True  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "49626           True  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "49627           True  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "49628           True  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "49629           True  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "\n",
       "                                  genres    disambiguated_sense  confidence  \n",
       "0      ['Action', 'Adventure', 'Sci-Fi']               mho.n.01    0.396197  \n",
       "1      ['Action', 'Adventure', 'Sci-Fi']      legal_action.n.01    0.395202  \n",
       "2      ['Action', 'Adventure', 'Sci-Fi']         adventure.n.01    0.394330  \n",
       "3      ['Action', 'Adventure', 'Sci-Fi']       atmospheric.a.01    0.388486  \n",
       "4      ['Action', 'Adventure', 'Sci-Fi']           stylize.v.01    0.398942  \n",
       "...                                  ...                    ...         ...  \n",
       "49625               ['Drama', 'Mystery']               sex.n.04    0.370642  \n",
       "49626                       ['Thriller']  counterespionage.n.01    0.367513  \n",
       "49627                       ['Thriller']              slow.v.03    0.395033  \n",
       "49628         ['Action', 'Drama', 'War']             trope.n.01    0.390764  \n",
       "49629         ['Action', 'Drama', 'War']               fib.n.01    0.393206  \n",
       "\n",
       "[49630 rows x 11 columns]"
      ]
     },
     "execution_count": 108,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tag_cv"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Merging all the content-based features into one dataframe\n",
    "- for ease of lookup \n",
    "\n",
    "Features: \n",
    "    - GloVe vectors - same gloVe vectors from previous\n",
    "    - POS tagging\n",
    "    - Sentiment\n",
    "    - NER - entities\n",
    "    - Tag Frequency \n",
    "    - Semantic clusters\n",
    "    - Word Sense Disambiguation (WSD) \n",
    "\n",
    "- WSD in separate dataframe (needs to be in conisderation with movieId)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "WSD dataframe"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 109,
   "metadata": {},
   "outputs": [],
   "source": [
    "df_wsd = tag_cv[['userId', 'movieId', 'tag', 'disambiguated_sense', 'confidence']].copy()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 110,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tag</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>s</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>action</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>twist</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>overrate</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>violent</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2893</th>\n",
       "      <td>newspaper</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2894</th>\n",
       "      <td>static</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2895</th>\n",
       "      <td>repeat</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2896</th>\n",
       "      <td>seal</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2897</th>\n",
       "      <td>counterespionage</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>2898 rows × 1 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                   tag\n",
       "0                    s\n",
       "1               action\n",
       "2                twist\n",
       "3             overrate\n",
       "4              violent\n",
       "...                ...\n",
       "2893         newspaper\n",
       "2894            static\n",
       "2895            repeat\n",
       "2896              seal\n",
       "2897  counterespionage\n",
       "\n",
       "[2898 rows x 1 columns]"
      ]
     },
     "execution_count": 110,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Creating a dataframe with only the distinct tags \n",
    "dist_tags = words[['tag']].drop_duplicates().reset_index(drop=True)\n",
    "dist_tags"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 111,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tag</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>ner_label</th>\n",
       "      <th>ner_model</th>\n",
       "      <th>POS</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>s</td>\n",
       "      <td>[0.18209, 0.88297, -0.49805, 0.53137, -0.36084...</td>\n",
       "      <td>O</td>\n",
       "      <td>[(s, O)]</td>\n",
       "      <td>PROPN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>s</td>\n",
       "      <td>[0.18209, 0.88297, -0.49805, 0.53137, -0.36084...</td>\n",
       "      <td>O</td>\n",
       "      <td>[(s, O)]</td>\n",
       "      <td>INTJ</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>action</td>\n",
       "      <td>[0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...</td>\n",
       "      <td>O</td>\n",
       "      <td>[(action, O)]</td>\n",
       "      <td>NOUN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>twist</td>\n",
       "      <td>[-0.095859, -0.17472, -0.034692, -0.37307, 0.3...</td>\n",
       "      <td>O</td>\n",
       "      <td>[(twist, O)]</td>\n",
       "      <td>NOUN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>twist</td>\n",
       "      <td>[-0.095859, -0.17472, -0.034692, -0.37307, 0.3...</td>\n",
       "      <td>O</td>\n",
       "      <td>[(twist, O)]</td>\n",
       "      <td>NOUN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3078</th>\n",
       "      <td>newspaper</td>\n",
       "      <td>[-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...</td>\n",
       "      <td>O</td>\n",
       "      <td>[(newspaper, O)]</td>\n",
       "      <td>NOUN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3079</th>\n",
       "      <td>static</td>\n",
       "      <td>[0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...</td>\n",
       "      <td>O</td>\n",
       "      <td>[(static, O)]</td>\n",
       "      <td>NOUN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3080</th>\n",
       "      <td>repeat</td>\n",
       "      <td>[0.48671, 0.93464, -0.015418, -0.46056, -0.152...</td>\n",
       "      <td>O</td>\n",
       "      <td>[(repeat, O)]</td>\n",
       "      <td>VERB</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3081</th>\n",
       "      <td>seal</td>\n",
       "      <td>[-0.35434, 0.51161, -0.086652, -0.23459, 0.435...</td>\n",
       "      <td>O</td>\n",
       "      <td>[(seal, O)]</td>\n",
       "      <td>NOUN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3082</th>\n",
       "      <td>counterespionage</td>\n",
       "      <td>[0.11309, -0.8528, -0.25529, 0.02635, -0.30105...</td>\n",
       "      <td>O</td>\n",
       "      <td>[(counterespionage, O)]</td>\n",
       "      <td>NOUN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>3083 rows × 5 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                   tag                                          glove_vec  \\\n",
       "0                    s  [0.18209, 0.88297, -0.49805, 0.53137, -0.36084...   \n",
       "1                    s  [0.18209, 0.88297, -0.49805, 0.53137, -0.36084...   \n",
       "2               action  [0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...   \n",
       "3                twist  [-0.095859, -0.17472, -0.034692, -0.37307, 0.3...   \n",
       "4                twist  [-0.095859, -0.17472, -0.034692, -0.37307, 0.3...   \n",
       "...                ...                                                ...   \n",
       "3078         newspaper  [-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...   \n",
       "3079            static  [0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...   \n",
       "3080            repeat  [0.48671, 0.93464, -0.015418, -0.46056, -0.152...   \n",
       "3081              seal  [-0.35434, 0.51161, -0.086652, -0.23459, 0.435...   \n",
       "3082  counterespionage  [0.11309, -0.8528, -0.25529, 0.02635, -0.30105...   \n",
       "\n",
       "     ner_label                ner_model    POS  \n",
       "0            O                 [(s, O)]  PROPN  \n",
       "1            O                 [(s, O)]   INTJ  \n",
       "2            O            [(action, O)]   NOUN  \n",
       "3            O             [(twist, O)]   NOUN  \n",
       "4            O             [(twist, O)]   NOUN  \n",
       "...        ...                      ...    ...  \n",
       "3078         O         [(newspaper, O)]   NOUN  \n",
       "3079         O            [(static, O)]   NOUN  \n",
       "3080         O            [(repeat, O)]   VERB  \n",
       "3081         O              [(seal, O)]   NOUN  \n",
       "3082         O  [(counterespionage, O)]   NOUN  \n",
       "\n",
       "[3083 rows x 5 columns]"
      ]
     },
     "execution_count": 111,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# placing the glove_vec to the df_feat dataframe, access in the \"words\"\n",
    "words\n",
    "\n",
    "words['ner_label'] = words['ner_model'].apply(lambda x: x[0][1] if x else None)\n",
    "words"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 112,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0.1</th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>tag</th>\n",
       "      <th>sentiment_roberta</th>\n",
       "      <th>sentiment_label</th>\n",
       "      <th>sentiment_value</th>\n",
       "      <th>scaled_sentiment_value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>s</td>\n",
       "      <td>('neutral', 0.5123)</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.5123</td>\n",
       "      <td>0.24385</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>action</td>\n",
       "      <td>('neutral', 0.6874)</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.6874</td>\n",
       "      <td>0.15630</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>twist</td>\n",
       "      <td>('neutral', 0.7575)</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.7575</td>\n",
       "      <td>0.12125</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>twist</td>\n",
       "      <td>('neutral', 0.7575)</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.7575</td>\n",
       "      <td>0.12125</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>overrate</td>\n",
       "      <td>('neutral', 0.5669)</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.5669</td>\n",
       "      <td>0.21655</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50186</th>\n",
       "      <td>50186</td>\n",
       "      <td>50186</td>\n",
       "      <td>history</td>\n",
       "      <td>('neutral', 0.6321)</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.6321</td>\n",
       "      <td>0.18395</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50187</th>\n",
       "      <td>50187</td>\n",
       "      <td>50187</td>\n",
       "      <td>informatics</td>\n",
       "      <td>('neutral', 0.7477)</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.7477</td>\n",
       "      <td>0.12615</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50188</th>\n",
       "      <td>50188</td>\n",
       "      <td>50188</td>\n",
       "      <td>mathematics</td>\n",
       "      <td>('neutral', 0.7053)</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.7053</td>\n",
       "      <td>0.14735</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50189</th>\n",
       "      <td>50189</td>\n",
       "      <td>50189</td>\n",
       "      <td>image</td>\n",
       "      <td>('neutral', 0.7328)</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.7328</td>\n",
       "      <td>0.13360</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50190</th>\n",
       "      <td>50190</td>\n",
       "      <td>50190</td>\n",
       "      <td>story</td>\n",
       "      <td>('neutral', 0.5695)</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.5695</td>\n",
       "      <td>0.21525</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>50191 rows × 7 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "       Unnamed: 0.1  Unnamed: 0          tag    sentiment_roberta  \\\n",
       "0                 0           0            s  ('neutral', 0.5123)   \n",
       "1                 1           1       action  ('neutral', 0.6874)   \n",
       "2                 2           2        twist  ('neutral', 0.7575)   \n",
       "3                 3           3        twist  ('neutral', 0.7575)   \n",
       "4                 4           4     overrate  ('neutral', 0.5669)   \n",
       "...             ...         ...          ...                  ...   \n",
       "50186         50186       50186      history  ('neutral', 0.6321)   \n",
       "50187         50187       50187  informatics  ('neutral', 0.7477)   \n",
       "50188         50188       50188  mathematics  ('neutral', 0.7053)   \n",
       "50189         50189       50189        image  ('neutral', 0.7328)   \n",
       "50190         50190       50190        story  ('neutral', 0.5695)   \n",
       "\n",
       "      sentiment_label  sentiment_value  scaled_sentiment_value  \n",
       "0             neutral           0.5123                 0.24385  \n",
       "1             neutral           0.6874                 0.15630  \n",
       "2             neutral           0.7575                 0.12125  \n",
       "3             neutral           0.7575                 0.12125  \n",
       "4             neutral           0.5669                 0.21655  \n",
       "...               ...              ...                     ...  \n",
       "50186         neutral           0.6321                 0.18395  \n",
       "50187         neutral           0.7477                 0.12615  \n",
       "50188         neutral           0.7053                 0.14735  \n",
       "50189         neutral           0.7328                 0.13360  \n",
       "50190         neutral           0.5695                 0.21525  \n",
       "\n",
       "[50191 rows x 7 columns]"
      ]
     },
     "execution_count": 112,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# reading in the sentiment df\n",
    "df_sent = pd.read_csv('../dataset/df_tag_sentiment.csv')\n",
    "df_sent"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 113,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tag</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>ner_label</th>\n",
       "      <th>POS</th>\n",
       "      <th>sentiment_label</th>\n",
       "      <th>scaled_sentiment_value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>s</td>\n",
       "      <td>[0.18209, 0.88297, -0.49805, 0.53137, -0.36084...</td>\n",
       "      <td>O</td>\n",
       "      <td>PROPN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.24385</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3568</th>\n",
       "      <td>action</td>\n",
       "      <td>[0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.15630</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4610</th>\n",
       "      <td>twist</td>\n",
       "      <td>[-0.095859, -0.17472, -0.034692, -0.37307, 0.3...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.12125</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5879</th>\n",
       "      <td>overrate</td>\n",
       "      <td>[0.28151, -0.42171, -0.38275, 0.15364, -0.7648...</td>\n",
       "      <td>O</td>\n",
       "      <td>VERB</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.21655</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6027</th>\n",
       "      <td>violent</td>\n",
       "      <td>[0.13693, 0.1856, -0.65335, -0.50922, -0.18431...</td>\n",
       "      <td>O</td>\n",
       "      <td>ADJ</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.25750</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>97104</th>\n",
       "      <td>newspaper</td>\n",
       "      <td>[-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.10295</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>97105</th>\n",
       "      <td>static</td>\n",
       "      <td>[0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>positive</td>\n",
       "      <td>0.76810</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>97106</th>\n",
       "      <td>repeat</td>\n",
       "      <td>[0.48671, 0.93464, -0.015418, -0.46056, -0.152...</td>\n",
       "      <td>O</td>\n",
       "      <td>VERB</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.19360</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>97107</th>\n",
       "      <td>seal</td>\n",
       "      <td>[-0.35434, 0.51161, -0.086652, -0.23459, 0.435...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.17375</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>97108</th>\n",
       "      <td>counterespionage</td>\n",
       "      <td>[0.11309, -0.8528, -0.25529, 0.02635, -0.30105...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.14290</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>2898 rows × 6 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                    tag                                          glove_vec  \\\n",
       "0                     s  [0.18209, 0.88297, -0.49805, 0.53137, -0.36084...   \n",
       "3568             action  [0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...   \n",
       "4610              twist  [-0.095859, -0.17472, -0.034692, -0.37307, 0.3...   \n",
       "5879           overrate  [0.28151, -0.42171, -0.38275, 0.15364, -0.7648...   \n",
       "6027            violent  [0.13693, 0.1856, -0.65335, -0.50922, -0.18431...   \n",
       "...                 ...                                                ...   \n",
       "97104         newspaper  [-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...   \n",
       "97105            static  [0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...   \n",
       "97106            repeat  [0.48671, 0.93464, -0.015418, -0.46056, -0.152...   \n",
       "97107              seal  [-0.35434, 0.51161, -0.086652, -0.23459, 0.435...   \n",
       "97108  counterespionage  [0.11309, -0.8528, -0.25529, 0.02635, -0.30105...   \n",
       "\n",
       "      ner_label    POS sentiment_label  scaled_sentiment_value  \n",
       "0             O  PROPN         neutral                 0.24385  \n",
       "3568          O   NOUN         neutral                 0.15630  \n",
       "4610          O   NOUN         neutral                 0.12125  \n",
       "5879          O   VERB         neutral                 0.21655  \n",
       "6027          O    ADJ         neutral                 0.25750  \n",
       "...         ...    ...             ...                     ...  \n",
       "97104         O   NOUN         neutral                 0.10295  \n",
       "97105         O   NOUN        positive                 0.76810  \n",
       "97106         O   VERB         neutral                 0.19360  \n",
       "97107         O   NOUN         neutral                 0.17375  \n",
       "97108         O   NOUN         neutral                 0.14290  \n",
       "\n",
       "[2898 rows x 6 columns]"
      ]
     },
     "execution_count": 113,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_feat = dist_tags.merge(words[['tag', 'glove_vec']], on='tag', how='left') # glove\n",
    "df_feat = df_feat.merge(words[['tag', 'ner_label']], on='tag', how='left') #ner\n",
    "df_feat = df_feat.merge(words[['tag', 'POS']], on='tag', how='left') # pos\n",
    "df_feat = df_feat.merge(df_sent[['tag', 'sentiment_label', 'scaled_sentiment_value']], on='tag', how='left') #sentiment \n",
    "\n",
    "\n",
    "df_feat.drop_duplicates(subset=['tag'], inplace=True)\n",
    "df_feat\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 137,
   "metadata": {},
   "outputs": [],
   "source": [
    "df_feat.to_json(\"../dataset/df_feat.json\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 115,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>userId</th>\n",
       "      <th>recommendations</th>\n",
       "      <th>tags_movies</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>318</td>\n",
       "      <td>[(260, 0.1389), (780, 0.1588), (1196, 0.2946),...</td>\n",
       "      <td>[[260, [action, space, luke, sequel, robot, he...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2274</td>\n",
       "      <td>[(2762, 0.1212), (2959, 0.1212), (3996, 0.2166...</td>\n",
       "      <td>[[2762, [nan, enigmatic, thriller, unpredictab...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3031</td>\n",
       "      <td>[(70, -0.4981), (353, 0.25), (805, 0.25), (487...</td>\n",
       "      <td>[[70, [gore, brother, vampire, intense, nan, s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4087</td>\n",
       "      <td>[(296, 0.0051), (805, 0.2713), (1136, 0.205), ...</td>\n",
       "      <td>[[296, [action, rivet, masterpiece, drug, dial...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4450</td>\n",
       "      <td>[(1994, 0.1524), (4995, 0.205), (4226, 0.145),...</td>\n",
       "      <td>[[1994, [thriller, ghost]], [4995, [education,...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1547</th>\n",
       "      <td>117265</td>\n",
       "      <td>[(47, 0.176), (50, 0.1822), (356, 0.1751), (10...</td>\n",
       "      <td>[[47, [overrate, investigation, philosophical,...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1548</th>\n",
       "      <td>117607</td>\n",
       "      <td>[(1257, 0.1369), (1748, 0.1617), (2916, -0.027...</td>\n",
       "      <td>[[1257, [imagination, goofy, silly, skiing, qu...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1549</th>\n",
       "      <td>123915</td>\n",
       "      <td>[(1, 0.1628), (22, -0.2524), (70, 0.1625), (11...</td>\n",
       "      <td>[[1, [woody, adventure, watch, buy, comedy, fa...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1550</th>\n",
       "      <td>127468</td>\n",
       "      <td>[(12, 0.1932), (21, 0.1604), (26, 0.1674), (32...</td>\n",
       "      <td>[[12, [vampire, gothic]], [21, [mafia, hollywo...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1551</th>\n",
       "      <td>136810</td>\n",
       "      <td>[(32, 0.1314), (436, 0.1314), (593, 0.1314), (...</td>\n",
       "      <td>[[32, [interest, british, genetics, original, ...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>1552 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      userId                                    recommendations  \\\n",
       "0        318  [(260, 0.1389), (780, 0.1588), (1196, 0.2946),...   \n",
       "1       2274  [(2762, 0.1212), (2959, 0.1212), (3996, 0.2166...   \n",
       "2       3031  [(70, -0.4981), (353, 0.25), (805, 0.25), (487...   \n",
       "3       4087  [(296, 0.0051), (805, 0.2713), (1136, 0.205), ...   \n",
       "4       4450  [(1994, 0.1524), (4995, 0.205), (4226, 0.145),...   \n",
       "...      ...                                                ...   \n",
       "1547  117265  [(47, 0.176), (50, 0.1822), (356, 0.1751), (10...   \n",
       "1548  117607  [(1257, 0.1369), (1748, 0.1617), (2916, -0.027...   \n",
       "1549  123915  [(1, 0.1628), (22, -0.2524), (70, 0.1625), (11...   \n",
       "1550  127468  [(12, 0.1932), (21, 0.1604), (26, 0.1674), (32...   \n",
       "1551  136810  [(32, 0.1314), (436, 0.1314), (593, 0.1314), (...   \n",
       "\n",
       "                                            tags_movies  \n",
       "0     [[260, [action, space, luke, sequel, robot, he...  \n",
       "1     [[2762, [nan, enigmatic, thriller, unpredictab...  \n",
       "2     [[70, [gore, brother, vampire, intense, nan, s...  \n",
       "3     [[296, [action, rivet, masterpiece, drug, dial...  \n",
       "4     [[1994, [thriller, ghost]], [4995, [education,...  \n",
       "...                                                 ...  \n",
       "1547  [[47, [overrate, investigation, philosophical,...  \n",
       "1548  [[1257, [imagination, goofy, silly, skiing, qu...  \n",
       "1549  [[1, [woody, adventure, watch, buy, comedy, fa...  \n",
       "1550  [[12, [vampire, gothic]], [21, [mafia, hollywo...  \n",
       "1551  [[32, [interest, british, genetics, original, ...  \n",
       "\n",
       "[1552 rows x 3 columns]"
      ]
     },
     "execution_count": 115,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_rec"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Recommendations using Similarity Metric \n",
    "- We will use a blend of similarity metrics as the similarity of some features will need certain metrics over others\n",
    "- For glove vectors, scaled_sentiment_value, term(tag) frequency, semantic clusters: exact match\n",
    "- For POS, disambiguated_sense, sentiment_label, ner: exact  matching\n",
    "\n",
    "\n",
    "**Since different similarity scores are used - we have to normalize each of the scores, then average to get final similarity score between tags**\n",
    "- why? otherwise one type of similarity may dominate others causing an imbalance in the final score "
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Try testing on a single user - and then evaluating the relevance of the recommendation\n",
    "- then we can pilot on other users \n",
    "\n",
    "get_user_recommendations: function gets movieId, sentiment pairs from df_rec, AND the tags that a user has applied previously - these tags will be used to calculate similarity with other tags for the content-based filtering. \n",
    "    - In terms of additional context, considering the tag, movieId for a user provides more nuanced recommendations and can be integrated in the context-aware model \n",
    "    - The WSD serves as an additional context layer already - as the movieId is considered here "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 116,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>userId</th>\n",
       "      <th>recommendations</th>\n",
       "      <th>tags_movies</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>318</td>\n",
       "      <td>[(260, 0.1389), (780, 0.1588), (1196, 0.2946),...</td>\n",
       "      <td>[[260, [action, space, luke, sequel, robot, he...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2274</td>\n",
       "      <td>[(2762, 0.1212), (2959, 0.1212), (3996, 0.2166...</td>\n",
       "      <td>[[2762, [nan, enigmatic, thriller, unpredictab...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3031</td>\n",
       "      <td>[(70, -0.4981), (353, 0.25), (805, 0.25), (487...</td>\n",
       "      <td>[[70, [gore, brother, vampire, intense, nan, s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4087</td>\n",
       "      <td>[(296, 0.0051), (805, 0.2713), (1136, 0.205), ...</td>\n",
       "      <td>[[296, [action, rivet, masterpiece, drug, dial...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4450</td>\n",
       "      <td>[(1994, 0.1524), (4995, 0.205), (4226, 0.145),...</td>\n",
       "      <td>[[1994, [thriller, ghost]], [4995, [education,...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1547</th>\n",
       "      <td>117265</td>\n",
       "      <td>[(47, 0.176), (50, 0.1822), (356, 0.1751), (10...</td>\n",
       "      <td>[[47, [overrate, investigation, philosophical,...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1548</th>\n",
       "      <td>117607</td>\n",
       "      <td>[(1257, 0.1369), (1748, 0.1617), (2916, -0.027...</td>\n",
       "      <td>[[1257, [imagination, goofy, silly, skiing, qu...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1549</th>\n",
       "      <td>123915</td>\n",
       "      <td>[(1, 0.1628), (22, -0.2524), (70, 0.1625), (11...</td>\n",
       "      <td>[[1, [woody, adventure, watch, buy, comedy, fa...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1550</th>\n",
       "      <td>127468</td>\n",
       "      <td>[(12, 0.1932), (21, 0.1604), (26, 0.1674), (32...</td>\n",
       "      <td>[[12, [vampire, gothic]], [21, [mafia, hollywo...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1551</th>\n",
       "      <td>136810</td>\n",
       "      <td>[(32, 0.1314), (436, 0.1314), (593, 0.1314), (...</td>\n",
       "      <td>[[32, [interest, british, genetics, original, ...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>1552 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      userId                                    recommendations  \\\n",
       "0        318  [(260, 0.1389), (780, 0.1588), (1196, 0.2946),...   \n",
       "1       2274  [(2762, 0.1212), (2959, 0.1212), (3996, 0.2166...   \n",
       "2       3031  [(70, -0.4981), (353, 0.25), (805, 0.25), (487...   \n",
       "3       4087  [(296, 0.0051), (805, 0.2713), (1136, 0.205), ...   \n",
       "4       4450  [(1994, 0.1524), (4995, 0.205), (4226, 0.145),...   \n",
       "...      ...                                                ...   \n",
       "1547  117265  [(47, 0.176), (50, 0.1822), (356, 0.1751), (10...   \n",
       "1548  117607  [(1257, 0.1369), (1748, 0.1617), (2916, -0.027...   \n",
       "1549  123915  [(1, 0.1628), (22, -0.2524), (70, 0.1625), (11...   \n",
       "1550  127468  [(12, 0.1932), (21, 0.1604), (26, 0.1674), (32...   \n",
       "1551  136810  [(32, 0.1314), (436, 0.1314), (593, 0.1314), (...   \n",
       "\n",
       "                                            tags_movies  \n",
       "0     [[260, [action, space, luke, sequel, robot, he...  \n",
       "1     [[2762, [nan, enigmatic, thriller, unpredictab...  \n",
       "2     [[70, [gore, brother, vampire, intense, nan, s...  \n",
       "3     [[296, [action, rivet, masterpiece, drug, dial...  \n",
       "4     [[1994, [thriller, ghost]], [4995, [education,...  \n",
       "...                                                 ...  \n",
       "1547  [[47, [overrate, investigation, philosophical,...  \n",
       "1548  [[1257, [imagination, goofy, silly, skiing, qu...  \n",
       "1549  [[1, [woody, adventure, watch, buy, comedy, fa...  \n",
       "1550  [[12, [vampire, gothic]], [21, [mafia, hollywo...  \n",
       "1551  [[32, [interest, british, genetics, original, ...  \n",
       "\n",
       "[1552 rows x 3 columns]"
      ]
     },
     "execution_count": 116,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_rec"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Compute Individual Similarity Metrics and get user features\n",
    "- NOTE: the tags recommended MUST not be the same as the user tags\n",
    "For each feature set (content based features) - calculate the similarity scores between the tags given by the target user and the tags in the recommendation movieId set\n",
    "\n",
    "1. Consolidate user features into one dataframe for efficiency of comparison "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 117,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_user_data(df_rec, tag_cv, target_userId):\n",
    "    \"\"\"\n",
    "    Retrieve movie recommendations, user tags, and tags_movies for a target userId.\n",
    "\n",
    "    Parameters:\n",
    "        df_rec (DataFrame): The DataFrame containing userId, recommendations, and tags_movies columns.\n",
    "        tag_cv (DataFrame): The DataFrame containing userId, movieId, and tags.\n",
    "        target_userId (int): The userId for whom the data is to be fetched.\n",
    "\n",
    "    Returns:\n",
    "        tuple: A tuple containing three lists:\n",
    "               - The first list contains recommendations (movieId, sentiment) for the target userId.\n",
    "               - The second list contains tags applied by the target userId in the format (movieId, tag).\n",
    "               - The third list contains tags_movies entries for the target userId in the format [(movieId, [tags...]), ...].\n",
    "    \"\"\"\n",
    "    # Fetch movie recommendations\n",
    "    recommendations = get_user_recommendations(df_rec, target_userId)\n",
    "    \n",
    "    # Fetch tags applied by the user\n",
    "    user_tags = get_user_tags(tag_cv, target_userId)\n",
    "    \n",
    "    # Fetch tags_movies data for the user\n",
    "    tags_movies = get_tags_movies_for_user(df_rec, target_userId)\n",
    "    \n",
    "    return recommendations, user_tags, tags_movies\n",
    "\n",
    "\n",
    "def get_user_recommendations(df_rec, target_userId):\n",
    "    filtered_df = df_rec[df_rec['userId'] == target_userId]\n",
    "    if len(filtered_df) == 0:\n",
    "        return []\n",
    "    recommendations = filtered_df['recommendations'].iloc[0]\n",
    "    return recommendations\n",
    "\n",
    "\n",
    "def get_user_tags(tag_cv, target_userId):\n",
    "    filtered_df = tag_cv[tag_cv['userId'] == target_userId]\n",
    "    if len(filtered_df) == 0:\n",
    "        return []\n",
    "    user_tags = filtered_df[['movieId', 'tag']].values.tolist()\n",
    "    return user_tags\n",
    "\n",
    "\n",
    "def get_tags_movies_for_user(df_rec, target_userId):\n",
    "    filtered_df = df_rec[df_rec['userId'] == target_userId]\n",
    "    if len(filtered_df) == 0:\n",
    "        return []\n",
    "    tags_movies = filtered_df['tags_movies'].iloc[0]\n",
    "    return tags_movies\n",
    "\n",
    "\n",
    "\n",
    "\n",
    "def get_user_feature_set_and_wsd(df_feat, df_wsd, user_tags, tag_clusters, target_userId):\n",
    "    \"\"\"\n",
    "    Fetch additional features, WSD, and TF/TF-IDF info for a list of user tags.\n",
    "    \n",
    "    Parameters:\n",
    "        df_feat (DataFrame): The DataFrame containing features for each tag.\n",
    "        df_wsd (DataFrame): The DataFrame containing WSD information.\n",
    "        user_tags (list): The list containing tags applied by the user in the format (movieId, tag).\n",
    "        target_userId (int): The userId for whom the WSD data is to be fetched.\n",
    "        \n",
    "    Returns:\n",
    "        tuple: A tuple containing three DataFrames:\n",
    "               - The first DataFrame contains additional features for each user tag.\n",
    "               - The second DataFrame contains WSD information for the user.\n",
    "               - The third DataFrame contains TF and TF-IDF information for the user tags.\n",
    "    \"\"\"\n",
    "    # Filtering df_feat to only include rows where the tag is in user_tags\n",
    "    filtered_df_feat = df_feat[df_feat['tag'].isin([tag for _, tag in user_tags])]\n",
    "    \n",
    "    # Filtering df_wsd to include only rows for the target_userId\n",
    "    filtered_df_wsd = df_wsd[df_wsd['userId'] == target_userId]\n",
    "    \n",
    "    # joining the cluster to the tags\n",
    "\n",
    "    filtered_df_feat = pd.merge(filtered_df_feat, tag_clusters, on='tag', how='inner')\n",
    "    # Create a set of (movieId, tag) tuples for easier filtering\n",
    "    user_tags_set = set(tuple(x) for x in user_tags)\n",
    "\n",
    "\n",
    "    return filtered_df_feat, filtered_df_wsd\n",
    "\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**Get user features**\n",
    "\n",
    "Run here ->\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 134,
   "metadata": {},
   "outputs": [],
   "source": [
    "# tag_cv.to_json('../dataset/tag_csv.json')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 135,
   "metadata": {},
   "outputs": [],
   "source": [
    "# tag_clusters.to_csv(\"../dataset/tag_clusters.csv\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 136,
   "metadata": {},
   "outputs": [],
   "source": [
    "# df_wsd.to_csv(\"../dataset/df_wsd.csv\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 125,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>userId</th>\n",
       "      <th>movieId</th>\n",
       "      <th>tag</th>\n",
       "      <th>disambiguated_sense</th>\n",
       "      <th>confidence</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>318</td>\n",
       "      <td>260</td>\n",
       "      <td>s</td>\n",
       "      <td>mho.n.01</td>\n",
       "      <td>0.396197</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>legal_action.n.01</td>\n",
       "      <td>0.395202</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>adventure</td>\n",
       "      <td>adventure.n.01</td>\n",
       "      <td>0.394330</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>atmospheric</td>\n",
       "      <td>atmospheric.a.01</td>\n",
       "      <td>0.388486</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>stylize</td>\n",
       "      <td>stylize.v.01</td>\n",
       "      <td>0.398942</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49625</th>\n",
       "      <td>138280</td>\n",
       "      <td>108981</td>\n",
       "      <td>sexuality</td>\n",
       "      <td>sex.n.04</td>\n",
       "      <td>0.370642</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49626</th>\n",
       "      <td>138280</td>\n",
       "      <td>112940</td>\n",
       "      <td>counterespionage</td>\n",
       "      <td>counterespionage.n.01</td>\n",
       "      <td>0.367513</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49627</th>\n",
       "      <td>138280</td>\n",
       "      <td>112940</td>\n",
       "      <td>slow</td>\n",
       "      <td>slow.v.03</td>\n",
       "      <td>0.395033</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49628</th>\n",
       "      <td>138280</td>\n",
       "      <td>117871</td>\n",
       "      <td>image</td>\n",
       "      <td>trope.n.01</td>\n",
       "      <td>0.390764</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49629</th>\n",
       "      <td>138280</td>\n",
       "      <td>117871</td>\n",
       "      <td>story</td>\n",
       "      <td>fib.n.01</td>\n",
       "      <td>0.393206</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>49630 rows × 5 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "       userId  movieId               tag    disambiguated_sense  confidence\n",
       "0         318      260                 s               mho.n.01    0.396197\n",
       "1         964      260            action      legal_action.n.01    0.395202\n",
       "2         964      260         adventure         adventure.n.01    0.394330\n",
       "3         964      260       atmospheric       atmospheric.a.01    0.388486\n",
       "4         964      260           stylize           stylize.v.01    0.398942\n",
       "...       ...      ...               ...                    ...         ...\n",
       "49625  138280   108981         sexuality               sex.n.04    0.370642\n",
       "49626  138280   112940  counterespionage  counterespionage.n.01    0.367513\n",
       "49627  138280   112940              slow              slow.v.03    0.395033\n",
       "49628  138280   117871             image             trope.n.01    0.390764\n",
       "49629  138280   117871             story               fib.n.01    0.393206\n",
       "\n",
       "[49630 rows x 5 columns]"
      ]
     },
     "execution_count": 125,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_wsd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 128,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Recommendations: [(260, 0.2438), (115149, 0.1563), (2762, 0.1212), (2959, 0.1212), (3996, 0.2166), (6016, 0.2575), (7438, 0.2575), (296, 0.0051), (805, 0.2713), (1136, 0.205)]\n",
      "User Tags: [[260, 'action'], [260, 'adventure'], [260, 'atmospheric'], [260, 'stylize'], [2959, 'action'], [2959, 'atmospheric'], [2959, 'disturb'], [2959, 'philosophy'], [2959, 'psychology'], [2959, 'quirky'], [2959, 'surreal'], [2959, 'violence'], [780, 'action'], [780, 'adventure'], [780, 'aviation'], [780, 'disaster'], [780, 'humorous'], [780, 'tense'], [1196, 'action'], [1196, 'adventure'], [1196, 'classic'], [1196, 'music'], [1196, 'sequel'], [1197, 'action'], [1197, 'classic'], [1197, 'comedy'], [1197, 'funny'], [1197, 'medieval'], [1197, 'pirate'], [1197, 'quirky'], [1197, 'revenge'], [1197, 'romance'], [1197, 'torture'], [1210, 'sequel'], [1210, 'space'], [4369, 'action'], [4369, 'car'], [4993, 'action'], [4993, 'adventure'], [4993, 'atmospheric'], [4993, 'music'], [4993, 'nature'], [4993, 'scenic'], [4993, 'stylize'], [4993, \"wizard's\"], [6539, 'action'], [6539, 'adventure'], [6539, 'comedy'], [48774, 'atmospheric'], [48774, 'christianity'], [48774, 'england'], [48774, 'future'], [48774, 'futuristic'], [48774, 'pregnancy'], [48774, 'survival'], [48774, 'thriller'], [53972, 'action'], [53972, 'comedy'], [53972, 'computer'], [53972, 'murder'], [53972, 'terrorism'], [79132, 'action'], [79132, 'clever'], [79132, 'complicate'], [79132, 'intense'], [79132, 'surreal'], [79132, 'tokyo'], [79274, 'animation'], [79274, 'batman'], [79274, 'comic'], [79274, 'dc'], [79274, 'fight'], [79274, 'joker'], [99112, 'conspiracy'], [99112, 'investigation'], [102445, 'action'], [102445, 'adventure'], [102445, 'space'], [103228, 'anime'], [103228, 'cinematography'], [103228, 'music'], [103228, 'robot'], [103228, 'romance']]\n",
      "Tags Movies for userId 505: [[260, ['action', 'space', 'luke', 'sequel', 'robot', 'heroic', 'series', 'adventure', 'awesome', 'stylize', 'force', 'outdated', 'franchise', 'knight', 'princess', 'soundtrack', 'epic', 's', 'classic', 'atmospheric', 'complete']], [115149, ['action']], [2762, ['nan', 'enigmatic', 'thriller', 'unpredictable', 'afterlife', 'theater', 'drama', 'horror', 'stylize', 'suspense', 'touch', 'fake', 'death', 'watch', 'ominous', 'scary', 'act', 'ghost', 'psychological', 'frighten', 'boring', 'psychology', 'predictable', 'atmospheric', 'twist']], [2959, ['action', 'justice', 'rebellious', 'philosophical', 'men', 'original', 'nan', 'crime', 'confrontational', 'disturb', 'dark', 'complicate', 'quirky', 'r', 'stylize', 'violence', 'anarchism', 'philosophy', 'narrate', 'insanity', 'watch', 'smart', 'consumerism', 'challenge', 'psychological', 'sabotage', 'satirical', 'masculine', 'violent', 'cynical', 'thoughtprovoking', 'capitalism', 's', 'psychology', 'identity', 'stylish', 'classic', 'masculinity', 'intense', 'surreal', 'psychedelic', 'atmospheric', 'fight', 'twist']], [3996, ['overrate', 'action', 'ridiculous', 'poetic', 'nan', 'crime', 'romance', 'hate', 'dvd', 'murder', 'stylize', 'china', 'westernization', 'beautiful', 'watch', 'colourful', 'soundtrack', 'fly', 'dreamlike', 'culture', 'atmospheric', 'tragic']], [6016, ['interest', 'drug', 'forceful', 'enthral', 'poverty', 'nan', 'amaze', 'crime', 'sweep', 'feel', 'disturb', 'nightclub', 'loser', 'photography', 'brazil', 'drama', 'stylize', 'photographer', 'violence', 'depress', 'refresh', 'idiot', 'portuguese', 'chicken', 'violent', 'soccer', 'robbery', 'slam', 'classic', 'gangster', 'intense', 'atmospheric', 'gang']], [7438, ['action', 'overrate', 'storytelling', 'crime', 'vengeance', 'thriller', 'adventure', 'quirky', 'drama', 'stylize', 'violence', 'dialogue', 'watch', 'samurai', 'japan', 'bill', 'revenge', 'bloody', 'violent', 'classic', 'surreal', 'atmospheric']], [296, ['action', 'rivet', 'masterpiece', 'drug', 'dialog', 'quote', 'comedy', 'storytelling', 'philosophical', 'homosexuality', 'amaze', 'nan', 'character', 'crime', 'mobster', 'funny', 'cool', 'thriller', 'dark', 'unpredictable', 'dvd', 'quirky', 'drama', 'stylize', 'humorous', 'violence', 'suspense', 'dialogue', 'watch', 'humor', 'entertain', 'satire', 'violent', 'nonlinear', 'gun', 's', 'classic', 'rape', 'intense', 'atmospheric', 'innovative', 'act']], [805, ['vengeance', 'rape']], [1136, ['british', 'comedy', 'nan', 'biblical', 'funny', 'awesome', 'humorous', 'parody', 'religion', 'hilarious', 'watch', 'english', 'humor', 'england', 'satire', 'medieval', 'spoof', 'satirical', 'rabbit', 's', 'inventive', 'influential', 'classic']]]\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tag</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>ner_label</th>\n",
       "      <th>POS</th>\n",
       "      <th>sentiment_label</th>\n",
       "      <th>scaled_sentiment_value</th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>cluster</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>action</td>\n",
       "      <td>[0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.15630</td>\n",
       "      <td>158</td>\n",
       "      <td>142</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>music</td>\n",
       "      <td>[0.026302, 0.49343, 0.15147, -0.8506, 0.70278,...</td>\n",
       "      <td>CW</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.25580</td>\n",
       "      <td>564</td>\n",
       "      <td>89</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>fight</td>\n",
       "      <td>[-0.19856, 0.17457, -0.62895, -0.45929, -0.071...</td>\n",
       "      <td>O</td>\n",
       "      <td>VERB</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.17885</td>\n",
       "      <td>159</td>\n",
       "      <td>142</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>violence</td>\n",
       "      <td>[0.025781, 0.8007, -0.18627, -0.40211, -0.2174...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>negative</td>\n",
       "      <td>-0.59850</td>\n",
       "      <td>557</td>\n",
       "      <td>153</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>surreal</td>\n",
       "      <td>[0.26532, -0.083012, -0.33654, -0.31641, 0.501...</td>\n",
       "      <td>O</td>\n",
       "      <td>ADJ</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.17225</td>\n",
       "      <td>698</td>\n",
       "      <td>154</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>disturb</td>\n",
       "      <td>[0.73229, -0.069107, 0.50046, 0.14098, 0.08063...</td>\n",
       "      <td>O</td>\n",
       "      <td>VERB</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.11775</td>\n",
       "      <td>200</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>quirky</td>\n",
       "      <td>[0.42383, -0.096889, 0.12294, -0.34541, 0.5612...</td>\n",
       "      <td>O</td>\n",
       "      <td>ADJ</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.18185</td>\n",
       "      <td>657</td>\n",
       "      <td>13</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>adventure</td>\n",
       "      <td>[0.094151, 0.49795, -0.87618, -0.66309, 0.8435...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.16350</td>\n",
       "      <td>893</td>\n",
       "      <td>15</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>atmospheric</td>\n",
       "      <td>[0.13512, -0.23763, -0.1364, -0.25487, 1.1195,...</td>\n",
       "      <td>O</td>\n",
       "      <td>PROPN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.14715</td>\n",
       "      <td>951</td>\n",
       "      <td>83</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>stylize</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>O</td>\n",
       "      <td>VERB</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.08885</td>\n",
       "      <td>201</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>aviation</td>\n",
       "      <td>[0.28546, 0.37475, 0.019193, -0.18236, 0.18596...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.13205</td>\n",
       "      <td>742</td>\n",
       "      <td>30</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>disaster</td>\n",
       "      <td>[-0.11391, 0.085762, -0.47509, -0.75199, -0.09...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>negative</td>\n",
       "      <td>-0.47310</td>\n",
       "      <td>3</td>\n",
       "      <td>104</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>humorous</td>\n",
       "      <td>[-0.22947, 0.072875, 0.39434, -0.42828, 0.4785...</td>\n",
       "      <td>O</td>\n",
       "      <td>ADJ</td>\n",
       "      <td>positive</td>\n",
       "      <td>0.79795</td>\n",
       "      <td>658</td>\n",
       "      <td>13</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>tense</td>\n",
       "      <td>[0.62009, 0.25015, 0.82526, -0.43723, -0.71044...</td>\n",
       "      <td>O</td>\n",
       "      <td>ADJ</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.17600</td>\n",
       "      <td>975</td>\n",
       "      <td>168</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>classic</td>\n",
       "      <td>[-0.39525, -0.17758, -0.60726, -0.65832, 0.566...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>positive</td>\n",
       "      <td>0.78175</td>\n",
       "      <td>894</td>\n",
       "      <td>15</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>sequel</td>\n",
       "      <td>[-0.21662, 0.26481, -0.71755, -0.27488, -0.108...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.11545</td>\n",
       "      <td>895</td>\n",
       "      <td>15</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>comedy</td>\n",
       "      <td>[0.2321, 0.16945, -0.27101, -0.84832, -0.07012...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.19710</td>\n",
       "      <td>896</td>\n",
       "      <td>15</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>funny</td>\n",
       "      <td>[0.39595, -0.083109, -0.28795, -0.29139, -0.16...</td>\n",
       "      <td>O</td>\n",
       "      <td>ADJ</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.25830</td>\n",
       "      <td>981</td>\n",
       "      <td>42</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>medieval</td>\n",
       "      <td>[0.83105, -0.60986, 0.90761, -0.67421, 0.32792...</td>\n",
       "      <td>O</td>\n",
       "      <td>ADJ</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.15580</td>\n",
       "      <td>1078</td>\n",
       "      <td>108</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>pirate</td>\n",
       "      <td>[-0.20215, 0.28188, -0.22138, -0.64008, 0.3194...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.16295</td>\n",
       "      <td>743</td>\n",
       "      <td>30</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>revenge</td>\n",
       "      <td>[-0.10463, 0.92201, -0.17947, -0.37589, -0.198...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.22035</td>\n",
       "      <td>1087</td>\n",
       "      <td>105</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>romance</td>\n",
       "      <td>[0.75581, 0.11897, 0.14055, -1.2454, 0.67806, ...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.19270</td>\n",
       "      <td>897</td>\n",
       "      <td>15</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>torture</td>\n",
       "      <td>[0.10057, -0.51019, -0.3099, -0.22356, -0.8863...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.21920</td>\n",
       "      <td>1157</td>\n",
       "      <td>60</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>space</td>\n",
       "      <td>[0.3793, 0.030922, 0.40804, 0.053421, 0.013814...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.15985</td>\n",
       "      <td>744</td>\n",
       "      <td>30</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>philosophy</td>\n",
       "      <td>[0.046143, 0.049765, 0.76812, 0.25986, 0.53467...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.22685</td>\n",
       "      <td>1183</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>psychology</td>\n",
       "      <td>[0.0061765, 0.21331, 0.67127, 0.17676, 0.38886...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.13140</td>\n",
       "      <td>1222</td>\n",
       "      <td>71</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>car</td>\n",
       "      <td>[0.015682, 0.19355, -0.55093, -0.070453, -0.65...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.18720</td>\n",
       "      <td>1259</td>\n",
       "      <td>24</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>nature</td>\n",
       "      <td>[0.49353, 0.035632, 0.19833, -0.56364, 0.03879...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>positive</td>\n",
       "      <td>0.75290</td>\n",
       "      <td>982</td>\n",
       "      <td>42</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>scenic</td>\n",
       "      <td>[1.0291, -0.069796, -0.78114, -0.41458, 0.6566...</td>\n",
       "      <td>O</td>\n",
       "      <td>ADJ</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.20615</td>\n",
       "      <td>1327</td>\n",
       "      <td>34</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>wizard's</td>\n",
       "      <td>[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...</td>\n",
       "      <td>O</td>\n",
       "      <td>PROPN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.17070</td>\n",
       "      <td>202</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>christianity</td>\n",
       "      <td>[0.15906, -0.083004, 1.0756, 0.12575, -0.68546...</td>\n",
       "      <td>O</td>\n",
       "      <td>PROPN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.15540</td>\n",
       "      <td>1374</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>england</td>\n",
       "      <td>[0.22048, -0.036548, -0.092576, 0.319, -0.0958...</td>\n",
       "      <td>LOC</td>\n",
       "      <td>VERB</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.18330</td>\n",
       "      <td>1423</td>\n",
       "      <td>50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>future</td>\n",
       "      <td>[0.038352, 0.59489, 0.2866, 0.2362, 0.15166, 0...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.22890</td>\n",
       "      <td>4</td>\n",
       "      <td>104</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>futuristic</td>\n",
       "      <td>[0.30524, -0.15001, -0.60024, -0.092749, 0.806...</td>\n",
       "      <td>O</td>\n",
       "      <td>ADJ</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.19095</td>\n",
       "      <td>700</td>\n",
       "      <td>154</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>pregnancy</td>\n",
       "      <td>[-0.59323, 0.50446, 0.15791, -0.75862, 0.10482...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.18775</td>\n",
       "      <td>1431</td>\n",
       "      <td>11</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>survival</td>\n",
       "      <td>[-0.40477, 0.43125, -0.16201, 0.63483, 0.45825...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.21600</td>\n",
       "      <td>5</td>\n",
       "      <td>104</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>thriller</td>\n",
       "      <td>[-0.25104, -0.19485, -0.47218, -0.80518, 0.146...</td>\n",
       "      <td>CW</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.15135</td>\n",
       "      <td>898</td>\n",
       "      <td>15</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>computer</td>\n",
       "      <td>[0.57791, 0.34929, 0.17129, -1.1676, 0.985, 0....</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.18950</td>\n",
       "      <td>1480</td>\n",
       "      <td>90</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>murder</td>\n",
       "      <td>[-0.049579, 0.28798, -0.33646, -0.59353, -0.49...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>negative</td>\n",
       "      <td>-0.53280</td>\n",
       "      <td>1524</td>\n",
       "      <td>35</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>terrorism</td>\n",
       "      <td>[0.042855, 0.1601, 0.090715, -0.66671, -0.0987...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>negative</td>\n",
       "      <td>-0.50860</td>\n",
       "      <td>1547</td>\n",
       "      <td>97</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>clever</td>\n",
       "      <td>[-0.033481, -0.37371, -0.099627, -0.077827, 0....</td>\n",
       "      <td>O</td>\n",
       "      <td>ADJ</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.23415</td>\n",
       "      <td>1552</td>\n",
       "      <td>78</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>complicate</td>\n",
       "      <td>[0.16897, 0.52192, 0.79479, 0.49642, 0.98086, ...</td>\n",
       "      <td>O</td>\n",
       "      <td>VERB</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.12920</td>\n",
       "      <td>1595</td>\n",
       "      <td>176</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>intense</td>\n",
       "      <td>[0.24969, -0.074882, -0.12261, -0.82541, -0.05...</td>\n",
       "      <td>O</td>\n",
       "      <td>ADJ</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.17610</td>\n",
       "      <td>976</td>\n",
       "      <td>168</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>tokyo</td>\n",
       "      <td>[0.42349, 0.54243, -0.64395, -0.79788, -0.2809...</td>\n",
       "      <td>LOC</td>\n",
       "      <td>PROPN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.14680</td>\n",
       "      <td>1631</td>\n",
       "      <td>57</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>animation</td>\n",
       "      <td>[0.037307, 0.35589, -0.49355, -0.83947, 0.9023...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.16275</td>\n",
       "      <td>899</td>\n",
       "      <td>15</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>batman</td>\n",
       "      <td>[-0.3231, 0.31649, -0.48935, 0.17673, 0.58579,...</td>\n",
       "      <td>CW</td>\n",
       "      <td>PROPN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.19095</td>\n",
       "      <td>1088</td>\n",
       "      <td>105</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>comic</td>\n",
       "      <td>[-0.569, 0.75402, -0.6974, -0.65754, 0.71069, ...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.17945</td>\n",
       "      <td>900</td>\n",
       "      <td>15</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>dc</td>\n",
       "      <td>[-0.47599, 0.28054, -0.26551, -0.015324, 0.896...</td>\n",
       "      <td>PER</td>\n",
       "      <td>VERB</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.22650</td>\n",
       "      <td>1089</td>\n",
       "      <td>105</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>joker</td>\n",
       "      <td>[-0.07533, -0.34123, -0.46686, -0.019233, 0.67...</td>\n",
       "      <td>O</td>\n",
       "      <td>PROPN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.14160</td>\n",
       "      <td>1090</td>\n",
       "      <td>105</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>conspiracy</td>\n",
       "      <td>[0.012371, -0.32872, -0.54506, -0.44153, -0.25...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.16385</td>\n",
       "      <td>1525</td>\n",
       "      <td>35</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50</th>\n",
       "      <td>investigation</td>\n",
       "      <td>[-0.42026, -0.29589, -0.22441, -1.0126, -0.120...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.16370</td>\n",
       "      <td>1637</td>\n",
       "      <td>65</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>51</th>\n",
       "      <td>anime</td>\n",
       "      <td>[-0.49183, 0.84263, -0.78158, -0.9366, -0.0781...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.13490</td>\n",
       "      <td>901</td>\n",
       "      <td>15</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>52</th>\n",
       "      <td>cinematography</td>\n",
       "      <td>[0.70629, 0.33715, -0.0067912, -0.38115, 0.247...</td>\n",
       "      <td>CW</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.13355</td>\n",
       "      <td>1652</td>\n",
       "      <td>127</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>53</th>\n",
       "      <td>robot</td>\n",
       "      <td>[-0.24619, 0.21412, -0.35943, -0.4598, 0.24798...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.13250</td>\n",
       "      <td>1091</td>\n",
       "      <td>105</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "               tag                                          glove_vec  \\\n",
       "0           action  [0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...   \n",
       "1            music  [0.026302, 0.49343, 0.15147, -0.8506, 0.70278,...   \n",
       "2            fight  [-0.19856, 0.17457, -0.62895, -0.45929, -0.071...   \n",
       "3         violence  [0.025781, 0.8007, -0.18627, -0.40211, -0.2174...   \n",
       "4          surreal  [0.26532, -0.083012, -0.33654, -0.31641, 0.501...   \n",
       "5          disturb  [0.73229, -0.069107, 0.50046, 0.14098, 0.08063...   \n",
       "6           quirky  [0.42383, -0.096889, 0.12294, -0.34541, 0.5612...   \n",
       "7        adventure  [0.094151, 0.49795, -0.87618, -0.66309, 0.8435...   \n",
       "8      atmospheric  [0.13512, -0.23763, -0.1364, -0.25487, 1.1195,...   \n",
       "9          stylize  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "10        aviation  [0.28546, 0.37475, 0.019193, -0.18236, 0.18596...   \n",
       "11        disaster  [-0.11391, 0.085762, -0.47509, -0.75199, -0.09...   \n",
       "12        humorous  [-0.22947, 0.072875, 0.39434, -0.42828, 0.4785...   \n",
       "13           tense  [0.62009, 0.25015, 0.82526, -0.43723, -0.71044...   \n",
       "14         classic  [-0.39525, -0.17758, -0.60726, -0.65832, 0.566...   \n",
       "15          sequel  [-0.21662, 0.26481, -0.71755, -0.27488, -0.108...   \n",
       "16          comedy  [0.2321, 0.16945, -0.27101, -0.84832, -0.07012...   \n",
       "17           funny  [0.39595, -0.083109, -0.28795, -0.29139, -0.16...   \n",
       "18        medieval  [0.83105, -0.60986, 0.90761, -0.67421, 0.32792...   \n",
       "19          pirate  [-0.20215, 0.28188, -0.22138, -0.64008, 0.3194...   \n",
       "20         revenge  [-0.10463, 0.92201, -0.17947, -0.37589, -0.198...   \n",
       "21         romance  [0.75581, 0.11897, 0.14055, -1.2454, 0.67806, ...   \n",
       "22         torture  [0.10057, -0.51019, -0.3099, -0.22356, -0.8863...   \n",
       "23           space  [0.3793, 0.030922, 0.40804, 0.053421, 0.013814...   \n",
       "24      philosophy  [0.046143, 0.049765, 0.76812, 0.25986, 0.53467...   \n",
       "25      psychology  [0.0061765, 0.21331, 0.67127, 0.17676, 0.38886...   \n",
       "26             car  [0.015682, 0.19355, -0.55093, -0.070453, -0.65...   \n",
       "27          nature  [0.49353, 0.035632, 0.19833, -0.56364, 0.03879...   \n",
       "28          scenic  [1.0291, -0.069796, -0.78114, -0.41458, 0.6566...   \n",
       "29        wizard's  [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ...   \n",
       "30    christianity  [0.15906, -0.083004, 1.0756, 0.12575, -0.68546...   \n",
       "31         england  [0.22048, -0.036548, -0.092576, 0.319, -0.0958...   \n",
       "32          future  [0.038352, 0.59489, 0.2866, 0.2362, 0.15166, 0...   \n",
       "33      futuristic  [0.30524, -0.15001, -0.60024, -0.092749, 0.806...   \n",
       "34       pregnancy  [-0.59323, 0.50446, 0.15791, -0.75862, 0.10482...   \n",
       "35        survival  [-0.40477, 0.43125, -0.16201, 0.63483, 0.45825...   \n",
       "36        thriller  [-0.25104, -0.19485, -0.47218, -0.80518, 0.146...   \n",
       "37        computer  [0.57791, 0.34929, 0.17129, -1.1676, 0.985, 0....   \n",
       "38          murder  [-0.049579, 0.28798, -0.33646, -0.59353, -0.49...   \n",
       "39       terrorism  [0.042855, 0.1601, 0.090715, -0.66671, -0.0987...   \n",
       "40          clever  [-0.033481, -0.37371, -0.099627, -0.077827, 0....   \n",
       "41      complicate  [0.16897, 0.52192, 0.79479, 0.49642, 0.98086, ...   \n",
       "42         intense  [0.24969, -0.074882, -0.12261, -0.82541, -0.05...   \n",
       "43           tokyo  [0.42349, 0.54243, -0.64395, -0.79788, -0.2809...   \n",
       "44       animation  [0.037307, 0.35589, -0.49355, -0.83947, 0.9023...   \n",
       "45          batman  [-0.3231, 0.31649, -0.48935, 0.17673, 0.58579,...   \n",
       "46           comic  [-0.569, 0.75402, -0.6974, -0.65754, 0.71069, ...   \n",
       "47              dc  [-0.47599, 0.28054, -0.26551, -0.015324, 0.896...   \n",
       "48           joker  [-0.07533, -0.34123, -0.46686, -0.019233, 0.67...   \n",
       "49      conspiracy  [0.012371, -0.32872, -0.54506, -0.44153, -0.25...   \n",
       "50   investigation  [-0.42026, -0.29589, -0.22441, -1.0126, -0.120...   \n",
       "51           anime  [-0.49183, 0.84263, -0.78158, -0.9366, -0.0781...   \n",
       "52  cinematography  [0.70629, 0.33715, -0.0067912, -0.38115, 0.247...   \n",
       "53           robot  [-0.24619, 0.21412, -0.35943, -0.4598, 0.24798...   \n",
       "\n",
       "   ner_label    POS sentiment_label  scaled_sentiment_value  Unnamed: 0  \\\n",
       "0          O   NOUN         neutral                 0.15630         158   \n",
       "1         CW   NOUN         neutral                 0.25580         564   \n",
       "2          O   VERB         neutral                 0.17885         159   \n",
       "3          O   NOUN        negative                -0.59850         557   \n",
       "4          O    ADJ         neutral                 0.17225         698   \n",
       "5          O   VERB         neutral                 0.11775         200   \n",
       "6          O    ADJ         neutral                 0.18185         657   \n",
       "7          O   NOUN         neutral                 0.16350         893   \n",
       "8          O  PROPN         neutral                 0.14715         951   \n",
       "9          O   VERB         neutral                 0.08885         201   \n",
       "10         O   NOUN         neutral                 0.13205         742   \n",
       "11         O   NOUN        negative                -0.47310           3   \n",
       "12         O    ADJ        positive                 0.79795         658   \n",
       "13         O    ADJ         neutral                 0.17600         975   \n",
       "14         O   NOUN        positive                 0.78175         894   \n",
       "15         O   NOUN         neutral                 0.11545         895   \n",
       "16         O   NOUN         neutral                 0.19710         896   \n",
       "17         O    ADJ         neutral                 0.25830         981   \n",
       "18         O    ADJ         neutral                 0.15580        1078   \n",
       "19         O   NOUN         neutral                 0.16295         743   \n",
       "20         O   NOUN         neutral                 0.22035        1087   \n",
       "21         O   NOUN         neutral                 0.19270         897   \n",
       "22         O   NOUN         neutral                 0.21920        1157   \n",
       "23         O   NOUN         neutral                 0.15985         744   \n",
       "24         O   NOUN         neutral                 0.22685        1183   \n",
       "25         O   NOUN         neutral                 0.13140        1222   \n",
       "26         O   NOUN         neutral                 0.18720        1259   \n",
       "27         O   NOUN        positive                 0.75290         982   \n",
       "28         O    ADJ         neutral                 0.20615        1327   \n",
       "29         O  PROPN         neutral                 0.17070         202   \n",
       "30         O  PROPN         neutral                 0.15540        1374   \n",
       "31       LOC   VERB         neutral                 0.18330        1423   \n",
       "32         O   NOUN         neutral                 0.22890           4   \n",
       "33         O    ADJ         neutral                 0.19095         700   \n",
       "34         O   NOUN         neutral                 0.18775        1431   \n",
       "35         O   NOUN         neutral                 0.21600           5   \n",
       "36        CW   NOUN         neutral                 0.15135         898   \n",
       "37         O   NOUN         neutral                 0.18950        1480   \n",
       "38         O   NOUN        negative                -0.53280        1524   \n",
       "39         O   NOUN        negative                -0.50860        1547   \n",
       "40         O    ADJ         neutral                 0.23415        1552   \n",
       "41         O   VERB         neutral                 0.12920        1595   \n",
       "42         O    ADJ         neutral                 0.17610         976   \n",
       "43       LOC  PROPN         neutral                 0.14680        1631   \n",
       "44         O   NOUN         neutral                 0.16275         899   \n",
       "45        CW  PROPN         neutral                 0.19095        1088   \n",
       "46         O   NOUN         neutral                 0.17945         900   \n",
       "47       PER   VERB         neutral                 0.22650        1089   \n",
       "48         O  PROPN         neutral                 0.14160        1090   \n",
       "49         O   NOUN         neutral                 0.16385        1525   \n",
       "50         O   NOUN         neutral                 0.16370        1637   \n",
       "51         O   NOUN         neutral                 0.13490         901   \n",
       "52        CW   NOUN         neutral                 0.13355        1652   \n",
       "53         O   NOUN         neutral                 0.13250        1091   \n",
       "\n",
       "    cluster  \n",
       "0       142  \n",
       "1        89  \n",
       "2       142  \n",
       "3       153  \n",
       "4       154  \n",
       "5         3  \n",
       "6        13  \n",
       "7        15  \n",
       "8        83  \n",
       "9         3  \n",
       "10       30  \n",
       "11      104  \n",
       "12       13  \n",
       "13      168  \n",
       "14       15  \n",
       "15       15  \n",
       "16       15  \n",
       "17       42  \n",
       "18      108  \n",
       "19       30  \n",
       "20      105  \n",
       "21       15  \n",
       "22       60  \n",
       "23       30  \n",
       "24        7  \n",
       "25       71  \n",
       "26       24  \n",
       "27       42  \n",
       "28       34  \n",
       "29        3  \n",
       "30        6  \n",
       "31       50  \n",
       "32      104  \n",
       "33      154  \n",
       "34       11  \n",
       "35      104  \n",
       "36       15  \n",
       "37       90  \n",
       "38       35  \n",
       "39       97  \n",
       "40       78  \n",
       "41      176  \n",
       "42      168  \n",
       "43       57  \n",
       "44       15  \n",
       "45      105  \n",
       "46       15  \n",
       "47      105  \n",
       "48      105  \n",
       "49       35  \n",
       "50       65  \n",
       "51       15  \n",
       "52      127  \n",
       "53      105  "
      ]
     },
     "execution_count": 128,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Example usage\n",
    "# Assuming df_rec is the DataFrame containing userId, recommendations, and tags_movies columns, and tag_cv is the DataFrame containing userId, movieId, and tags.\n",
    "\n",
    "recommendations, user_tags, tags_movies = get_user_data(df_rec, tag_cv, 964)\n",
    "\n",
    "print(\"Recommendations:\", recommendations)\n",
    "print(\"User Tags:\", user_tags)\n",
    "print(\"Tags Movies for userId 505:\", tags_movies)\n",
    "\n",
    "# Get additional features, WSD information for user_tags and userId=96\n",
    "user_features, user_wsd= get_user_feature_set_and_wsd(df_feat, df_wsd,  user_tags, tag_clusters, 964)\n",
    "\n",
    "\n",
    "user_features"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 129,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "User WSD:\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>userId</th>\n",
       "      <th>movieId</th>\n",
       "      <th>tag</th>\n",
       "      <th>disambiguated_sense</th>\n",
       "      <th>confidence</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>legal_action.n.01</td>\n",
       "      <td>0.395202</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>adventure</td>\n",
       "      <td>adventure.n.01</td>\n",
       "      <td>0.394330</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>atmospheric</td>\n",
       "      <td>atmospheric.a.01</td>\n",
       "      <td>0.388486</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>964</td>\n",
       "      <td>260</td>\n",
       "      <td>stylize</td>\n",
       "      <td>stylize.v.01</td>\n",
       "      <td>0.398942</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>169</th>\n",
       "      <td>964</td>\n",
       "      <td>2959</td>\n",
       "      <td>action</td>\n",
       "      <td>legal_action.n.01</td>\n",
       "      <td>0.395202</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3220</th>\n",
       "      <td>964</td>\n",
       "      <td>103228</td>\n",
       "      <td>anime</td>\n",
       "      <td>zanzibar_copal.n.01</td>\n",
       "      <td>0.387292</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3221</th>\n",
       "      <td>964</td>\n",
       "      <td>103228</td>\n",
       "      <td>cinematography</td>\n",
       "      <td>filming.n.01</td>\n",
       "      <td>0.388786</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3222</th>\n",
       "      <td>964</td>\n",
       "      <td>103228</td>\n",
       "      <td>music</td>\n",
       "      <td>music.n.02</td>\n",
       "      <td>0.385036</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3223</th>\n",
       "      <td>964</td>\n",
       "      <td>103228</td>\n",
       "      <td>robot</td>\n",
       "      <td>automaton.n.02</td>\n",
       "      <td>0.383806</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3224</th>\n",
       "      <td>964</td>\n",
       "      <td>103228</td>\n",
       "      <td>romance</td>\n",
       "      <td>romance.n.03</td>\n",
       "      <td>0.398942</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>83 rows × 5 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      userId  movieId             tag  disambiguated_sense  confidence\n",
       "1        964      260          action    legal_action.n.01    0.395202\n",
       "2        964      260       adventure       adventure.n.01    0.394330\n",
       "3        964      260     atmospheric     atmospheric.a.01    0.388486\n",
       "4        964      260         stylize         stylize.v.01    0.398942\n",
       "169      964     2959          action    legal_action.n.01    0.395202\n",
       "...      ...      ...             ...                  ...         ...\n",
       "3220     964   103228           anime  zanzibar_copal.n.01    0.387292\n",
       "3221     964   103228  cinematography         filming.n.01    0.388786\n",
       "3222     964   103228           music           music.n.02    0.385036\n",
       "3223     964   103228           robot       automaton.n.02    0.383806\n",
       "3224     964   103228         romance         romance.n.03    0.398942\n",
       "\n",
       "[83 rows x 5 columns]"
      ]
     },
     "execution_count": 129,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "print(\"User WSD:\")\n",
    "user_wsd"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "2. Now comparing user tags with tags applied to the movieIds given in the recommendations (recommendations)\n",
    "    - Given in df_rec, the \"tags_movies\" column \n",
    "\n",
    "The process (this is for all users):\n",
    "1. Loop through the recommendations (list of {movieId, sentiment} tuples). \n",
    "2. For each movieId in the list - get the tags applied to this movieId by other users that share the same sentiment recommended to the current target user \n",
    "    - Column in df_rec is \"tags_movies\"\n",
    "3. Compare the tags with the tags applied by the target user (using the similarity metrics) , compare with content based features \n",
    "4. Continue until all tags from the recommendations are compared with the tags applied by the target user. \n",
    "5. Store the similarity score in a separate dataframe.\n",
    "6. normalise the similarity metrics.\n",
    "7. Average similarity metrics and then rank - return the best tag set for recommendation\n",
    "\n",
    "for efficiency: vectorise all necessary data before loops"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**caculate_similarity_for_recommendations**\n",
    "- In this function, we return a dataframe, 'similarity_df' that contains the similarity of the tags from the recommendation movieIds \n",
    "- In similarity_df: we include the column 'WSD_confidence' to filter out tagfs that don't meet a certain level of disambiguation confidence - thus ensuring that only high confidence tags are used in similarity calculation, \n",
    "- Needto store the tag and movieId also in the similarity_df - as pairs - because this effects the WSD of a particular word"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "We don't recommend tags the user has already used"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Adding the cluster column to df_feat"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 130,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>tag</th>\n",
       "      <th>glove_vec</th>\n",
       "      <th>ner_label</th>\n",
       "      <th>POS</th>\n",
       "      <th>sentiment_label</th>\n",
       "      <th>scaled_sentiment_value</th>\n",
       "      <th>cluster</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>s</td>\n",
       "      <td>[0.18209, 0.88297, -0.49805, 0.53137, -0.36084...</td>\n",
       "      <td>O</td>\n",
       "      <td>PROPN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.24385</td>\n",
       "      <td>104</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>action</td>\n",
       "      <td>[0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.15630</td>\n",
       "      <td>142</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>twist</td>\n",
       "      <td>[-0.095859, -0.17472, -0.034692, -0.37307, 0.3...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.12125</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>overrate</td>\n",
       "      <td>[0.28151, -0.42171, -0.38275, 0.15364, -0.7648...</td>\n",
       "      <td>O</td>\n",
       "      <td>VERB</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.21655</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>violent</td>\n",
       "      <td>[0.13693, 0.1856, -0.65335, -0.50922, -0.18431...</td>\n",
       "      <td>O</td>\n",
       "      <td>ADJ</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.25750</td>\n",
       "      <td>153</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2893</th>\n",
       "      <td>newspaper</td>\n",
       "      <td>[-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.10295</td>\n",
       "      <td>25</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2894</th>\n",
       "      <td>static</td>\n",
       "      <td>[0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>positive</td>\n",
       "      <td>0.76810</td>\n",
       "      <td>70</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2895</th>\n",
       "      <td>repeat</td>\n",
       "      <td>[0.48671, 0.93464, -0.015418, -0.46056, -0.152...</td>\n",
       "      <td>O</td>\n",
       "      <td>VERB</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.19360</td>\n",
       "      <td>104</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2896</th>\n",
       "      <td>seal</td>\n",
       "      <td>[-0.35434, 0.51161, -0.086652, -0.23459, 0.435...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.17375</td>\n",
       "      <td>91</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2897</th>\n",
       "      <td>counterespionage</td>\n",
       "      <td>[0.11309, -0.8528, -0.25529, 0.02635, -0.30105...</td>\n",
       "      <td>O</td>\n",
       "      <td>NOUN</td>\n",
       "      <td>neutral</td>\n",
       "      <td>0.14290</td>\n",
       "      <td>65</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>2898 rows × 7 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                   tag                                          glove_vec  \\\n",
       "0                    s  [0.18209, 0.88297, -0.49805, 0.53137, -0.36084...   \n",
       "1               action  [0.02024, 0.84992, -0.7815, -0.82769, 0.43115,...   \n",
       "2                twist  [-0.095859, -0.17472, -0.034692, -0.37307, 0.3...   \n",
       "3             overrate  [0.28151, -0.42171, -0.38275, 0.15364, -0.7648...   \n",
       "4              violent  [0.13693, 0.1856, -0.65335, -0.50922, -0.18431...   \n",
       "...                ...                                                ...   \n",
       "2893         newspaper  [-0.70318, 1.1424, 0.05477, -0.095689, 0.05790...   \n",
       "2894            static  [0.46332, -0.05737, 0.13804, 0.30518, 0.5276, ...   \n",
       "2895            repeat  [0.48671, 0.93464, -0.015418, -0.46056, -0.152...   \n",
       "2896              seal  [-0.35434, 0.51161, -0.086652, -0.23459, 0.435...   \n",
       "2897  counterespionage  [0.11309, -0.8528, -0.25529, 0.02635, -0.30105...   \n",
       "\n",
       "     ner_label    POS sentiment_label  scaled_sentiment_value  cluster  \n",
       "0            O  PROPN         neutral                 0.24385      104  \n",
       "1            O   NOUN         neutral                 0.15630      142  \n",
       "2            O   NOUN         neutral                 0.12125        2  \n",
       "3            O   VERB         neutral                 0.21655        3  \n",
       "4            O    ADJ         neutral                 0.25750      153  \n",
       "...        ...    ...             ...                     ...      ...  \n",
       "2893         O   NOUN         neutral                 0.10295       25  \n",
       "2894         O   NOUN        positive                 0.76810       70  \n",
       "2895         O   VERB         neutral                 0.19360      104  \n",
       "2896         O   NOUN         neutral                 0.17375       91  \n",
       "2897         O   NOUN         neutral                 0.14290       65  \n",
       "\n",
       "[2898 rows x 7 columns]"
      ]
     },
     "execution_count": 130,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_feat = pd.merge(df_feat, tag_clusters, on='tag', how='inner')\n",
    "df_feat.drop(columns='Unnamed: 0', inplace=True)\n",
    "df_feat"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 138,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[[260,\n",
       "  ['action',\n",
       "   'space',\n",
       "   'luke',\n",
       "   'sequel',\n",
       "   'robot',\n",
       "   'heroic',\n",
       "   'series',\n",
       "   'adventure',\n",
       "   'awesome',\n",
       "   'stylize',\n",
       "   'force',\n",
       "   'outdated',\n",
       "   'franchise',\n",
       "   'knight',\n",
       "   'princess',\n",
       "   'soundtrack',\n",
       "   'epic',\n",
       "   's',\n",
       "   'classic',\n",
       "   'atmospheric',\n",
       "   'complete']],\n",
       " [115149, ['action']],\n",
       " [2762,\n",
       "  ['nan',\n",
       "   'enigmatic',\n",
       "   'thriller',\n",
       "   'unpredictable',\n",
       "   'afterlife',\n",
       "   'theater',\n",
       "   'drama',\n",
       "   'horror',\n",
       "   'stylize',\n",
       "   'suspense',\n",
       "   'touch',\n",
       "   'fake',\n",
       "   'death',\n",
       "   'watch',\n",
       "   'ominous',\n",
       "   'scary',\n",
       "   'act',\n",
       "   'ghost',\n",
       "   'psychological',\n",
       "   'frighten',\n",
       "   'boring',\n",
       "   'psychology',\n",
       "   'predictable',\n",
       "   'atmospheric',\n",
       "   'twist']],\n",
       " [2959,\n",
       "  ['action',\n",
       "   'justice',\n",
       "   'rebellious',\n",
       "   'philosophical',\n",
       "   'men',\n",
       "   'original',\n",
       "   'nan',\n",
       "   'crime',\n",
       "   'confrontational',\n",
       "   'disturb',\n",
       "   'dark',\n",
       "   'complicate',\n",
       "   'quirky',\n",
       "   'r',\n",
       "   'stylize',\n",
       "   'violence',\n",
       "   'anarchism',\n",
       "   'philosophy',\n",
       "   'narrate',\n",
       "   'insanity',\n",
       "   'watch',\n",
       "   'smart',\n",
       "   'consumerism',\n",
       "   'challenge',\n",
       "   'psychological',\n",
       "   'sabotage',\n",
       "   'satirical',\n",
       "   'masculine',\n",
       "   'violent',\n",
       "   'cynical',\n",
       "   'thoughtprovoking',\n",
       "   'capitalism',\n",
       "   's',\n",
       "   'psychology',\n",
       "   'identity',\n",
       "   'stylish',\n",
       "   'classic',\n",
       "   'masculinity',\n",
       "   'intense',\n",
       "   'surreal',\n",
       "   'psychedelic',\n",
       "   'atmospheric',\n",
       "   'fight',\n",
       "   'twist']],\n",
       " [3996,\n",
       "  ['overrate',\n",
       "   'action',\n",
       "   'ridiculous',\n",
       "   'poetic',\n",
       "   'nan',\n",
       "   'crime',\n",
       "   'romance',\n",
       "   'hate',\n",
       "   'dvd',\n",
       "   'murder',\n",
       "   'stylize',\n",
       "   'china',\n",
       "   'westernization',\n",
       "   'beautiful',\n",
       "   'watch',\n",
       "   'colourful',\n",
       "   'soundtrack',\n",
       "   'fly',\n",
       "   'dreamlike',\n",
       "   'culture',\n",
       "   'atmospheric',\n",
       "   'tragic']],\n",
       " [6016,\n",
       "  ['interest',\n",
       "   'drug',\n",
       "   'forceful',\n",
       "   'enthral',\n",
       "   'poverty',\n",
       "   'nan',\n",
       "   'amaze',\n",
       "   'crime',\n",
       "   'sweep',\n",
       "   'feel',\n",
       "   'disturb',\n",
       "   'nightclub',\n",
       "   'loser',\n",
       "   'photography',\n",
       "   'brazil',\n",
       "   'drama',\n",
       "   'stylize',\n",
       "   'photographer',\n",
       "   'violence',\n",
       "   'depress',\n",
       "   'refresh',\n",
       "   'idiot',\n",
       "   'portuguese',\n",
       "   'chicken',\n",
       "   'violent',\n",
       "   'soccer',\n",
       "   'robbery',\n",
       "   'slam',\n",
       "   'classic',\n",
       "   'gangster',\n",
       "   'intense',\n",
       "   'atmospheric',\n",
       "   'gang']],\n",
       " [7438,\n",
       "  ['action',\n",
       "   'overrate',\n",
       "   'storytelling',\n",
       "   'crime',\n",
       "   'vengeance',\n",
       "   'thriller',\n",
       "   'adventure',\n",
       "   'quirky',\n",
       "   'drama',\n",
       "   'stylize',\n",
       "   'violence',\n",
       "   'dialogue',\n",
       "   'watch',\n",
       "   'samurai',\n",
       "   'japan',\n",
       "   'bill',\n",
       "   'revenge',\n",
       "   'bloody',\n",
       "   'violent',\n",
       "   'classic',\n",
       "   'surreal',\n",
       "   'atmospheric']],\n",
       " [296,\n",
       "  ['action',\n",
       "   'rivet',\n",
       "   'masterpiece',\n",
       "   'drug',\n",
       "   'dialog',\n",
       "   'quote',\n",
       "   'comedy',\n",
       "   'storytelling',\n",
       "   'philosophical',\n",
       "   'homosexuality',\n",
       "   'amaze',\n",
       "   'nan',\n",
       "   'character',\n",
       "   'crime',\n",
       "   'mobster',\n",
       "   'funny',\n",
       "   'cool',\n",
       "   'thriller',\n",
       "   'dark',\n",
       "   'unpredictable',\n",
       "   'dvd',\n",
       "   'quirky',\n",
       "   'drama',\n",
       "   'stylize',\n",
       "   'humorous',\n",
       "   'violence',\n",
       "   'suspense',\n",
       "   'dialogue',\n",
       "   'watch',\n",
       "   'humor',\n",
       "   'entertain',\n",
       "   'satire',\n",
       "   'violent',\n",
       "   'nonlinear',\n",
       "   'gun',\n",
       "   's',\n",
       "   'classic',\n",
       "   'rape',\n",
       "   'intense',\n",
       "   'atmospheric',\n",
       "   'innovative',\n",
       "   'act']],\n",
       " [805, ['vengeance', 'rape']],\n",
       " [1136,\n",
       "  ['british',\n",
       "   'comedy',\n",
       "   'nan',\n",
       "   'biblical',\n",
       "   'funny',\n",
       "   'awesome',\n",
       "   'humorous',\n",
       "   'parody',\n",
       "   'religion',\n",
       "   'hilarious',\n",
       "   'watch',\n",
       "   'english',\n",
       "   'humor',\n",
       "   'england',\n",
       "   'satire',\n",
       "   'medieval',\n",
       "   'spoof',\n",
       "   'satirical',\n",
       "   'rabbit',\n",
       "   's',\n",
       "   'inventive',\n",
       "   'influential',\n",
       "   'classic']]]"
      ]
     },
     "execution_count": 138,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tags_movies"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 139,
   "metadata": {},
   "outputs": [],
   "source": [
    "from sklearn.metrics.pairwise import cosine_similarity\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "\n",
    "def calculate_similarity_for_recommendations(recommendations, tags_movies, df_feat, user_features, df_wsd, user_wsd):\n",
    "    similarity_list = []\n",
    "\n",
    "    # Create a dictionary to easily fetch movie tags\n",
    "    tags_movies_dict = dict(tags_movies)\n",
    "\n",
    "    for movieId, _ in recommendations:\n",
    "        movie_tags = tags_movies_dict.get(movieId, [])  # Fetch the tags from the tags_movies dictionary\n",
    "        if not movie_tags:\n",
    "            continue\n",
    "\n",
    "        for user_tag in user_features['tag'].unique():\n",
    "            for movie_tag in movie_tags:\n",
    "\n",
    "                user_wsd_row = user_wsd[user_wsd['tag'] == user_tag]\n",
    "                movie_wsd_row = df_wsd[(df_wsd['movieId'] == movieId) & (df_wsd['tag'] == movie_tag)]\n",
    "\n",
    "                # nested loop to calculate the wsd\n",
    "                wsd_similarities = []\n",
    "                for user_sense in user_wsd_row['disambiguated_sense'].values:\n",
    "                    for movie_sense in movie_wsd_row['disambiguated_sense'].values:\n",
    "                        wsd_similarities.append(user_sense == movie_sense)\n",
    "\n",
    "                if wsd_similarities:\n",
    "                    wsd_similarity = np.mean(wsd_similarities)\n",
    "                else:\n",
    "                    wsd_similarity = 0\n",
    "\n",
    "                wsd_confidence = movie_wsd_row['confidence'].mean() if not movie_wsd_row.empty else 0\n",
    "\n",
    "                user_feat_row = user_features[user_features['tag'] == user_tag]\n",
    "                movie_feat_row = df_feat[df_feat['tag'] == movie_tag]\n",
    "\n",
    "                pos_match = (user_feat_row['POS'].values == movie_feat_row['POS'].values).mean() if user_feat_row['POS'].values.size and movie_feat_row['POS'].values.size else 0\n",
    "                ner_match = (user_feat_row['ner_label'].values == movie_feat_row['ner_label'].values).mean() if user_feat_row['ner_label'].values.size and movie_feat_row['ner_label'].values.size else 0\n",
    "                sentiment_match = (user_feat_row['sentiment_label'].values == movie_feat_row['sentiment_label'].values).mean() if user_feat_row['sentiment_label'].values.size and movie_feat_row['sentiment_label'].values.size else 0\n",
    "                \n",
    "                # Check for cluster match\n",
    "                cluster_match = int(user_feat_row['cluster'].values[0] == movie_feat_row['cluster'].values[0]) if user_feat_row['cluster'].values.size and movie_feat_row['cluster'].values.size else 0\n",
    "\n",
    "                similarity_list.append({\n",
    "                    'movieId': movieId, \n",
    "                    'user_tag': user_tag,\n",
    "                    'movie_tag': movie_tag,\n",
    "                    'wsd_similarity': wsd_similarity,\n",
    "                    'wsd_confidence': wsd_confidence,\n",
    "                    'pos_match': pos_match,\n",
    "                    'ner_match': ner_match,\n",
    "                    'sentiment_match': sentiment_match,\n",
    "                    'cluster_match': cluster_match  # Adding the cluster match to the dataframe\n",
    "                })\n",
    "\n",
    "    similarity_df = pd.DataFrame(similarity_list)\n",
    "    return similarity_df\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 140,
   "metadata": {},
   "outputs": [],
   "source": [
    "df_feat.to_json(\"../dataset/df_feat.json\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 141,
   "metadata": {},
   "outputs": [],
   "source": [
    "similarity_df = calculate_similarity_for_recommendations(recommendations, tags_movies, df_feat, user_features, df_wsd, user_wsd)\n",
    " "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 142,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>movieId</th>\n",
       "      <th>user_tag</th>\n",
       "      <th>movie_tag</th>\n",
       "      <th>wsd_similarity</th>\n",
       "      <th>wsd_confidence</th>\n",
       "      <th>pos_match</th>\n",
       "      <th>ner_match</th>\n",
       "      <th>sentiment_match</th>\n",
       "      <th>cluster_match</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>action</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0.395202</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>space</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.389017</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>luke</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.398942</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>sequel</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.382782</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>robot</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.383806</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12685</th>\n",
       "      <td>1136</td>\n",
       "      <td>robot</td>\n",
       "      <td>rabbit</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.388548</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12686</th>\n",
       "      <td>1136</td>\n",
       "      <td>robot</td>\n",
       "      <td>s</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.396197</td>\n",
       "      <td>0.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12687</th>\n",
       "      <td>1136</td>\n",
       "      <td>robot</td>\n",
       "      <td>inventive</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.375202</td>\n",
       "      <td>0.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12688</th>\n",
       "      <td>1136</td>\n",
       "      <td>robot</td>\n",
       "      <td>influential</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.368682</td>\n",
       "      <td>0.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12689</th>\n",
       "      <td>1136</td>\n",
       "      <td>robot</td>\n",
       "      <td>classic</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.394072</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>12690 rows × 9 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "       movieId user_tag    movie_tag  wsd_similarity  wsd_confidence  \\\n",
       "0          260   action       action             1.0        0.395202   \n",
       "1          260   action        space             0.0        0.389017   \n",
       "2          260   action         luke             0.0        0.398942   \n",
       "3          260   action       sequel             0.0        0.382782   \n",
       "4          260   action        robot             0.0        0.383806   \n",
       "...        ...      ...          ...             ...             ...   \n",
       "12685     1136    robot       rabbit             0.0        0.388548   \n",
       "12686     1136    robot            s             0.0        0.396197   \n",
       "12687     1136    robot    inventive             0.0        0.375202   \n",
       "12688     1136    robot  influential             0.0        0.368682   \n",
       "12689     1136    robot      classic             0.0        0.394072   \n",
       "\n",
       "       pos_match  ner_match  sentiment_match  cluster_match  \n",
       "0            1.0        1.0              1.0              1  \n",
       "1            1.0        1.0              1.0              0  \n",
       "2            0.0        0.0              1.0              0  \n",
       "3            1.0        1.0              1.0              0  \n",
       "4            1.0        1.0              1.0              0  \n",
       "...          ...        ...              ...            ...  \n",
       "12685        1.0        1.0              1.0              0  \n",
       "12686        0.0        1.0              1.0              0  \n",
       "12687        0.0        1.0              1.0              0  \n",
       "12688        0.0        1.0              1.0              0  \n",
       "12689        1.0        1.0              0.0              0  \n",
       "\n",
       "[12690 rows x 9 columns]"
      ]
     },
     "execution_count": 142,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "similarity_df"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### need to calculate a similarity score between user_tag and movie_tag using the similarity metrics in similarity_df\n",
    "\n",
    "- These weights - hypothetical -> should change these after testing\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 143,
   "metadata": {},
   "outputs": [],
   "source": [
    "def calculate_total_similarity(row, weights):\n",
    "    return sum(row[metric] * weight for metric, weight in weights.items())\n",
    "\n",
    "weights = {\n",
    "    'wsd_similarity': 0.05,\n",
    "    'wsd_confidence': 0.05,\n",
    "    'pos_match': 0.3,\n",
    "    'ner_match': 0.3,\n",
    "    'sentiment_match': 0.2,\n",
    "    'cluster_match': 0.1\n",
    "}\n",
    "\n",
    "# Assuming similarity_df is your DataFrame\n",
    "similarity_df['total_similarity'] = similarity_df.apply(lambda row: calculate_total_similarity(row, weights), axis=1)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 144,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>movieId</th>\n",
       "      <th>user_tag</th>\n",
       "      <th>movie_tag</th>\n",
       "      <th>wsd_similarity</th>\n",
       "      <th>wsd_confidence</th>\n",
       "      <th>pos_match</th>\n",
       "      <th>ner_match</th>\n",
       "      <th>sentiment_match</th>\n",
       "      <th>cluster_match</th>\n",
       "      <th>total_similarity</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>action</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0.395202</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "      <td>0.969760</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>space</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.389017</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "      <td>0.819451</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>luke</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.398942</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "      <td>0.219947</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>sequel</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.382782</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "      <td>0.819139</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>robot</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.383806</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "      <td>0.819190</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>heroic</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.395289</td>\n",
       "      <td>0.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "      <td>0.319764</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>series</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.386528</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "      <td>0.519326</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>adventure</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.394330</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "      <td>0.819717</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>awesome</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.390007</td>\n",
       "      <td>0.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0</td>\n",
       "      <td>0.319500</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>260</td>\n",
       "      <td>action</td>\n",
       "      <td>stylize</td>\n",
       "      <td>0.0</td>\n",
       "      <td>0.398942</td>\n",
       "      <td>0.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>0</td>\n",
       "      <td>0.519947</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   movieId user_tag  movie_tag  wsd_similarity  wsd_confidence  pos_match  \\\n",
       "0      260   action     action             1.0        0.395202        1.0   \n",
       "1      260   action      space             0.0        0.389017        1.0   \n",
       "2      260   action       luke             0.0        0.398942        0.0   \n",
       "3      260   action     sequel             0.0        0.382782        1.0   \n",
       "4      260   action      robot             0.0        0.383806        1.0   \n",
       "5      260   action     heroic             0.0        0.395289        0.0   \n",
       "6      260   action     series             0.0        0.386528        1.0   \n",
       "7      260   action  adventure             0.0        0.394330        1.0   \n",
       "8      260   action    awesome             0.0        0.390007        0.0   \n",
       "9      260   action    stylize             0.0        0.398942        0.0   \n",
       "\n",
       "   ner_match  sentiment_match  cluster_match  total_similarity  \n",
       "0        1.0              1.0              1          0.969760  \n",
       "1        1.0              1.0              0          0.819451  \n",
       "2        0.0              1.0              0          0.219947  \n",
       "3        1.0              1.0              0          0.819139  \n",
       "4        1.0              1.0              0          0.819190  \n",
       "5        1.0              0.0              0          0.319764  \n",
       "6        0.0              1.0              0          0.519326  \n",
       "7        1.0              1.0              0          0.819717  \n",
       "8        1.0              0.0              0          0.319500  \n",
       "9        1.0              1.0              0          0.519947  "
      ]
     },
     "execution_count": 144,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "similarity_df.head(10)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Return distinct tags"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 145,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>movieId</th>\n",
       "      <th>movie_tag</th>\n",
       "      <th>ner_match</th>\n",
       "      <th>pos_match</th>\n",
       "      <th>cluster_match</th>\n",
       "      <th>total_similarity</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>8844</th>\n",
       "      <td>7438</td>\n",
       "      <td>japan</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "      <td>0.919947</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>260</td>\n",
       "      <td>force</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "      <td>0.919821</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6418</th>\n",
       "      <td>6016</td>\n",
       "      <td>depress</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "      <td>0.919796</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6402</th>\n",
       "      <td>6016</td>\n",
       "      <td>enthral</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "      <td>0.919774</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11310</th>\n",
       "      <td>296</td>\n",
       "      <td>character</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "      <td>0.919738</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4112</th>\n",
       "      <td>2959</td>\n",
       "      <td>identity</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "      <td>0.919733</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6419</th>\n",
       "      <td>6016</td>\n",
       "      <td>refresh</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "      <td>0.919650</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5997</th>\n",
       "      <td>3996</td>\n",
       "      <td>crime</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "      <td>0.919633</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11625</th>\n",
       "      <td>1136</td>\n",
       "      <td>spoof</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "      <td>0.919630</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10835</th>\n",
       "      <td>296</td>\n",
       "      <td>act</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1.0</td>\n",
       "      <td>1</td>\n",
       "      <td>0.919611</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "       movieId  movie_tag  ner_match  pos_match  cluster_match  \\\n",
       "8844      7438      japan        1.0        1.0              1   \n",
       "10         260      force        1.0        1.0              1   \n",
       "6418      6016    depress        1.0        1.0              1   \n",
       "6402      6016    enthral        1.0        1.0              1   \n",
       "11310      296  character        1.0        1.0              1   \n",
       "4112      2959   identity        1.0        1.0              1   \n",
       "6419      6016    refresh        1.0        1.0              1   \n",
       "5997      3996      crime        1.0        1.0              1   \n",
       "11625     1136      spoof        1.0        1.0              1   \n",
       "10835      296        act        1.0        1.0              1   \n",
       "\n",
       "       total_similarity  \n",
       "8844           0.919947  \n",
       "10             0.919821  \n",
       "6418           0.919796  \n",
       "6402           0.919774  \n",
       "11310          0.919738  \n",
       "4112           0.919733  \n",
       "6419           0.919650  \n",
       "5997           0.919633  \n",
       "11625          0.919630  \n",
       "10835          0.919611  "
      ]
     },
     "execution_count": 145,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Sort the DataFrame by 'total_similarity' in descending order\n",
    "sorted_similarity_df = similarity_df.sort_values(by='total_similarity', ascending=False)\n",
    "\n",
    "# Remove rows where 'movie_tag' is also present in 'user_tag' column\n",
    "filtered_similarity_df = sorted_similarity_df[~sorted_similarity_df['movie_tag'].isin(sorted_similarity_df['user_tag'])]\n",
    "\n",
    "# Drop duplicates based on the 'movie_tag' column to get distinct tags\n",
    "distinct_tags_df = filtered_similarity_df.drop_duplicates(subset=['movie_tag'])\n",
    "\n",
    "# Get the top 10 distinct tags along with their movieId\n",
    "top_10_distinct_tags_with_movieId = distinct_tags_df[['movieId', 'movie_tag', 'ner_match', 'pos_match', 'cluster_match', 'total_similarity']].head(10)\n",
    "\n",
    "top_10_distinct_tags_with_movieId"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 146,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>userId</th>\n",
       "      <th>recommendations</th>\n",
       "      <th>tags_movies</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>318</td>\n",
       "      <td>[(260, 0.1389), (780, 0.1588), (1196, 0.2946),...</td>\n",
       "      <td>[[260, [action, space, luke, sequel, robot, he...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2274</td>\n",
       "      <td>[(2762, 0.1212), (2959, 0.1212), (3996, 0.2166...</td>\n",
       "      <td>[[2762, [nan, enigmatic, thriller, unpredictab...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3031</td>\n",
       "      <td>[(70, -0.4981), (353, 0.25), (805, 0.25), (487...</td>\n",
       "      <td>[[70, [gore, brother, vampire, intense, nan, s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4087</td>\n",
       "      <td>[(296, 0.0051), (805, 0.2713), (1136, 0.205), ...</td>\n",
       "      <td>[[296, [action, rivet, masterpiece, drug, dial...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4450</td>\n",
       "      <td>[(1994, 0.1524), (4995, 0.205), (4226, 0.145),...</td>\n",
       "      <td>[[1994, [thriller, ghost]], [4995, [education,...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1547</th>\n",
       "      <td>117265</td>\n",
       "      <td>[(47, 0.176), (50, 0.1822), (356, 0.1751), (10...</td>\n",
       "      <td>[[47, [overrate, investigation, philosophical,...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1548</th>\n",
       "      <td>117607</td>\n",
       "      <td>[(1257, 0.1369), (1748, 0.1617), (2916, -0.027...</td>\n",
       "      <td>[[1257, [imagination, goofy, silly, skiing, qu...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1549</th>\n",
       "      <td>123915</td>\n",
       "      <td>[(1, 0.1628), (22, -0.2524), (70, 0.1625), (11...</td>\n",
       "      <td>[[1, [woody, adventure, watch, buy, comedy, fa...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1550</th>\n",
       "      <td>127468</td>\n",
       "      <td>[(12, 0.1932), (21, 0.1604), (26, 0.1674), (32...</td>\n",
       "      <td>[[12, [vampire, gothic]], [21, [mafia, hollywo...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1551</th>\n",
       "      <td>136810</td>\n",
       "      <td>[(32, 0.1314), (436, 0.1314), (593, 0.1314), (...</td>\n",
       "      <td>[[32, [interest, british, genetics, original, ...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>1552 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      userId                                    recommendations  \\\n",
       "0        318  [(260, 0.1389), (780, 0.1588), (1196, 0.2946),...   \n",
       "1       2274  [(2762, 0.1212), (2959, 0.1212), (3996, 0.2166...   \n",
       "2       3031  [(70, -0.4981), (353, 0.25), (805, 0.25), (487...   \n",
       "3       4087  [(296, 0.0051), (805, 0.2713), (1136, 0.205), ...   \n",
       "4       4450  [(1994, 0.1524), (4995, 0.205), (4226, 0.145),...   \n",
       "...      ...                                                ...   \n",
       "1547  117265  [(47, 0.176), (50, 0.1822), (356, 0.1751), (10...   \n",
       "1548  117607  [(1257, 0.1369), (1748, 0.1617), (2916, -0.027...   \n",
       "1549  123915  [(1, 0.1628), (22, -0.2524), (70, 0.1625), (11...   \n",
       "1550  127468  [(12, 0.1932), (21, 0.1604), (26, 0.1674), (32...   \n",
       "1551  136810  [(32, 0.1314), (436, 0.1314), (593, 0.1314), (...   \n",
       "\n",
       "                                            tags_movies  \n",
       "0     [[260, [action, space, luke, sequel, robot, he...  \n",
       "1     [[2762, [nan, enigmatic, thriller, unpredictab...  \n",
       "2     [[70, [gore, brother, vampire, intense, nan, s...  \n",
       "3     [[296, [action, rivet, masterpiece, drug, dial...  \n",
       "4     [[1994, [thriller, ghost]], [4995, [education,...  \n",
       "...                                                 ...  \n",
       "1547  [[47, [overrate, investigation, philosophical,...  \n",
       "1548  [[1257, [imagination, goofy, silly, skiing, qu...  \n",
       "1549  [[1, [woody, adventure, watch, buy, comedy, fa...  \n",
       "1550  [[12, [vampire, gothic]], [21, [mafia, hollywo...  \n",
       "1551  [[32, [interest, british, genetics, original, ...  \n",
       "\n",
       "[1552 rows x 3 columns]"
      ]
     },
     "execution_count": 146,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_rec"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
