{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "1340b53d-7d88-4884-9161-7fb94492512e",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import torch\n",
    "from glob import glob\n",
    "from transformers import AutoConfig, AutoModelForCausalLM, AutoTokenizer\n",
    "from scipy.special import softmax\n",
    "from scipy.stats import entropy\n",
    "import pandas as pd\n",
    "from matplotlib import pyplot as plt\n",
    "from tqdm import tqdm\n",
    "from pathlib import Path"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "5e20d4b4-76f6-48e4-bb8f-a1f6ef231b13",
   "metadata": {},
   "outputs": [],
   "source": [
    "def top_eigen(A, n, eps=1e-5):\n",
    "    '''\n",
    "    Uses power method to find top eigenvector of nxn matrix A\n",
    "    A should be a function implementing multiplication v -> Av\n",
    "    Returns top eigenvector, top eigenvalue\n",
    "    '''\n",
    "    v0 = np.zeros((n,))\n",
    "    v1 = np.random.normal(0, 1, (n,))\n",
    "    v1 /= np.linalg.norm(v1)\n",
    "    coef0 = None\n",
    "    coef1 = None\n",
    "    while coef0 is None or abs(coef1 - coef0) / abs(coef0) > eps:\n",
    "        v0 = v1\n",
    "        v1 = A(v1)\n",
    "        coef0 = coef1\n",
    "        coef1 = np.dot(v0, v1)  # = v0.T @ v0. Note ||v0||=1 already here.\n",
    "        v1 /= np.linalg.norm(v1)\n",
    "        #print(coef1)\n",
    "    return v1, np.dot(v1, A(v1))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "04dbf577-6adf-41c7-ba70-382e7fdfb2af",
   "metadata": {},
   "outputs": [],
   "source": [
    "def eigen_gen(A, n, eps=1e-5):\n",
    "    vs = []\n",
    "    lams = []\n",
    "    cur_A = A\n",
    "    while True:\n",
    "        v, lam = top_eigen(cur_A, n, eps=eps)\n",
    "        vs.append(v)\n",
    "        lams.append(lam)\n",
    "        yield v, lam\n",
    "        cur_A = lambda x: A(x) - sum(lam * np.dot(v, x) * v for v, lam in zip(vs, lams))\n",
    "\n",
    "def topk_eigen(A, n, k, eps=1e-5):\n",
    "    '''\n",
    "    Returns top k eigenvectors (n, k) and eigenvalues (k,)\n",
    "    '''\n",
    "    vs = []\n",
    "    lams = []\n",
    "    it = eigen_gen(A, n, eps=eps)\n",
    "    for _ in range(k):\n",
    "        v, lam = next(it)\n",
    "        vs.append(v)\n",
    "        lams.append(lam)\n",
    "    return np.array(vs).T, np.array(lams)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "cc73edf7-9803-44b6-8e2c-75b47a3e8a61",
   "metadata": {},
   "outputs": [],
   "source": [
    "def topk_svd(A, AT, n, m, k, eps=1e-5, save_name=None):\n",
    "    '''\n",
    "    Given nxm matrix A, returns U (n, k), S (n,), VT(k, m).\n",
    "    A should be provided as two functions v -> Av and v -> ATv\n",
    "    '''\n",
    "    u_eigens = eigen_gen(lambda x: A(AT(x)), n, eps=eps)\n",
    "    v_eigens = eigen_gen(lambda x: AT(A(x)), m, eps=eps)\n",
    "    U = []\n",
    "    S = []\n",
    "    V = []\n",
    "    Path('SVD').mkdir(exist_ok=True)\n",
    "    for i in tqdm(range(k)):\n",
    "        if n < m:\n",
    "            u, lam = next(u_eigens)\n",
    "            s = np.sqrt(lam)\n",
    "            v = AT(u) / s\n",
    "        else:\n",
    "            v, lam = next(v_eigens)\n",
    "            s = np.sqrt(lam)\n",
    "            u = A(v) / s\n",
    "        U.append(u)\n",
    "        S.append(s)\n",
    "        V.append(v)\n",
    "        if save_name:\n",
    "            np.save(f'SVD/{save_name}_U_{i}', u)\n",
    "            np.save(f'SVD/{save_name}_S_{i}', s)\n",
    "            np.save(f'SVD/{save_name}_V_{i}', v)\n",
    "    U, S, V = np.array(U).T, np.array(S), np.array(V).T\n",
    "    if save_name:\n",
    "        np.save(f'SVD/{save_name}_U', U)\n",
    "        np.save(f'SVD/{save_name}_S', S)\n",
    "        np.save(f'SVD/{save_name}_V', V.T)\n",
    "    return U, S, V.T"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "5fd1a490-5a56-4e1a-a5c8-16fc6f827e4b",
   "metadata": {},
   "outputs": [],
   "source": [
    "from time import time\n",
    "TIME = time()\n",
    "def bench():\n",
    "    global TIME\n",
    "    print('TIME ELAPSED:', time() - TIME)\n",
    "    TIME = time()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "0b77954a-c6f6-42f0-9c57-8d368a4837dd",
   "metadata": {},
   "outputs": [],
   "source": [
    "ckpt_f = '/workspace/checkpoints/LLAMA2-NECK-SWEEP*/llama-2-7b-hf_hidden_idxs-32_hidden_lb-{}_token_lb-{}_neck_cls-mlp_*'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "498dc378-ca8e-460e-8ca3-09408a37edae",
   "metadata": {},
   "outputs": [],
   "source": [
    "necks = [\n",
    "    ('t', '-1', '0'),  # token\n",
    "    ('h', '0', '-1'),  # hidden\n",
    "    ('ht', '0', '0'),  # both\n",
    "]\n",
    "for name, h, t in necks:\n",
    "    ckpt = glob(ckpt_f.format(h, t))[0]\n",
    "    state = torch.load(ckpt)['state_dict']\n",
    "    globals()[f'W{name}'] = state['future_neck.layers.0.weight'].cpu().numpy()\n",
    "    globals()[f'b{name}'] = state['future_neck.layers.0.bias'].cpu().numpy()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "97bfb1f9-f295-44df-81d7-2a42e5a7fc36",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "53e1f972dcd343558adfd59e2f8e1935",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "config.json:   0%|          | 0.00/578 [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "49b6ca63d0f0400eb10346e56602812e",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "pytorch_model.bin.index.json:   0%|          | 0.00/26.8k [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "de82642580724464a195f03d3c4bb510",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Downloading shards:   0%|          | 0/2 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "1caf4eae4e7144ada4a0f67e25e5a2d3",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "pytorch_model-00001-of-00002.bin:   0%|          | 0.00/9.98G [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "5ac9c48650c044b8b53b31461093f38d",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "pytorch_model-00002-of-00002.bin:   0%|          | 0.00/3.50G [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "ac5f7c5fc0f3447ebf04be518acaacdf",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Loading checkpoint shards:   0%|          | 0/2 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "e17cd31205184180abf081036fe79bc0",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "generation_config.json:   0%|          | 0.00/132 [00:00<?, ?B/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "model_name = 'daryl149/llama-2-7b-hf'\n",
    "config = AutoConfig.from_pretrained(model_name)\n",
    "model = AutoModelForCausalLM.from_pretrained(model_name, config=config)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "98f63b5b-4e1f-42b3-bc8b-c36bbdf40496",
   "metadata": {},
   "outputs": [],
   "source": [
    "params = dict(model.named_parameters())\n",
    "modules = dict(model.named_modules())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "37c94d6c-92ed-4f73-abd7-88efb90c7080",
   "metadata": {},
   "outputs": [],
   "source": [
    "E = params['model.embed_tokens.weight'].detach().numpy()\n",
    "D = params['lm_head.weight'].detach().numpy()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 146,
   "id": "6281b903-8044-4fa8-bbb8-6bcd5943a881",
   "metadata": {},
   "outputs": [],
   "source": [
    "UD, SD, VD = np.linalg.svd(D, full_matrices=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "8d7a85ee-fad8-40ca-99b5-07bb9ec6b5da",
   "metadata": {},
   "outputs": [],
   "source": [
    "tokenizer = AutoTokenizer.from_pretrained(model_name)\n",
    "Token = {v: k for k, v in tokenizer.get_vocab().items()}\n",
    "\n",
    "def topk(v, k=40):\n",
    "    # Takes in logits\n",
    "    v = softmax(v.flatten())\n",
    "    idxs = v.argsort()[-k:][::-1]\n",
    "    ret = [(Token[i], v[i]) for i in idxs]\n",
    "    return pd.DataFrame(ret, columns=['token', 'prob'])"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "dae24431-f87d-4c77-ac97-4d7eed5e502a",
   "metadata": {},
   "source": [
    "The key observation here is that a future neck $f(h, x)$ where $h$ is the topmost hidden layer and $x$ is the next embedded token induces a future head $F(\\tilde h, \\tilde x) = DF(D^\\dagger \\tilde h, E \\tilde x)$, where $E$ is the embedding, $D$ is the unembedding, and $D^\\dagger$ is the Moore-Penrose pseudoinverse of $D$. So, assuming $D$ is injective, $D^\\dagger D=I$. Note now that $\\tilde h$ and $\\tilde x$ are now in token space."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 57,
   "id": "5d70980c-2a8d-42d1-bb50-b5ca941a586c",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "TIME ELAPSED: 2072.547867536545\n",
      "TIME ELAPSED: 4.12051796913147\n"
     ]
    }
   ],
   "source": [
    "x = np.random.normal(0, 1, D.shape[0])\n",
    "bench()\n",
    "a = D @ Wt @ np.dot(E.T, x)\n",
    "bench()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "e38ff3db-65d3-4f95-b7dd-b9ea96195f75",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 10/10 [09:43<00:00, 58.32s/it]\n"
     ]
    }
   ],
   "source": [
    "# No neck: DE^T\n",
    "Ue, Se, Ve = topk_svd(\n",
    "    lambda x: np.dot(D, np.dot(E.T, x)),\n",
    "    lambda x: np.dot(E, np.dot(D.T, x)),\n",
    "    n=D.shape[0],\n",
    "    m=E.shape[0],\n",
    "    k=10,\n",
    "    eps=1e-7,\n",
    "    save_name='e',\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 139,
   "id": "91b511a5-a7f2-4935-86db-1e884ed97bea",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 10/10 [43:00<00:00, 258.04s/it]\n"
     ]
    }
   ],
   "source": [
    "# Token only: W\\hat = DWE^T\n",
    "DWt = D @ Wt\n",
    "EWtT = E @ Wt.T\n",
    "Ut, St, Vt = topk_svd(\n",
    "    lambda x: np.dot(DWt, np.dot(E.T, x)),\n",
    "    lambda x: np.dot(EWtT, np.dot(D.T, x)),\n",
    "    n=D.shape[0],\n",
    "    m=E.shape[0],\n",
    "    k=10,\n",
    "    eps=1e-7,\n",
    "    save_name='t',\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 181,
   "id": "8e4233dd-5a88-47b2-8a65-e6fb624203dd",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 10/10 [10:16<00:00, 61.68s/it]\n"
     ]
    }
   ],
   "source": [
    "# Hidden only, but with E in front? W\\hat = DWE^T\n",
    "DWh = D @ Wh\n",
    "EWhT = E @ Wh.T\n",
    "Ut, St, Vt = topk_svd(\n",
    "    lambda x: np.dot(DWh, np.dot(E.T, x)),\n",
    "    lambda x: np.dot(EWhT, np.dot(D.T, x)),\n",
    "    n=D.shape[0],\n",
    "    m=E.shape[0],\n",
    "    k=10,\n",
    "    eps=1e-7,\n",
    "    save_name='he',\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 174,
   "id": "ffa7df3a-2758-4a5d-b30a-204f5e27dff4",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(32000, 4096)"
      ]
     },
     "execution_count": 174,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "D.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 176,
   "id": "791b6029-9a56-4867-b5b4-e5c92a5e2743",
   "metadata": {},
   "outputs": [],
   "source": [
    "A = VD.T @ np.diag(1 / SD) @ (UD.T @ D)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 178,
   "id": "b9c6b6d4-e778-4ad3-ad24-536ec49f8ba4",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "2.4197103258201705e-05"
      ]
     },
     "execution_count": 178,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.linalg.norm(A - np.eye(4096))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a5a6933f-3dcc-4e74-a3e9-ebc9e5ddb2c1",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Hidden only: W\\hat = DW(D^\\dagger)\n",
    "Dp = VD.T @ np.diag(1 / SD) @ UD.T\n",
    "DWh = D @ Wh\n",
    "DpTWhT = Dp.T @ Wh.T\n",
    "Uh, Sh, Vh = topk_svd(\n",
    "    lambda x: np.dot(DWh, np.dot(Dp, x)),\n",
    "    lambda x: np.dot(DpTWhT, np.dot(D.T, x)),\n",
    "    n=D.shape[0],\n",
    "    m=Dp.shape[1],\n",
    "    k=10,\n",
    "    eps=1e-7,\n",
    "    save_name='h',\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 185,
   "id": "bdd98c7b-5d0c-473b-bec9-ccebeb2f9d82",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 10/10 [12:51<00:00, 77.13s/it]\n"
     ]
    }
   ],
   "source": [
    "# Hidden and token: W\\hat = DW[D^\\dagger, E^T]\n",
    "n, m = Wht.shape\n",
    "DWht = D @ Wht\n",
    "DpTWhtT = Dp.T @ Wht[:,:n].T\n",
    "EWhtT = E @ Wht[:,n:].T\n",
    "\n",
    "def A(x):\n",
    "    n = x.shape[0]\n",
    "    u = np.dot(Dp, x[:n//2]) # * 500 # make norms roughly comparable???\n",
    "    v = np.dot(E.T, x[n//2:])\n",
    "    return np.dot(DWht, np.concatenate([u, v]))\n",
    "    \n",
    "def AT(x):\n",
    "    a = np.dot(D.T, x)\n",
    "    return np.concatenate([\n",
    "        np.dot(DpTWhtT, a),# * 500,\n",
    "        np.dot(EWhtT, a)\n",
    "    ])\n",
    "    \n",
    "Uht, Sht, Vht = topk_svd(\n",
    "    A,\n",
    "    AT,\n",
    "    n=D.shape[0],\n",
    "    m=2*D.shape[0],\n",
    "    k=10,\n",
    "    eps=1e-7,\n",
    "    save_name='ht',\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "7d8b2a1b-e56d-47ce-a874-92de49d24eff",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<matplotlib.lines.Line2D at 0x7f9a1a2af850>]"
      ]
     },
     "execution_count": 16,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAiMAAAGdCAYAAADAAnMpAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjguMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8g+/7EAAAACXBIWXMAAA9hAAAPYQGoP6dpAAA6OUlEQVR4nO3deXhU5f3+8XsmyUwSskLIHgj7vgaIQa21RHEpLtWWWquIS39asCrWCi5YaytutfhVqq3WpbWK1YpaQRQRUBRBwhpWWRMD2YBksi8zz++PwGgElECSk5l5v65rriFnnjPzmRzh3J5nOTZjjBEAAIBF7FYXAAAAAhthBAAAWIowAgAALEUYAQAAliKMAAAASxFGAACApQgjAADAUoQRAABgqWCrCzgRHo9H+/btU2RkpGw2m9XlAACAE2CMUUVFhZKTk2W3H//6h0+EkX379iktLc3qMgAAwEnIz89XamrqcV/3iTASGRkpqenLREVFWVwNAAA4ES6XS2lpad7z+PH4RBg50jUTFRVFGAEAwMd83xALBrACAABLEUYAAIClCCMAAMBShBEAAGApwggAALAUYQQAAFiKMAIAACxFGAEAAJYijAAAAEu1OIx8/PHHmjBhgpKTk2Wz2fTWW2997z5Lly7VyJEj5XQ61bt3b7344osnUSoAAPBHLQ4jVVVVGjZsmObMmXNC7Xfv3q0LL7xQZ599ttatW6dbb71V119/vd5///0WFwsAAPxPi+9Nc/755+v8888/4fbPPPOMevTooT//+c+SpAEDBmj58uX6y1/+ovHjx7f04wEAgJ9p8xvlrVixQtnZ2c22jR8/Xrfeeutx96mrq1NdXZ33Z5fL1VblAQDQqtweo9oGt+oaPd7nuka3ahs8qmtwq97tUaPHyO02avQc/rPHqNF9+NlzePs3fnYfbmeMZCTJGJmmJxl9vd2YphqMmjY0bWv+etOeR7v29B5K6xzeLr+jb2vzMFJYWKiEhIRm2xISEuRyuVRTU6OwsLCj9pk1a5buv//+ti4NAAA1uj1y1TaqrLpeh6ob5KptUFVdo6rqGlVZ5/b+ueLwc9P2RlXVuVVV36i6Bk+z8NHoOfbJvqObMCzZf8PIyZgxY4amTZvm/dnlciktLc3CigAAvsAYo6p6t0oq6lRaWed9Lq2oU1lNgw5VN6isul7lNQ0qq27Qoep6VdQ2tlk9jiC7nMF2OUOCDj/b5QiyKyTIriC7TcF2m4LstqN+Dg6yKdhub/az3WaTzSbZdORZstlsknTUdu82m63p56P2O7rWhKjQNvs9fJ82DyOJiYkqKipqtq2oqEhRUVHHvCoiSU6nU06ns61LAwD4kOr6Ru0rq9X+8hrtL6vVvvIaFVc0BY2Syq/DR22D56TeP9IZrOjwEEWFhigiNFgRzmB1cgYrwhn0jT83PXdyBivSGaxwR5DCHEEKPRI2goMUGtL07Ay2y24/xlkfR2nzMJKVlaUFCxY027Zo0SJlZWW19UcDAHyEMUYHquq190C18g9Wq6CsRvvKarS/vNb7XF7TcMLv18kRpLhIp7pGOBUX4VSXCIc6d3IoOixEseEOxYSHKCY8RNFhjsPPIQoJYuktq7Q4jFRWVmrHjh3en3fv3q1169apc+fO6tatm2bMmKGCggL985//lCTdeOONeuqpp/S73/1O1157rT766CP95z//0fz581vvWwAAOrwGt0f7ymq090C19h5sCh17D1R5A0hVvft73yPSGaykmFAlRYcpOSZU8ZGh6hrZFDi6HgkfkQ6FOzrkKAQcR4uP1urVq3X22Wd7fz4ytmPSpEl68cUXtX//fuXl5Xlf79Gjh+bPn6/bbrtNTzzxhFJTU/Xcc88xrRcA/FRFbYN2lVRpR3GldpZUep/3Hqj+zsGdNpuUFBWqbl3ClRobruToUCXFhCkpOlTJh58jQ0Pa8ZugvdiMMR1+2K/L5VJ0dLTKy8sVFRVldTkAADWFjm2FFdpSWKEdRRXaUVKpncVVKnTVHncfZ7Bd3TqHq3uXcKV1Dlf3zuHq3qWTunUJV0pMmEJDgtrxG6Ctnej5m+tYAIDv5PEY7T1Yra37XdpSWKEt+13aWuhS/sGa4+7TNdKpXl07qXd8hHp1jfA+J0aFMqgTRyGMAAC8Gt0e7Sip1Ib8cm0oKFNugUvbCitU03Ds8RyJUaHqnxSpfgmR6hV/OHTERSg6nO4UnDjCCAAEKI/HaFdplTYWlGnDV+Xa8FW5Nu0rP+bUWGewXX0TIjUgKVL9E6PUPylSAxKjFNvJYUHl8DeEEQAIEOXVDVqTf0g5ew4pZ+8hbSwoV2Xd0Qt+RTiDNTglSkNTYzQ4JVoDk6KU3iVcwUx9RRshjACAHzLGaM+Baq3ec1Br8g5p9Z5D+rK48qh2oSF2DUqO1pCUaA1NjdbQ1Bj1jOvEuA60K8IIAPgBt8do8z6XPt91QCt3NwWQg1X1R7VL7xKujO6dldE9VsPTYtQ3IYIrHrAcYQQAfJDHY7Sl0KUVOw/o810HtWr3Abm+dY8VR7BdQ1OildE9VhndYzWye6ziIrjVBjoewggA+ABjjLYXVeqznaXeqx9l1c2XR49wBmtMj87K7NFZo9I7a3BKlJzBrNuBjo8wAgAd1IHKOi3fUaqPt5fqky9LVFxR1+z1To4gje7RWaf17KKsnl00KDmKLhf4JMIIAHQQDW6P1uw9pI+/LNHH20uVu69c31wjOzTErtHpnZXVqyl8DE6J5uZu8AuEEQCw0P7yGi3eUqyl20q0YmfpUTeL658YqbP6dtUP+nbVqPRYul3glwgjANCOjDHKLXDpwy1FWry1SLkFrmavd+7k0Jl94nRmn676QZ84xUeFWlQp0H4IIwDQxmob3Pp0R6k+3FKsj7YWqcj19dgPm00anhajcf3jdVbfeA1KjmKNDwQcwggAtIHy6gYt2lKkhbmFWr6jpNkS6+GOIJ3ZJ07jBiToR/3jmW6LgEcYAYBWcqCyTh9sLtJ7uYX6bEepGj1fjz5Njg7VuAEJGjcgXqf17KLQEMZ+AEcQRgDgFBS5avX+pkK9t7FQK3cf0Dfyh/olROq8wYk6d1CCBiZFyWaj+wU4FsIIALRQcUWt5m/Yr/kb9isn71Cz6beDU6J0/uAknTc4Ub26RlhXJOBDCCMAcAJctQ1amFuo/63fp093lDa7AjKiW4zOH5yo8wYlqVuXcOuKBHwUYQQAjqO2wa0lW4v19rp9+mhbseobvx6EOjwtRhOGJev8wYlKjgmzsErA9xFGAOAb3B6jT3eU6u11+/T+pkJV1n1987ne8RG6eFiyLhqerO5dOllYJeBfCCMAIGlnSaX+m/OV3lxToEJXrXd7cnSoJgxP1sXDUjQgKZJBqEAbIIwACFiu2ga9u36/3sjJ15q8Mu/26LAQ/Xhoki4ZkaKMbrEsQga0McIIgIDi9hh9trNUb+R8pYW5hao7PA7EbpN+2C9el2ekatyAeO4BA7QjwgiAgFBQVqPXvsjX66vztb/8626YPvER+umoVF0yPIX7wAAWIYwA8FuNbo+WbCvRKyv3aun2Eu96INFhIbp4eLIuz0jVkJRoxoEAFiOMAPA7+8pqNPeLfP3ni/xmg1HH9uqiK8Z007mDEuiGAToQwggAv9Do9mjpthK9uipPS7YVexcl69zJocszUvXz0WnqyYqoQIdEGAHg0w5W1evVVXn69+d7te8bY0GyenbRFZndNJ6rIECHRxgB4JNyC8r10md79Pb6fd6VUWPDQ3R5RqquGNONqyCADyGMAPAZDW6P3t9UqJc+26Mv9hzybh+SEq1JY9P146FJCg3hKgjgawgjADq80so6vboyT/9emecdkBpst+mCIUmaNDZdI7vFMCMG8GGEEQAd1pdFFXruk92at7ZA9e6mrpi4CKd+kdlNV2Z2UwLrggB+gTACoEMxxmjFrgN69uNdWrKtxLt9WFqMJo9N1/lDEhmQCvgZwgiADqHB7dGCjfv17Ce7lFvgkiTZbNL4gYm64Qc9lNG9s8UVAmgrhBEAlqqsa9TcVXl64dM9KiirkSSFhtj1s1Fpuvb0HkqP62RxhQDaGmEEgCVKKur0/Ke79fLne1VR2yhJiotwaFJWun55WnfFdnJYXCGA9kIYAdCuCspq9PdlOzX3i3zvHXN7de2kG87sqUtGpDA1FwhAhBEA7WJXSaWeXrpT89YWqPHwWu3D02I05ezeGtc/XnY7U3OBQEUYAdCmtux3ac6SHVqwcb/3fjFje3XRlLN7a2yvLqwPAoAwAqBtrM07pKc+2qHFW4u928b1j9eUH/XWyG6xFlYGoKMhjABoVevzy/SXD7dr6eE1Qmw26cIhSfr1D3trYHKUxdUB6IgIIwBaRW5Buf6yaLv3SkiQ3aZLR6To1z/sxU3rAHwnwgiAU7J5n0uzP9yuDzYXSZLsNumSESn6zY/6sEYIgBNCGAFwUrYWuvTEh1/qvdxCSU0h5OLhKbr5R725EgKgRQgjAFpkV0ml/rxou+Zv2C+paUzIhKHJ+s24PuodTwgB0HKEEQAnpLC8Vk8s/lL/WZ0v9+E5uhcOTdIt4/qob0KkxdUB8GWEEQDfqby6QX9dtkMvfrrHu2Jq9oB43X5uPw1IYnYMgFNHGAFwTDX1br3w2W49s3SnXIfvHTM6PVZ3ntdfo9K5gy6A1kMYAdBMg9uj/6zO1xMffqniijpJUv/ESP3uvH46u188K6YCaHWEEQCSJGOM3t9UpIcXbtXu0ipJUmpsmG4/t68uGpaiIO4dA6CNEEYAaMNXZfrju1u0as9BSVKXTg7d/KPeuiKzm5zB3EUXQNsijAABbF9ZjR59f5vmrS2QJIWG2HXDmT31/87qpQgn/zwAaB/8awMEoMq6Rv1t2U79/eNd3hkyPxmRot+O76fkmDCLqwMQaAgjQABxe4xeX52vxz7YrtLKpsGpY3p01j0XDtDQ1BhriwMQsAgjQID4fNcB/f6dTdpaWCFJSu8SrunnD9D4QQnMkAFgKcII4Of2ldXowQVb9O7h5dujw0L0m3F9dNVp3eUItltcHQAQRgC/Vdvg1nOf7NKcJTtV0+CW3Sb9IrObbj+nn2I7OawuDwC8CCOAnzHGaPGWYj0wf7P2HqiW1LRy6u8vGqRBydEWVwcARyOMAH5kV0ml/vDuZi3dViJJio906q4LBuji4cmMCwHQYRFGAD9QU+/Wkx99qWc/2aUGt1FIkE3XntFDN/+oD+uFAOjw+FcK8HFLthbr3rdz9dWhGknSWX27auaEgerVNcLiygDgxBBGAB9VWF6rP7y7SQs2FkqSkqNDdd9Fg3TuQKbqAvAthBHAx7g9Ri99tkd//mCbqurdCrLbdO3p6bo1u6860SUDwAfxLxfgQzZ8Vaa75m1UboFLkjSiW4z+dMkQDUyOsrgyADh5J7Xi0Zw5c5Senq7Q0FBlZmZq1apV39l+9uzZ6tevn8LCwpSWlqbbbrtNtbW1J1UwEIgqaht039u5unjOp8otcCkqNFh/unSw/nvjWIIIAJ/X4isjr732mqZNm6ZnnnlGmZmZmj17tsaPH69t27YpPj7+qPavvPKKpk+frueff15jx47V9u3bdc0118hms+nxxx9vlS8B+LMlW4t117yN2l/eFOAvGZ6suy8cqK6RTosrA4DWYTPGmJbskJmZqdGjR+upp56SJHk8HqWlpenmm2/W9OnTj2o/depUbdmyRYsXL/Zuu/3227Vy5UotX778hD7T5XIpOjpa5eXliori/wIRGA5W1esP/9ukt9btkyR17xKuP10yRGf0ibO4MgA4MSd6/m5RN019fb1ycnKUnZ399RvY7crOztaKFSuOuc/YsWOVk5Pj7crZtWuXFixYoAsuuOC4n1NXVyeXy9XsAQQKY4ze3bBP5zy+TG+t2ye7TbrhzB5aeMsPCCIA/FKLumlKS0vldruVkJDQbHtCQoK2bt16zH1+8YtfqLS0VGeccYaMMWpsbNSNN96ou+6667ifM2vWLN1///0tKQ3wC0WuWt3zVq4WbS6SJPVNiNAjlw/T8LQYawsDgDbU5rfsXLp0qR588EH99a9/1Zo1a/Tmm29q/vz5euCBB467z4wZM1ReXu595Ofnt3WZgKWMMXrtizxlP75MizYXKSTIplvG9dG7N59JEAHg91p0ZSQuLk5BQUEqKipqtr2oqEiJiYnH3Ofee+/VVVddpeuvv16SNGTIEFVVVelXv/qV7r77btntR+chp9Mpp5PBeQgM+8pqdOd/N+iTL0slScNSo/Xw5UPVP5HxUQACQ4uujDgcDmVkZDQbjOrxeLR48WJlZWUdc5/q6uqjAkdQUJCkpv8bBAKVMUb/zflK42d/rE++LJUz2K67Luiv/940liACIKC0eGrvtGnTNGnSJI0aNUpjxozR7NmzVVVVpcmTJ0uSrr76aqWkpGjWrFmSpAkTJujxxx/XiBEjlJmZqR07dujee+/VhAkTvKEECDSllXW6682N+uDw2JDhaTF6/GfD1JP7yQAIQC0OIxMnTlRJSYlmzpypwsJCDR8+XAsXLvQOas3Ly2t2JeSee+6RzWbTPffco4KCAnXt2lUTJkzQn/70p9b7FoAPWZi7X3fNy9XBqnqFBNl0a3Zf/b8f9FRwUJsP4QKADqnF64xYgXVG4A/Kqxt03zu53nVD+idG6vGfDWcFVQB+60TP39ybBmgHy7aX6M43NqjQVSu7Tbrph710y7i+cgRzNQQACCNAG6ptcOvhhVv1wqd7JEk94zrpsZ8N08husdYWBgAdCGEEaCPbiyr0m1fXamthhSRpUlZ3TT9/gMIcDNwGgG8ijACtzBijlz/fqz/O36K6Ro/iIhx69PJhOrv/0TeSBAAQRoBWdaCyTnf+d4M+3FIsSTqrb1c99tNh3GEXAL4DYQRoJR9vL9Htr69XSUWdHEF2TT+/v64Zmy673WZ1aQDQoRFGgFNU3+jRo+9v1bOf7JYk9YmP0BM/H8GUXQA4QYQR4BTkH6zW1FfXan1+mSTpqtO66+4LByg0hEGqAHCiCCPASfpgU6F++/p6uWobFRUarMd+OkznDjr2DSMBAMdHGAFaqL7Ro0cWbtVzy5u6ZYalxeipK0YorXO4xZUBgG8ijAAt8NWhak19Za3WHe6Wuf6MHvrdef1ZSRUATgFhBDhBH24u0u2vr1d5TQPdMgDQiggjwPdodHv0yPvb9PePd0miWwYAWhthBPgOpZV1mvrKGn2+66Ak6drTe2j6+XTLAEBrIowAx7E275BuenmNCl216uQI0mM/HabzhyRZXRYA+B3CCHAMr67K031vb1K926NeXTvpb1dlqHd8pNVlAYBfIowA31Db4NZ9b2/Sa6vzJUnjByXosZ8OU2RoiMWVAYD/IowAhxWU1eiml3O04aty2W3Sb8f3001n9ZLNxr1lAKAtEUYASSt2HtCUV9boYFW9YsJD9OQVI3Rmn65WlwUAAYEwgoD38ud79ft3NqnRYzQoOUrP/DKDabsA0I4IIwhYDW6P/vC/zfrX53slSRcPT9bDlw3lJncA0M4IIwhIZdX1+vW/1+iznQdks0l3MD4EACxDGEHA2VFcoeteWq29B6rVyRGk2T8foXMGJlhdFgAELMIIAsqSrcX6zatrVVHXqNTYMD03aZT6J0ZZXRYABDTCCAKCMUbPfbJbD763RcZIY3p01tNXjlSXCKfVpQFAwCOMwO81uj26751N+vfKPEnSFWPSdP9Fg7m/DAB0EIQR+LXKukZNfWWNlm4rkc0m3XPhQF17ejoDVQGgAyGMwG8Vltfq2he/0Ob9LoWG2PXEz0do/KBEq8sCAHwLYQR+act+lya/8IUKXbWKi3DouUmjNTwtxuqyAADHQBiB31m2vURT/r1GlXWN6h0foReuGc2KqgDQgRFG4FdeXZWne97KldtjdFrPzvrbL0cpOpw77gJAR0YYgV8wxmj2h1/qicVfSpJ+MiJFD102lBkzAOADCCPweW6P0cy3c71Td3/zo9667Zy+zJgBAB9BGIFPq21w67bX1um93ELZbNIfLh6sq07rbnVZAIAWIIzAZ7lqG/Srf67W57sOyhFk1+yfD9cFQ5KsLgsA0EKEEfik4opaXfN80xoiEc5g/f2qDI3tHWd1WQCAk0AYgc/Ze6BKV/1jlfIOVisuwqkXJ4/W4JRoq8sCAJwkwgh8ypb9Ll31j1UqraxTt87h+td1Y9S9SyerywIAnALCCHzGuvwyTXp+lcprGjQwKUovXjta8ZGhVpcFADhFhBH4hJW7DujaF79QVb1bI7vF6IXJYxQdxmJmAOAPCCPo8JZtL9H/+9dq1TZ4NLZXFz179Sh1cvKfLgD4C/5FR4e2MLdQN7+6Rg1uox/1j9dfrxyp0JAgq8sCALQiwgg6rLfWFuj219fL7TG6cEiS/jJxOMu7A4AfIoygQ3p1VZ7umrdRxkiXjUzVw5cNUXAQQQQA/BFhBB3Oy5/v1T1v5UqSrs7qrt9PGCS7nfvMAIC/IoygQ/lmELn+jB66+8IB3PAOAPwcYQQdxjeDyA1n9tBdFxBEACAQ0AmPDuFfBBEACFhcGYHl/vX5Xt17OIj86gc9NeP8/gQRAAggXBmBpQgiAADCCCzzyso8gggAgDACa7y55ivd/dZGSQQRAAh0hBG0u/c27tdvX18vY6RrxqYTRAAgwBFG0K6WbC3Wb+aulcdIPxuVqpk/HkgQAYAARxhBu/lsZ6lufDlHDW6jHw9N0qyfDGVlVQAAYQTtI2fvIV3/0mrVNXqUPSBBf5k4XEEEEQCACCNoB7kF5brmhVWqrnfrzD5xeuoXIxTCTe8AAIdxRkCb2lVSqaufX6WK2kaNTo/V367KUGhIkNVlAQA6EMII2kyRq1ZX/WOVDlbVa0hKtJ6/ZrTCHSz6CwBojjCCNlFe06BJz69SQVmNesR10guTRysyNMTqsgAAHRBhBK2utsGt61/6QlsLK9Q10ql/XjtGcRFOq8sCAHRQhBG0qka3R1NfWasv9hxSZGiw/nntGKV1Dre6LABAB0YYQasxxuiueRv14ZYiOYLteu7qURqQFGV1WQCADo4wglbz2Afb9J/VX8luk566YoQye3axuiQAgA84qTAyZ84cpaenKzQ0VJmZmVq1atV3ti8rK9OUKVOUlJQkp9Opvn37asGCBSdVMDqmlz/fqzlLdkqSZv1kiM4dlGhxRQAAX9HieZavvfaapk2bpmeeeUaZmZmaPXu2xo8fr23btik+Pv6o9vX19TrnnHMUHx+vN954QykpKdq7d69iYmJao350AEu2Fmvm27mSpGnn9NXE0d0srggA4EtsxhjTkh0yMzM1evRoPfXUU5Ikj8ejtLQ03XzzzZo+ffpR7Z955hk9+uij2rp1q0JCTm5qp8vlUnR0tMrLyxUVxRiEjiS3oFw/+9sKVde7dXlGqh69fCg3vgMASDrx83eLumnq6+uVk5Oj7Ozsr9/Abld2drZWrFhxzH3eeecdZWVlacqUKUpISNDgwYP14IMPyu12H/dz6urq5HK5mj3Q8ewvr9F1L32h6nq3Tu/dRQ9eOoQgAgBosRaFkdLSUrndbiUkJDTbnpCQoMLCwmPus2vXLr3xxhtyu91asGCB7r33Xv35z3/WH//4x+N+zqxZsxQdHe19pKWltaRMtIOK2gZNfuELFbnq1DchQn+9MkOOYMZDAwBars3PHh6PR/Hx8fr73/+ujIwMTZw4UXfffbeeeeaZ4+4zY8YMlZeXex/5+fltXSZaoMHt0ZRX1noXNXv+mtGKDmN1VQDAyWnRANa4uDgFBQWpqKio2faioiIlJh579kRSUpJCQkIUFPT1zdEGDBigwsJC1dfXy+FwHLWP0+mU08mKnR2RMUYz387Vx9tLFBYSpOcnjVZqLIuaAQBOXouujDgcDmVkZGjx4sXebR6PR4sXL1ZWVtYx9zn99NO1Y8cOeTwe77bt27crKSnpmEEEHds/lu/Wq6vyZbdJT14xQkNSo60uCQDg41rcTTNt2jQ9++yzeumll7RlyxbddNNNqqqq0uTJkyVJV199tWbMmOFtf9NNN+ngwYO65ZZbtH37ds2fP18PPvigpkyZ0nrfAu1iybZiPbhgiyTp7gsHKntgwvfsAQDA92vxOiMTJ05USUmJZs6cqcLCQg0fPlwLFy70DmrNy8uT3f51xklLS9P777+v2267TUOHDlVKSopuueUW3Xnnna33LdDmdhRX6jevrJXHSBNHpena09OtLgkA4CdavM6IFVhnxFpl1fW6ZM6n2nOgWqPTY/Xv609j5gwA4Hu1yTojCDxH7sK750C1UmLC9PQvmcILAGhdnFXwnf44f4uW7yhVuCNIz149SnERzHICALQuwgiO69VVeXrxsz2SpMd/NlwDk+kiAwC0PsIIjiln7yHvze9uP6evzhvMXXgBAG2DMIKjFFfU6tf/zlGD2+iCIYma+qPeVpcEAPBjhBE003B4wGqRq0694yP0yOXDuPkdAKBNEUbQzEPvbdWq3QcV4QzWM7/MUISzxUvRAADQIoQReP1v/T79Y/luSdJjPx2q3vERFlcEAAgEhBFIkrYXVejO/26QJN14Vi+dNzjJ4ooAAIGCMAK5ahv0//6Vo+p6t07v3UW/Pbev1SUBAAIIYSTAGWN0x+vrtbu0SsnRofq/n49QcBD/WQAA2g9nnQD34md79P6mIoUE2fT0LzPUhRVWAQDtjDASwDZ8VaYHF2yRJN11wQANS4uxtiAAQEAijAQoV22Dpr6yVg1uo/GDEnTN2HSrSwIABCjCSAAyxmj6fzco72C1UmPD9MhlLGwGALAOYSQAvfz5Xi3YWKhgu01PXjFC0eEhVpcEAAhghJEAk1tQrgfebRonMv38/hrRLdbiigAAgY4wEkAq6xo19ZU1qnd7lD0gXted0cPqkgAAIIwEkvvf2aQ9B6qVHB2qx37KOBEAQMdAGAkQ8zfs1+s5X8luk2b/fIRiwh1WlwQAgCTCSEDYX16ju+ZtlCTd9MNeGtOjs8UVAQDwNcKIn/N4jKa9tl7lNQ0amhqtW7O57wwAoGMhjPi5Zz/ZpRW7DigsJEizJw5XCPedAQB0MJyZ/FhuQbke+2CbJOm+CQPVs2uExRUBAHA0woifqql365a5Tcu9nzswQRNHp1ldEgAAx0QY8VMPL9yqnSVVio906qHLhjKNFwDQYRFG/NCKnQf04md7JEmPXD5UnTsxjRcA0HERRvxMVV2j7nhjvSTpijFp+mG/eIsrAgDguxFG/MyDC7boq0M1SokJ010XDLC6HAAAvhdhxI988mWJ/r0yT1JT90xkKHfjBQB0fIQRP1FR26A739ggSbrqtO46vXecxRUBAHBiCCN+4o/vbtG+8lp16xyu6ef3t7ocAABOGGHEDyzZVqzXVufLZpMevXyoOjmDrS4JAIATRhjxcZV1jbr7zaab4F0zNl2ZPbtYXBEAAC1DGPFxj72/TfvKa5UaG6Y7xvezuhwAAFqMMOLD1uQd0ksr9kiSHrx0iMIddM8AAHwPYcRH1Td6NOO/G2WM9JORKfpB365WlwQAwEkhjPiovy3bqW1FFercyaF7LhxodTkAAJw0wogP2lFcqSc/2iFJum/CQO49AwDwaYQRH+PxGN315kbVuz06q29XXTQs2eqSAAA4JYQRHzP3i3yt2nNQ4Y4g/enSwbLZbFaXBADAKSGM+JADlXV6eOFWSdLt5/ZTamy4xRUBAHDqCCM+5OGFW1Ve06CBSVGalNXd6nIAAGgVhBEfkbP3oP6z+itJ0gOXDFJwEIcOAOAfOKP5gEa3R/e8tUmS9NOMVGV072xxRQAAtB7CiA94+fO92rLfpeiwEO7ICwDwO4SRDq64olZ//mC7JOmO8f3UJcJpcUUAALQuwkgHN2vBVlXUNWpoarSuGNPN6nIAAGh1hJEObNXug5q3tkA2m/TAxYMVZGdNEQCA/yGMdFBuj9H9/2satPrz0d00LC3G2oIAAGgjhJEO6o2cfG3a51JkaLB+e25fq8sBAKDNEEY6oIraBj36ftOg1VvG9WHQKgDArxFGOqA5S3aqtLJOPeI66eqsdKvLAQCgTRFGOpi9B6r0/PLdkqS7LxggRzCHCADg3zjTdTCzFmxVvdujM/vEadyAeKvLAQCgzRFGOpAVOw9o4aZC2W3SPRcOlM3GVF4AgP8jjHQQHo/RA+9uliRdmdld/RIjLa4IAID2QRjpIN5eX6DN+5um8t52DlN5AQCBgzDSAdQ2uPXY4am8N/2wlzp3clhcEQAA7Ycw0gG8/PleFZTVKDEqVJPH9rC6HAAA2hVhxGLlNQ16askOSdJt5/RRmCPI4ooAAGhfhBGL/W3ZTpVVN6h3fIQuG5lqdTkAALQ7woiFCstr9fynTQuc3XlefwUHcTgAAIGHs5+F/rJou2obPBqdHqtsFjgDAASokwojc+bMUXp6ukJDQ5WZmalVq1ad0H5z586VzWbTJZdccjIf61d2FFfq9Zx8SdL08/uzwBkAIGC1OIy89tprmjZtmu677z6tWbNGw4YN0/jx41VcXPyd++3Zs0e//e1vdeaZZ550sf5k9ofb5THSOQMTlNG9s9XlAABgmRaHkccff1w33HCDJk+erIEDB+qZZ55ReHi4nn/++ePu43a7deWVV+r+++9Xz549T6lgf7C10KX5G/dLkqaxwBkAIMC1KIzU19crJydH2dnZX7+B3a7s7GytWLHiuPv94Q9/UHx8vK677roT+py6ujq5XK5mD38ye9GXMka6cEiSBiRFWV0OAACWalEYKS0tldvtVkJCQrPtCQkJKiwsPOY+y5cv1z/+8Q89++yzJ/w5s2bNUnR0tPeRlpbWkjI7tNyCci3cVCibTbolu4/V5QAAYLk2nU1TUVGhq666Ss8++6zi4uJOeL8ZM2aovLzc+8jPz2/DKtvXXxY1Lft+0bBk9U3gZngAAAS3pHFcXJyCgoJUVFTUbHtRUZESExOPar9z507t2bNHEyZM8G7zeDxNHxwcrG3btqlXr15H7ed0OuV0OltSmk9Yl1+mxVuLZbdJt4zjqggAAFILr4w4HA5lZGRo8eLF3m0ej0eLFy9WVlbWUe379++vjRs3at26dd7HRRddpLPPPlvr1q3zq+6XE/H44asil45IVc+uERZXAwBAx9CiKyOSNG3aNE2aNEmjRo3SmDFjNHv2bFVVVWny5MmSpKuvvlopKSmaNWuWQkNDNXjw4Gb7x8TESNJR2/1dzt6D+nh7iYLtNq6KAADwDS0OIxMnTlRJSYlmzpypwsJCDR8+XAsXLvQOas3Ly5PdzsKu3/bkR003w7tsZKq6dQm3uBoAADoOmzHGWF3E93G5XIqOjlZ5ebmionxvKmxuQbl+/ORy2W3SR7f/UOlxnawuCQCANnei528uYbSDOUuaropMGJZMEAEA4FsII21sR3GFFm5qWoPl1z/sbXE1AAB0PISRNvbXJTtljHTuwAT1S2RdEQAAvo0w0obyDlTr7fX7JElTf8RVEQAAjoUw0oae+Xin3B6jM/vEaWhqjNXlAADQIRFG2kiRq1ZvrP5KkjT1bK6KAABwPISRNvLCp3tU7/ZoVPdYZfbsYnU5AAB0WISRNlBV16hXVu6VJP3qBz0trgYAgI6NMNIG/rM6X67aRvWI66TsAQlWlwMAQIdGGGlljW6P/rF8tyTpujN6yG63WVwRAAAdG2Gklb2/qUhfHapRbHiILhuZanU5AAB0eISRVmSM0bOf7JIkXXVad4U5giyuCACAjo8w0opy9h7SuvwyOYLtuior3epyAADwCYSRVnTkqshPRqSoa6TT4moAAPANhJFWkn+wWos2F0lqGrgKAABODGGklfx7ZZ48RjqzT5z6JHBDPAAAThRhpBXUNrj12hd5kpoGrgIAgBNHGGkF/1u/T4eqG5QSE6ZxLHIGAECLEEZOkTFG/1zRtPT7L0/rriAWOQMAoEUII6doXX6ZNhaUyxFs18TRaVaXAwCAzyGMnKIjV0UmDE1W504Oi6sBAMD3EEZOQWllneZv2C9JmjSWgasAAJwMwsgp+G/OV6p3ezQsLUZDU2OsLgcAAJ9EGDlJxhi99kW+JOkXYxgrAgDAySKMnKRVuw9qV2mVOjmC9OOhyVaXAwCAzyKMnKQjV0UmDEtWJ2ewxdUAAOC7CCMnobymQfM3Ng1cZTovAACnhjByEt5ZV6C6Ro/6J0ZqeFqM1eUAAODTCCMtZIzRq6uaumgmjk6TzcaKqwAAnArCSAvlFri0eb9LjmC7Lh2RYnU5AAD4PMJIC72R03RVZPygRMWEs+IqAACnijDSAg1uj/53eMXVy0ZyVQQAgNZAGGmBZdtKdLCqXnERTp3RO87qcgAA8AuEkRaYt7ZAknTx8GQFB/GrAwCgNXBGPUHlNQ1atKVIkhi4CgBAKyKMnKD3Nu5XfaNHfeIjNCg5yupyAADwG4SRE3Ski+bSkSmsLQIAQCsijJyAgrIardx9UDabdMlwumgAAGhNhJETsODwdN7R6Z2VHBNmcTUAAPgXwsgJOHJTvB8PTbK4EgAA/A9h5Ht8daha6/LLZLNJ5w1OtLocAAD8DmHke7y3sVBSUxdNfGSoxdUAAOB/CCPfgy4aAADaFmHkOxSU1dBFAwBAGyOMfIf3Nn49i4YuGgAA2gZh5Du8v6lpvMgFXBUBAKDNEEaO42BVvXL2HpIkZQ9MsLgaAAD8F2HkOJZsLZbHSAOSopQaG251OQAA+C3CyHEs3tp0h97sAfEWVwIAgH8jjBxDXaNbH28vlSRlD6CLBgCAtkQYOYaVuw6qsq5RXSOdGpISbXU5AAD4NcLIMSze8nUXjd1us7gaAAD8G2HkGJZtL5Eknd2P8SIAALQ1wsi35B+s1p4D1Qqy25TVq4vV5QAA4PcII9/y2c6mgavD02IUGRpicTUAAPg/wsi3fPJlUxg5vXecxZUAABAYCCPf4PEYfbbzgCTpDMIIAADtgjDyDVsKXTpYVa9OjiCN6BZjdTkAAAQEwsg3rDh8VWRMj84KCeJXAwBAe+CM+w1r8ppujDcqvbPFlQAAEDgII4cZY7x36R3VPdbiagAACByEkcO+OlSjIledgu02DU2NsbocAAACBmHksCNdNINSohXmCLK4GgAAAgdh5LDVe5rCSEY3umgAAGhPJxVG5syZo/T0dIWGhiozM1OrVq06bttnn31WZ555pmJjYxUbG6vs7OzvbG+VDQXlksSUXgAA2lmLw8hrr72madOm6b777tOaNWs0bNgwjR8/XsXFxcdsv3TpUl1xxRVasmSJVqxYobS0NJ177rkqKCg45eJbS6Pbo637XZKkQclRFlcDAEBgsRljTEt2yMzM1OjRo/XUU09Jkjwej9LS0nTzzTdr+vTp37u/2+1WbGysnnrqKV199dUn9Jkul0vR0dEqLy9XVFTrh4UdxRXKfvxjhTuClPv78bLbba3+GQAABJoTPX+36MpIfX29cnJylJ2d/fUb2O3Kzs7WihUrTug9qqur1dDQoM6dO85aHpv2NV0VGZAURRABAKCdBbekcWlpqdxutxISEpptT0hI0NatW0/oPe68804lJyc3CzTfVldXp7q6Ou/PLperJWW22ObDXTQDk+iiAQCgvbXrbJqHHnpIc+fO1bx58xQaGnrcdrNmzVJ0dLT3kZaW1qZ1bS+skCT1T4ps088BAABHa1EYiYuLU1BQkIqKipptLyoqUmJi4nfu+9hjj+mhhx7SBx98oKFDh35n2xkzZqi8vNz7yM/Pb0mZLbb3QLUkqUeXTm36OQAA4GgtCiMOh0MZGRlavHixd5vH49HixYuVlZV13P0eeeQRPfDAA1q4cKFGjRr1vZ/jdDoVFRXV7NFW3B6j/ENNYaRbl/A2+xwAAHBsLRozIknTpk3TpEmTNGrUKI0ZM0azZ89WVVWVJk+eLEm6+uqrlZKSolmzZkmSHn74Yc2cOVOvvPKK0tPTVVhYKEmKiIhQREREK36Vk7O/vEYNbqOQIJuSosOsLgcAgIDT4jAyceJElZSUaObMmSosLNTw4cO1cOFC76DWvLw82e1fX3B5+umnVV9fr8svv7zZ+9x33336/e9/f2rVt4IjXTRpncMVxEwaAADaXYvDiCRNnTpVU6dOPeZrS5cubfbznj17TuYj2s2RMNK9M100AABYIeDvTbO/vEaSlBJLFw0AAFYI+DBSUtG0nkl85PGnGgMAgLYT8GGk+HAY6RrptLgSAAACE2GkolaSFE8YAQDAEoQRF900AABYKaDDiMdjdKCqXhLdNAAAWCWgw0h1g1tuj5EkxYSHWFwNAACBKaDDSGVtoyQp2G6TMzigfxUAAFgmoM/AlXUNkqROzmDZbKy+CgCAFQI6jFQcvjIS4TyphWgBAEArCOgwUlXnliRFhhJGAACwSkCHkSPdNFwZAQDAOgEdRrzdNFwZAQDAMgEdRirrmsJIJ66MAABgmYAOI3WNHklSaHCQxZUAABC4AjqMNLqbwkhIENN6AQCwSkCHkXp30+qrwYQRAAAsE9Bh5OsrIwH9awAAwFIBfRZuPHxfGsIIAADWCeizcH0jY0YAALBaQIeRRk9TGAm2B/SvAQAASwX0Wbih8Ug3DVdGAACwSmCHEQ8DWAEAsFpAn4UbvFN7A/rXAACApQL6LHxkaq+DbhoAACwT0GGk4XAY4coIAADWCeizsLebxs6VEQAArBLQYeTI1F5HcED/GgAAsFRAn4WPTO1lnREAAKwT0Gfhr6f20k0DAIBVgq0uwEqXZ6Qqq2cX9ezayepSAAAIWAEdRq7M7G51CQAABLyA7qYBAADWI4wAAABLEUYAAIClCCMAAMBShBEAAGApwggAALAUYQQAAFiKMAIAACxFGAEAAJYijAAAAEsRRgAAgKUIIwAAwFKEEQAAYCmfuGuvMUaS5HK5LK4EAACcqCPn7SPn8ePxiTBSUVEhSUpLS7O4EgAA0FIVFRWKjo4+7us2831xpQPweDzat2+fIiMjZbPZWu19XS6X0tLSlJ+fr6ioqFZ7X7Qtjptv4rj5Lo6db+oIx80Yo4qKCiUnJ8tuP/7IEJ+4MmK325Wamtpm7x8VFcVfMB/EcfNNHDffxbHzTVYft++6InIEA1gBAIClCCMAAMBSAR1GnE6n7rvvPjmdTqtLQQtw3HwTx813cex8ky8dN58YwAoAAPxXQF8ZAQAA1iOMAAAASxFGAACApQgjAADAUgEdRubMmaP09HSFhoYqMzNTq1atsrqkgPHxxx9rwoQJSk5Ols1m01tvvdXsdWOMZs6cqaSkJIWFhSk7O1tffvllszYHDx7UlVdeqaioKMXExOi6665TZWVlszYbNmzQmWeeqdDQUKWlpemRRx5p66/m12bNmqXRo0crMjJS8fHxuuSSS7Rt27ZmbWprazVlyhR16dJFERERuuyyy1RUVNSsTV5eni688EKFh4crPj5ed9xxhxobG5u1Wbp0qUaOHCmn06nevXvrxRdfbOuv57eefvppDR061Lv4VVZWlt577z3v6xwz3/DQQw/JZrPp1ltv9W7zm2NnAtTcuXONw+Ewzz//vNm0aZO54YYbTExMjCkqKrK6tICwYMECc/fdd5s333zTSDLz5s1r9vpDDz1koqOjzVtvvWXWr19vLrroItOjRw9TU1PjbXPeeeeZYcOGmc8//9x88sknpnfv3uaKK67wvl5eXm4SEhLMlVdeaXJzc82rr75qwsLCzN/+9rf2+pp+Z/z48eaFF14wubm5Zt26deaCCy4w3bp1M5WVld42N954o0lLSzOLFy82q1evNqeddpoZO3as9/XGxkYzePBgk52dbdauXWsWLFhg4uLizIwZM7xtdu3aZcLDw820adPM5s2bzZNPPmmCgoLMwoUL2/X7+ot33nnHzJ8/32zfvt1s27bN3HXXXSYkJMTk5uYaYzhmvmDVqlUmPT3dDB061Nxyyy3e7f5y7AI2jIwZM8ZMmTLF+7Pb7TbJyclm1qxZFlYVmL4dRjwej0lMTDSPPvqod1tZWZlxOp3m1VdfNcYYs3nzZiPJfPHFF9427733nrHZbKagoMAYY8xf//pXExsba+rq6rxt7rzzTtOvX782/kaBo7i42Egyy5YtM8Y0HaeQkBDz+uuve9ts2bLFSDIrVqwwxjQFUbvdbgoLC71tnn76aRMVFeU9Vr/73e/MoEGDmn3WxIkTzfjx49v6KwWM2NhY89xzz3HMfEBFRYXp06ePWbRokTnrrLO8YcSfjl1AdtPU19crJydH2dnZ3m12u13Z2dlasWKFhZVBknbv3q3CwsJmxyc6OlqZmZne47NixQrFxMRo1KhR3jbZ2dmy2+1auXKlt80PfvADORwOb5vx48dr27ZtOnToUDt9G/9WXl4uSercubMkKScnRw0NDc2OXf/+/dWtW7dmx27IkCFKSEjwthk/frxcLpc2bdrkbfPN9zjShr+fp87tdmvu3LmqqqpSVlYWx8wHTJkyRRdeeOFRv19/OnY+caO81lZaWiq3293s4EhSQkKCtm7dalFVOKKwsFCSjnl8jrxWWFio+Pj4Zq8HBwerc+fOzdr06NHjqPc48lpsbGyb1B8oPB6Pbr31Vp1++ukaPHiwpKbfq8PhUExMTLO23z52xzq2R177rjYul0s1NTUKCwtri6/k1zZu3KisrCzV1tYqIiJC8+bN08CBA7Vu3TqOWQc2d+5crVmzRl988cVRr/nT37eADCMATt2UKVOUm5ur5cuXW10KTkC/fv20bt06lZeX64033tCkSZO0bNkyq8vCd8jPz9ctt9yiRYsWKTQ01Opy2lRAdtPExcUpKCjoqBHHRUVFSkxMtKgqHHHkGHzX8UlMTFRxcXGz1xsbG3Xw4MFmbY71Ht/8DJycqVOn6t1339WSJUuUmprq3Z6YmKj6+nqVlZU1a//tY/d9x+V4baKiovg/7JPkcDjUu3dvZWRkaNasWRo2bJieeOIJjlkHlpOTo+LiYo0cOVLBwcEKDg7WsmXL9H//938KDg5WQkKC3xy7gAwjDodDGRkZWrx4sXebx+PR4sWLlZWVZWFlkKQePXooMTGx2fFxuVxauXKl9/hkZWWprKxMOTk53jYfffSRPB6PMjMzvW0+/vhjNTQ0eNssWrRI/fr1o4vmJBljNHXqVM2bN08fffTRUd1gGRkZCgkJaXbstm3bpry8vGbHbuPGjc3C5KJFixQVFaWBAwd623zzPY604e9n6/F4PKqrq+OYdWDjxo3Txo0btW7dOu9j1KhRuvLKK71/9ptj125DZTuYuXPnGqfTaV588UWzefNm86tf/crExMQ0G3GMtlNRUWHWrl1r1q5daySZxx9/3Kxdu9bs3bvXGNM0tTcmJsa8/fbbZsOGDebiiy8+5tTeESNGmJUrV5rly5ebPn36NJvaW1ZWZhISEsxVV11lcnNzzdy5c014eDhTe0/BTTfdZKKjo83SpUvN/v37vY/q6mpvmxtvvNF069bNfPTRR2b16tUmKyvLZGVleV8/MtXw3HPPNevWrTMLFy40Xbt2PeZUwzvuuMNs2bLFzJkzh2mip2D69Olm2bJlZvfu3WbDhg1m+vTpxmazmQ8++MAYwzHzJd+cTWOM/xy7gA0jxhjz5JNPmm7duhmHw2HGjBljPv/8c6tLChhLliwxko56TJo0yRjTNL333nvvNQkJCcbpdJpx48aZbdu2NXuPAwcOmCuuuMJERESYqKgoM3nyZFNRUdGszfr1680ZZ5xhnE6nSUlJMQ899FB7fUW/dKxjJsm88MIL3jY1NTXm17/+tYmNjTXh4eHm0ksvNfv372/2Pnv27DHnn3++CQsLM3Fxceb22283DQ0NzdosWbLEDB8+3DgcDtOzZ89mn4GWufbaa0337t2Nw+EwXbt2NePGjfMGEWM4Zr7k22HEX46dzRhj2u86DAAAQHMBOWYEAAB0HIQRAABgKcIIAACwFGEEAABYijACAAAsRRgBAACWIowAAABLEUYAAIClCCMAAMBShBEAAGApwggAALAUYQQAAFjq/wMI6YkYJ6m7HgAAAABJRU5ErkJggg==",
      "text/plain": [
       "<Figure size 640x480 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "plt.plot(np.cumsum(Sh ** 2) / np.sum(Sh ** 2))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "bcce3fba-d5ca-41fe-8a68-015186e2d5ab",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(32000,)"
      ]
     },
     "execution_count": 23,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "Vh[0].shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "e4684cfb-b600-4dfc-a76c-c2a669162440",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "S 26.656696\n",
      "             token      prob        token      prob\n",
      "0          archivi  0.000032           ,”  0.000032\n",
      "1            textt  0.000032   ▁everybody  0.000032\n",
      "2   ▁partiellement  0.000032            　  0.000032\n",
      "3        ▁externos  0.000032           .\"  0.000032\n",
      "4         ▁esterni  0.000032           ▁â  0.000032\n",
      "5          ▁eredet  0.000032           -(  0.000032\n",
      "6      ▁információ  0.000031          ▁(.  0.000032\n",
      "7              ira  0.000031     ▁whereas  0.000032\n",
      "8               ip  0.000031           ▁‘  0.000032\n",
      "9               ui  0.000031         ensk  0.000032\n",
      "10             era  0.000031           -\\  0.000032\n",
      "11              iz  0.000031      ▁dissol  0.000032\n",
      "12             ern  0.000031           .[  0.000032\n",
      "13             uss  0.000031  ▁eredetiből  0.000032\n",
      "14             ill  0.000031        mlung  0.000032\n",
      "15              yn  0.000031            ~  0.000032\n",
      "16              od  0.000031     ▁suppose  0.000032\n",
      "17              ub  0.000031     multirow  0.000032\n",
      "18            ▁rör  0.000031      archivi  0.000032\n",
      "19             iss  0.000031        ▁pode  0.000032\n",
      "20              og  0.000031            آ  0.000032\n",
      "21              ym  0.000031           яз  0.000032\n",
      "22              ol  0.000031        ▁Tras  0.000032\n",
      "23        ▁externe  0.000031   ▁angularjs  0.000032\n",
      "24         ▁stessa  0.000031            -  0.000032\n",
      "25              oh  0.000031       thesis  0.000032\n",
      "26             ino  0.000031        ▁Cong  0.000032\n",
      "27             ana  0.000031        ettes  0.000032\n",
      "28           ▁přek  0.000031           та  0.000032\n",
      "29              uc  0.000031         ▁nel  0.000032\n",
      "30              ik  0.000031          ▁(+  0.000032\n",
      "31             ash  0.000031        ▁till  0.000032\n",
      "32         ▁autory  0.000031           ов  0.000032\n",
      "33             ios  0.000031           ?”  0.000032\n",
      "34              os  0.000031            종  0.000032\n",
      "35           ▁perí  0.000031  ▁regardless  0.000032\n",
      "36            ▁cím  0.000031           ey  0.000032\n",
      "37             ond  0.000031      ulative  0.000032\n",
      "38             erm  0.000031          ▁(!  0.000032\n",
      "39             ass  0.000031           RC  0.000032\n",
      "S 11.636547\n",
      "     token      prob          token      prob\n",
      "0        .  0.000033           ▁...  0.000033\n",
      "1        ,  0.000033            ...  0.000033\n",
      "2      ▁in  0.000032         <0x0A>  0.000033\n",
      "3       ▁(  0.000032             ▁…  0.000033\n",
      "4        ;  0.000032              …  0.000032\n",
      "5   <0x0A>  0.000032           ....  0.000032\n",
      "6     ▁and  0.000032           ...\"  0.000032\n",
      "7     ▁for  0.000032              Â  0.000032\n",
      "8      ▁to  0.000032         ▁#####  0.000032\n",
      "9        :  0.000032         selves  0.000032\n",
      "10     ▁at  0.000032           !...  0.000032\n",
      "11     ▁is  0.000032          ▁...)  0.000032\n",
      "12   ▁that  0.000032             ▁(  0.000032\n",
      "13   ▁with  0.000032         ▁[...]  0.000032\n",
      "14     ▁on  0.000032         ▁today  0.000032\n",
      "15     ▁by  0.000032             ▁\"  0.000032\n",
      "16     ▁as  0.000032           chos  0.000032\n",
      "17      ▁a  0.000032         <0x12>  0.000032\n",
      "18     ▁of  0.000032              ­  0.000032\n",
      "19   ▁from  0.000032           ...,  0.000032\n",
      "20       )  0.000032          ▁####  0.000032\n",
      "21       !  0.000032           ...)  0.000032\n",
      "22     ▁or  0.000032           ▁til  0.000032\n",
      "23      ).  0.000032              ʹ  0.000032\n",
      "24      ▁-  0.000032            isy  0.000032\n",
      "25       ?  0.000032             ▁Î  0.000032\n",
      "26      ▁–  0.000032           idel  0.000032\n",
      "27    ▁the  0.000032           тури  0.000032\n",
      "28       s  0.000032  ▁respectively  0.000032\n",
      "29   ▁when  0.000032              �  0.000032\n",
      "30       y  0.000032       CheckBox  0.000032\n",
      "31       a  0.000032           мери  0.000032\n",
      "32      it  0.000032          prüft  0.000032\n",
      "33     ing  0.000032           apor  0.000032\n",
      "34      ),  0.000032         autore  0.000032\n",
      "35     ▁if  0.000032            FOR  0.000032\n",
      "36     ▁it  0.000032             ▁'  0.000032\n",
      "37      et  0.000032           ...]  0.000032\n",
      "38     ons  0.000032             Ар  0.000032\n",
      "39       /  0.000032          quote  0.000032\n",
      "S 9.789183\n",
      "          token      prob          token      prob\n",
      "0       ▁effect  0.000032           </s>  0.000032\n",
      "1      ▁process  0.000032             ▁…  0.000032\n",
      "2       ▁change  0.000032            !--  0.000032\n",
      "3    ▁condition  0.000032         <0x0A>  0.000032\n",
      "4    ▁structure  0.000032             -,  0.000032\n",
      "5     ▁function  0.000032            кро  0.000032\n",
      "6     ▁position  0.000032            ätz  0.000032\n",
      "7         ▁rule  0.000032              ¬  0.000032\n",
      "8        ▁value  0.000032         ▁shall  0.000032\n",
      "9         ▁sign  0.000032             ▁“  0.000032\n",
      "10     ▁pattern  0.000032                 0.000032\n",
      "11      ▁answer  0.000032             ом  0.000032\n",
      "12        ▁name  0.000032             ▁I  0.000032\n",
      "13    ▁activity  0.000032          ▁einz  0.000032\n",
      "14      ▁figure  0.000032             ▁\"  0.000032\n",
      "15        ▁call  0.000032            ▁to  0.000032\n",
      "16     ▁measure  0.000032          ▁...)  0.000032\n",
      "17        ▁word  0.000032            etc  0.000032\n",
      "18      ▁method  0.000032             ▁M  0.000032\n",
      "19        ▁work  0.000032             <>  0.000032\n",
      "20    ▁material  0.000032             _)  0.000032\n",
      "21      ▁reason  0.000032          abase  0.000032\n",
      "22      ▁height  0.000032             зи  0.000032\n",
      "23       ▁issue  0.000032     ▁nederbörd  0.000032\n",
      "24        ▁size  0.000032          aient  0.000032\n",
      "25        ▁move  0.000032            ▁..  0.000032\n",
      "26     ▁changes  0.000032             -)  0.000032\n",
      "27       ▁force  0.000032             нг  0.000032\n",
      "28        ▁deal  0.000032           тому  0.000032\n",
      "29      ▁record  0.000032            ++,  0.000032\n",
      "30        ▁qual  0.000032           ▁hat  0.000032\n",
      "31      ▁branch  0.000032        encoded  0.000032\n",
      "32      ▁action  0.000032            ▁it  0.000032\n",
      "33       ▁rules  0.000032           anel  0.000032\n",
      "34  ▁experience  0.000032  ▁departamento  0.000032\n",
      "35       ▁space  0.000032          ▁afin  0.000032\n",
      "36      ▁report  0.000032            ▁\\r  0.000032\n",
      "37    ▁contract  0.000032              ↵  0.000032\n",
      "38     ▁problem  0.000032              🌍  0.000032\n",
      "39       ▁build  0.000032            ▁or  0.000032\n",
      "S 7.340107\n",
      "     token      prob           token      prob\n",
      "0       od  0.000032            ▁etc  0.000032\n",
      "1       om  0.000032            ▁the  0.000032\n",
      "2      est  0.000032             ...  0.000032\n",
      "3      ene  0.000032             ▁of  0.000032\n",
      "4       ot  0.000032          <0x0A>  0.000032\n",
      "5      ent  0.000032              ▁a  0.000032\n",
      "6       ir  0.000032            ...)  0.000032\n",
      "7      ong  0.000032             <s>  0.000032\n",
      "8       ro  0.000032            !...  0.000032\n",
      "9       os  0.000032         ▁станов  0.000032\n",
      "10      et  0.000032          iginal  0.000032\n",
      "11      le  0.000032           thead  0.000032\n",
      "12      ur  0.000032            ▁...  0.000032\n",
      "13  ▁veget  0.000032            cean  0.000032\n",
      "14      id  0.000032               Ã  0.000032\n",
      "15     ber  0.000032            anti  0.000032\n",
      "16      ip  0.000032             .:   0.000032\n",
      "17      qu  0.000032           heits  0.000032\n",
      "18      ra  0.000032              ▁&  0.000032\n",
      "19      ub  0.000032              ▁а  0.000032\n",
      "20      oc  0.000032              !,  0.000032\n",
      "21     ont  0.000032           ремен  0.000032\n",
      "22     ano  0.000032            ...,  0.000032\n",
      "23      og  0.000032            ▁our  0.000032\n",
      "24     ast  0.000032            iner  0.000032\n",
      "25     ate  0.000032             iki  0.000032\n",
      "26      el  0.000032               ṭ  0.000032\n",
      "27      ol  0.000032               包  0.000032\n",
      "28      ul  0.000032           nisse  0.000032\n",
      "29     ond  0.000032           ▁from  0.000032\n",
      "30      ud  0.000032          endant  0.000032\n",
      "31      ug  0.000032  AndroidRuntime  0.000032\n",
      "32      ry  0.000032        ▁деревня  0.000032\n",
      "33     fer  0.000032        ▁infatti  0.000032\n",
      "34    ient  0.000032            TRUE  0.000032\n",
      "35      op  0.000032            чная  0.000032\n",
      "36     ron  0.000032           ▁your  0.000032\n",
      "37      ut  0.000032            uber  0.000032\n",
      "38      ig  0.000032              ху  0.000032\n",
      "39      um  0.000032             lob  0.000032\n",
      "S 6.691803\n",
      "              token      prob        token      prob\n",
      "0              ▁the  0.000033           ▁…  0.000033\n",
      "1                ▁a  0.000033            .  0.000033\n",
      "2               ▁an  0.000032          ▁in  0.000032\n",
      "3               ▁in  0.000032            …  0.000032\n",
      "4                 .  0.000032       ▁desar  0.000032\n",
      "5      ▁Хронологија  0.000032           ?)  0.000032\n",
      "6                 :  0.000032     intellij  0.000032\n",
      "7                 ,  0.000032               0.000032\n",
      "8               ▁it  0.000032  ▁Einzelnach  0.000032\n",
      "9                 ;  0.000032            №  0.000032\n",
      "10           ▁their  0.000032        jboss  0.000032\n",
      "11           <0x0A>  0.000032       aucoup  0.000032\n",
      "12             ▁its  0.000032          <s>  0.000032\n",
      "13            empio  0.000032          ▁of  0.000032\n",
      "14              <s>  0.000032          ▁as  0.000032\n",
      "15          perties  0.000032          ikz  0.000032\n",
      "16             INCT  0.000032   ▁parenthes  0.000032\n",
      "17           ▁Попис  0.000032     férences  0.000032\n",
      "18            ▁some  0.000032            !  0.000032\n",
      "19            ▁this  0.000032     geordnet  0.000032\n",
      "20               ▁.  0.000032            Ű  0.000032\n",
      "21            bolds  0.000032            ⅓  0.000032\n",
      "22               ▁(  0.000032            Õ  0.000032\n",
      "23          ategory  0.000032            Ē  0.000032\n",
      "24           irtual  0.000032       onnées  0.000032\n",
      "25           atform  0.000032     EditText  0.000032\n",
      "26              ▁at  0.000032       ▁});\\r  0.000032\n",
      "27            ▁what  0.000032        ▁Airl  0.000032\n",
      "28             ▁for  0.000032        uteur  0.000032\n",
      "29            ▁that  0.000032         ulté  0.000032\n",
      "30        stringify  0.000032       staden  0.000032\n",
      "31              ▁my  0.000032       esterd  0.000032\n",
      "32  printStackTrace  0.000032        numer  0.000032\n",
      "33             ▁our  0.000032       selves  0.000032\n",
      "34             ▁his  0.000032       ▁Febru  0.000032\n",
      "35             $}}%  0.000032         adém  0.000032\n",
      "36    ▁Begriffsklär  0.000032           яз  0.000032\n",
      "37           onnées  0.000032          ▁\\\"  0.000032\n",
      "38         ▁listade  0.000032      ▁година  0.000032\n",
      "39              ▁by  0.000032        raste  0.000032\n",
      "S 6.4978533\n",
      "     token      prob      token      prob\n",
      "0       ▁a  0.000032          -  0.000035\n",
      "1      the  0.000032         ▁(  0.000033\n",
      "2        F  0.000032         -(  0.000033\n",
      "3        B  0.000032          ‑  0.000033\n",
      "4    state  0.000032         -%  0.000033\n",
      "5        G  0.000032          /  0.000033\n",
      "6        M  0.000032          _  0.000033\n",
      "7       St  0.000032         -$  0.000033\n",
      "8        D  0.000032          ‐  0.000032\n",
      "9     tree  0.000032         -\\  0.000032\n",
      "10       J  0.000032         ▁…  0.000032\n",
      "11      Sh  0.000032        ▁(:  0.000032\n",
      "12    ▁the  0.000032          ・  0.000032\n",
      "13       S  0.000032         '-  0.000032\n",
      "14     New  0.000032       ▁();  0.000032\n",
      "15       T  0.000032    ▁latter  0.000032\n",
      "16       N  0.000032         ?(  0.000032\n",
      "17     sub  0.000032        ▁(?  0.000032\n",
      "18  market  0.000032         .-  0.000032\n",
      "19     Car  0.000032          ≃  0.000032\n",
      "20  square  0.000032          ∙  0.000032\n",
      "21     new  0.000032       Sito  0.000032\n",
      "22   class  0.000032      ▁...)  0.000032\n",
      "23     ▁an  0.000032         [-  0.000032\n",
      "24       L  0.000032         $-  0.000032\n",
      "25       P  0.000032          （  0.000032\n",
      "26    text  0.000032          ┴  0.000032\n",
      "27       K  0.000032         _(  0.000032\n",
      "28    gior  0.000032     <0x02>  0.000032\n",
      "29       H  0.000032         ▁-  0.000032\n",
      "30   touch  0.000032       ▁etc  0.000032\n",
      "31       W  0.000032         '(  0.000032\n",
      "32    hand  0.000032       olin  0.000032\n",
      "33   month  0.000032          −  0.000032\n",
      "34      gl  0.000032  ungsseite  0.000032\n",
      "35    home  0.000032        AXI  0.000032\n",
      "36      Ad  0.000032          =  0.000032\n",
      "37     tax  0.000032    Vorlage  0.000032\n",
      "38      Ch  0.000032         `-  0.000032\n",
      "39       A  0.000032       ▁...  0.000032\n",
      "S 5.7914534\n",
      "           token      prob      token      prob\n",
      "0       ▁process  0.000032        ...  0.000033\n",
      "1        ▁method  0.000032        }$-  0.000032\n",
      "2       ▁program  0.000032        ▁%.  0.000032\n",
      "3      ▁category  0.000032      ▁sake  0.000032\n",
      "4        ▁system  0.000032          !  0.000032\n",
      "5       ▁Program  0.000032        ().  0.000032\n",
      "6       ▁Process  0.000032      ▁című  0.000032\n",
      "7          ▁page  0.000032        __.  0.000032\n",
      "8          ▁site  0.000032          。  0.000032\n",
      "9      ▁Services  0.000032          …  0.000032\n",
      "10         ▁area  0.000032       !...  0.000032\n",
      "11       ▁System  0.000032         ▁_  0.000032\n",
      "12  ▁application  0.000032         ▁-  0.000032\n",
      "13      ▁Service  0.000032        бір  0.000032\n",
      "14    ▁procedure  0.000032          ̶  0.000032\n",
      "15       ▁Report  0.000032         *.  0.000032\n",
      "16         ▁list  0.000032        isi  0.000032\n",
      "17         ▁List  0.000032      ▁mano  0.000032\n",
      "18    ▁programme  0.000032        )$-  0.000032\n",
      "19   ▁department  0.000032          ?  0.000032\n",
      "20         ▁team  0.000032   pository  0.000032\n",
      "21         ▁Test  0.000032         ².  0.000032\n",
      "22         ▁name  0.000032    nection  0.000032\n",
      "23      ▁website  0.000032    ▁VALUES  0.000032\n",
      "24          ▁Act  0.000032       gele  0.000032\n",
      "25      ▁Company  0.000032          ；  0.000032\n",
      "26         ▁rate  0.000032          ˜  0.000032\n",
      "27    ▁statement  0.000032  ▁circumst  0.000032\n",
      "28       ▁format  0.000032         шу  0.000032\n",
      "29       ▁device  0.000032    chestra  0.000032\n",
      "30        <0x0A>  0.000032    unächst  0.000032\n",
      "31       ▁region  0.000032     доступ  0.000032\n",
      "32        ▁story  0.000032        ▁\\<  0.000032\n",
      "33  ▁Association  0.000032      viron  0.000032\n",
      "34        ▁group  0.000032       ...\"  0.000032\n",
      "35       ▁School  0.000032          ↵  0.000032\n",
      "36         ▁item  0.000032          配  0.000032\n",
      "37      ▁service  0.000032     сторія  0.000032\n",
      "38       ▁module  0.000032         ▁–  0.000032\n",
      "39     ▁function  0.000032      overy  0.000032\n",
      "S 5.2599735\n",
      "       token      prob           token      prob\n",
      "0      ▁take  0.000032             ▁to  0.000033\n",
      "1       ▁get  0.000032               .  0.000032\n",
      "2        ▁go  0.000032             ...  0.000032\n",
      "3      ▁make  0.000032             and  0.000032\n",
      "4      ▁turn  0.000032              to  0.000032\n",
      "5     ▁start  0.000032               …  0.000032\n",
      "6      ▁look  0.000032           uncia  0.000032\n",
      "7       ▁see  0.000032            ▁and  0.000032\n",
      "8      ▁give  0.000032            ▁...  0.000032\n",
      "9      ▁move  0.000032             ▁să  0.000032\n",
      "10      ▁try  0.000032           ▁they  0.000032\n",
      "11      ▁put  0.000032            nbsp  0.000032\n",
      "12      ▁use  0.000032            fach  0.000032\n",
      "13       ▁do  0.000032              we  0.000032\n",
      "14     ▁find  0.000032           elsen  0.000032\n",
      "15     ▁keep  0.000032          lament  0.000032\n",
      "16    ▁leave  0.000032           ▁stal  0.000032\n",
      "17    ▁bring  0.000032            icus  0.000032\n",
      "18     ▁call  0.000032          ▁Архив  0.000032\n",
      "19     ▁stop  0.000032             esz  0.000032\n",
      "20     ▁have  0.000032        amerikan  0.000032\n",
      "21     ▁tell  0.000032           ▁Tsch  0.000032\n",
      "22     ▁feel  0.000032               ’  0.000032\n",
      "23   ▁change  0.000032       ▁Licencia  0.000032\n",
      "24      ▁run  0.000032             lus  0.000032\n",
      "25     ▁play  0.000032            ▁Ung  0.000032\n",
      "26   ▁return  0.000032            ────  0.000032\n",
      "27     ▁show  0.000032             ▁{%  0.000032\n",
      "28   ▁create  0.000032          ▁funds  0.000032\n",
      "29    ▁check  0.000032             top  0.000032\n",
      "30     ▁send  0.000032               씨  0.000032\n",
      "31    ▁reach  0.000032               不  0.000032\n",
      "32     ▁hold  0.000032             (()  0.000032\n",
      "33    ▁carry  0.000032               в  0.000032\n",
      "34     ▁fall  0.000032  amerikanischer  0.000032\n",
      "35      ▁sit  0.000032            chod  0.000032\n",
      "36  ▁receive  0.000032               で  0.000032\n",
      "37       ▁be  0.000032               将  0.000032\n",
      "38      ▁ask  0.000032           await  0.000032\n",
      "39     ▁walk  0.000032             yed  0.000032\n",
      "S 5.0319004\n",
      "      token      prob      token      prob\n",
      "0   archivi  0.000032          -  0.000033\n",
      "1     FAULT  0.000032         ▁-  0.000032\n",
      "2     state  0.000032          ➖  0.000032\n",
      "3     textt  0.000032          .  0.000032\n",
      "4       can  0.000032         '-  0.000032\n",
      "5      work  0.000032          ‐  0.000032\n",
      "6      keep  0.000032     ▁Uniti  0.000032\n",
      "7      fill  0.000032          ‑  0.000032\n",
      "8    making  0.000032      textt  0.000032\n",
      "9      call  0.000032        ▁In  0.000032\n",
      "10     form  0.000032        ▁un  0.000032\n",
      "11    bound  0.000032       werk  0.000032\n",
      "12    files  0.000032         ún  0.000032\n",
      "13  service  0.000032          方  0.000032\n",
      "14    stage  0.000032       ▁jsf  0.000032\n",
      "15     file  0.000032        tis  0.000032\n",
      "16     bank  0.000032     ▁starb  0.000032\n",
      "17    maker  0.000032         xp  0.000032\n",
      "18   NUMBER  0.000032     <0x8F>  0.000032\n",
      "19    books  0.000032        etc  0.000032\n",
      "20   master  0.000032         [,  0.000032\n",
      "21     line  0.000032          ↳  0.000032\n",
      "22     step  0.000032       ▁dob  0.000032\n",
      "23   LENGTH  0.000032         ▁Э  0.000032\n",
      "24     care  0.000032          ,  0.000032\n",
      "25    start  0.000032          ภ  0.000032\n",
      "26     case  0.000032         .-  0.000032\n",
      "27    court  0.000032          田  0.000032\n",
      "28     stop  0.000032        ▁pó  0.000032\n",
      "29    store  0.000032       ▁amp  0.000032\n",
      "30     side  0.000032         -%  0.000032\n",
      "31     grad  0.000032          ณ  0.000032\n",
      "32      car  0.000032          ể  0.000032\n",
      "33    catch  0.000032      ropol  0.000032\n",
      "34     yard  0.000032         }-  0.000032\n",
      "35   stream  0.000032    ▁einges  0.000032\n",
      "36     flow  0.000032          ∃  0.000032\n",
      "37     life  0.000032  ▁quantity  0.000032\n",
      "38    match  0.000032          ア  0.000032\n",
      "39    share  0.000032          ར  0.000032\n",
      "S 4.803552\n",
      "          token      prob        token      prob\n",
      "0          ▁prü  0.000032            -  0.000033\n",
      "1         ▁more  0.000032            ,  0.000032\n",
      "2    ▁necessary  0.000032            —  0.000032\n",
      "3    ▁different  0.000032     istrzost  0.000032\n",
      "4          ▁way  0.000032       <0x9A>  0.000032\n",
      "5          ▁the  0.000032           is  0.000032\n",
      "6        ▁their  0.000032    ▁invånare  0.000032\n",
      "7        ▁given  0.000032            ‑  0.000032\n",
      "8         ively  0.000032           -(  0.000032\n",
      "9      ▁certain  0.000032        ствии  0.000032\n",
      "10       ▁other  0.000032          ▁be  0.000032\n",
      "11   ▁important  0.000032        ações  0.000032\n",
      "12        ▁some  0.000032          igg  0.000032\n",
      "13    ▁relevant  0.000032     ▁charact  0.000032\n",
      "14        ually  0.000032          ($_  0.000032\n",
      "15       ations  0.000032           yi  0.000032\n",
      "16      ▁stessa  0.000032       izable  0.000032\n",
      "17    ▁specific  0.000032         ▁the  0.000032\n",
      "18        fully  0.000032       ▁deren  0.000032\n",
      "19        ▁most  0.000032          are  0.000032\n",
      "20       ▁known  0.000032     ▁diretto  0.000032\n",
      "21    ▁possible  0.000032           '-  0.000032\n",
      "22      ▁chosen  0.000032       ▁oltre  0.000032\n",
      "23         ▁its  0.000032  multicolumn  0.000032\n",
      "24        ▁many  0.000032     mathchar  0.000032\n",
      "25    ▁previous  0.000032       ▁onder  0.000032\n",
      "26        ▁less  0.000032          ého  0.000032\n",
      "27        ▁same  0.000032       ніципа  0.000032\n",
      "28        ▁part  0.000032   ▁somewhere  0.000032\n",
      "29        ▁very  0.000032            −  0.000032\n",
      "30     ▁current  0.000032         ozzá  0.000032\n",
      "31        ▁what  0.000032           --  0.000032\n",
      "32        ▁much  0.000032      ▁exceed  0.000032\n",
      "33         ▁our  0.000032         engo  0.000032\n",
      "34         ▁two  0.000032        ональ  0.000032\n",
      "35      ▁higher  0.000032     ▁numeric  0.000032\n",
      "36         ▁one  0.000032           -%  0.000032\n",
      "37        ▁your  0.000032   ----------  0.000032\n",
      "38     ▁another  0.000032        ▁ways  0.000032\n",
      "39  ▁additional  0.000032        ▁otro  0.000032\n",
      "S 4.469883\n",
      "   token      prob           token      prob\n",
      "0     ).  0.000033              ▁a  0.000033\n",
      "1      .  0.000033             ▁an  0.000033\n",
      "2     .)  0.000033             ▁%.  0.000032\n",
      "3     ),  0.000033        ▁another  0.000032\n",
      "4     ].  0.000032            ▁one  0.000032\n",
      "5    .).  0.000032           ▁hina  0.000032\n",
      "6      )  0.000032            ▁the  0.000032\n",
      "7      ;  0.000032             ící  0.000032\n",
      "8     );  0.000032     scriptstyle  0.000032\n",
      "9     .[  0.000032              -,  0.000032\n",
      "10    .]  0.000032               。  0.000032\n",
      "11    .;  0.000032             ▁yo  0.000032\n",
      "12    .*  0.000032              %.  0.000032\n",
      "13   .),  0.000032               a  0.000032\n",
      "14    ».  0.000032           ▁your  0.000032\n",
      "15    ..  0.000032          <0xC8>  0.000032\n",
      "16     ?  0.000032              -)  0.000032\n",
      "17    ):  0.000032           reten  0.000032\n",
      "18    ².  0.000032      ▁demselben  0.000032\n",
      "19     。  0.000032               ѣ  0.000032\n",
      "20    *.  0.000032  ▁Genomsnittlig  0.000032\n",
      "21    .,  0.000032           ▁part  0.000032\n",
      "22    .\"  0.000032              äß  0.000032\n",
      "23    }.  0.000032             osz  0.000032\n",
      "24     ]  0.000032               ῆ  0.000032\n",
      "25    .»  0.000032          Holder  0.000032\n",
      "26     !  0.000032             utf  0.000032\n",
      "27    >.  0.000032           ▁afin  0.000032\n",
      "28    ],  0.000032            hens  0.000032\n",
      "29    '.  0.000032             hed  0.000032\n",
      "30    \".  0.000032             ssl  0.000032\n",
      "31    .}  0.000032           лении  0.000032\n",
      "32    ▁.  0.000032            anim  0.000032\n",
      "33    .”  0.000032      ▁ebenfalls  0.000032\n",
      "34    .(  0.000032             ▁ON  0.000032\n",
      "35    .«  0.000032              td  0.000032\n",
      "36    ._  0.000032               洞  0.000032\n",
      "37   ▁).  0.000032               ⟶  0.000032\n",
      "38   .</  0.000032              ▁а  0.000032\n",
      "39   .):  0.000032            sero  0.000032\n",
      "S 4.2756543\n",
      "         token      prob       token      prob\n",
      "0        ities  0.000032         ▁to  0.000033\n",
      "1        ships  0.000032           来  0.000032\n",
      "2        ments  0.000032          to  0.000032\n",
      "3       ements  0.000032       ckets  0.000032\n",
      "4       ations  0.000032        hnen  0.000032\n",
      "5       ctions  0.000032         ▁să  0.000032\n",
      "6        ances  0.000032        izon  0.000032\n",
      "7       itions  0.000032         ▁ot  0.000032\n",
      "8         ases  0.000032       льных  0.000032\n",
      "9        ences  0.000032      ▁these  0.000032\n",
      "10         ies  0.000032       ashed  0.000032\n",
      "11        ures  0.000032      ▁Wikip  0.000032\n",
      "12        ants  0.000032      ▁чтобы  0.000032\n",
      "13       aries  0.000032           ´  0.000032\n",
      "14        ents  0.000032        wort  0.000032\n",
      "15      atives  0.000032     atiques  0.000032\n",
      "16     ologies  0.000032       cribe  0.000032\n",
      "17     ilities  0.000032         ▁CO  0.000032\n",
      "18        ages  0.000032      ▁Looks  0.000032\n",
      "19      aments  0.000032       ieurs  0.000032\n",
      "20        ists  0.000032       ymnas  0.000032\n",
      "21        ices  0.000032      ческих  0.000032\n",
      "22    izations  0.000032       ▁nyel  0.000032\n",
      "23        ates  0.000032         ,\\r  0.000032\n",
      "24        ties  0.000032       ▁seus  0.000032\n",
      "25  ifications  0.000032         sta  0.000032\n",
      "26        ests  0.000032           Ḩ  0.000032\n",
      "27      ptions  0.000032       rások  0.000032\n",
      "28       ables  0.000032    ferences  0.000032\n",
      "29     ensions  0.000032        RESS  0.000032\n",
      "30      itudes  0.000032     ▁realiz  0.000032\n",
      "31      atures  0.000032  googleapis  0.000032\n",
      "32       icles  0.000032       agens  0.000032\n",
      "33      iments  0.000032       okrat  0.000032\n",
      "34      utions  0.000032         пли  0.000032\n",
      "35        izes  0.000032         дні  0.000032\n",
      "36        ises  0.000032        ▁you  0.000032\n",
      "37        asts  0.000032       inals  0.000032\n",
      "38       esses  0.000032       antes  0.000032\n",
      "39        uses  0.000032    férences  0.000032\n",
      "S 4.1129456\n",
      "        token      prob       token      prob\n",
      "0         ▁in  0.000032           -  0.000033\n",
      "1         ▁by  0.000032           ,  0.000033\n",
      "2          ▁a  0.000032         ▁in  0.000032\n",
      "3       ▁when  0.000032      <0xE6>  0.000032\n",
      "4       ▁this  0.000032           .  0.000032\n",
      "5         ▁if  0.000032           (  0.000032\n",
      "6        ▁and  0.000032         ▁to  0.000032\n",
      "7       ▁konn  0.000032      <0xE8>  0.000032\n",
      "8        ▁the  0.000032          ▁w  0.000032\n",
      "9        ▁for  0.000032          ▁b  0.000032\n",
      "10        ▁as  0.000032           '  0.000032\n",
      "11      ▁your  0.000032           \"  0.000032\n",
      "12      ▁with  0.000032           ǧ  0.000032\n",
      "13        ▁at  0.000032        ację  0.000032\n",
      "14      ▁each  0.000032          ▁с  0.000032\n",
      "15       ▁our  0.000032           s  0.000032\n",
      "16       ▁his  0.000032        тому  0.000032\n",
      "17   ▁version  0.000032           ◄  0.000032\n",
      "18   ▁because  0.000032      ongodb  0.000032\n",
      "19        ▁an  0.000032       ▁того  0.000032\n",
      "20     ▁movie  0.000032      <0xED>  0.000032\n",
      "21       ▁him  0.000032      <0xE5>  0.000032\n",
      "22      ▁page  0.000032           ̯  0.000032\n",
      "23  ▁category  0.000032           ώ  0.000032\n",
      "24     ▁while  0.000032          ▁s  0.000032\n",
      "25       ▁but  0.000032  ▁somewhere  0.000032\n",
      "26     ▁where  0.000032          ▁h  0.000032\n",
      "27      ▁list  0.000032      ▁fresh  0.000032\n",
      "28      ▁year  0.000032           :  0.000032\n",
      "29        ▁to  0.000032           /  0.000032\n",
      "30       ▁you  0.000032           l  0.000032\n",
      "31        arg  0.000032      undert  0.000032\n",
      "32     ▁their  0.000032       raine  0.000032\n",
      "33   ▁through  0.000032           ್  0.000032\n",
      "34        ▁on  0.000032         ▁Vé  0.000032\n",
      "35        ▁or  0.000032        nung  0.000032\n",
      "36   ▁article  0.000032          ▁a  0.000032\n",
      "37      ▁book  0.000032        herr  0.000032\n",
      "38      ▁here  0.000032        iane  0.000032\n",
      "39     ▁month  0.000032         ▁In  0.000032\n",
      "S 4.085633\n",
      "            token      prob        token      prob\n",
      "0           textt  0.000032          ▁to  0.000032\n",
      "1        makeText  0.000032            ら  0.000032\n",
      "2         archivi  0.000032          <s>  0.000032\n",
      "3            read  0.000032           $.  0.000032\n",
      "4               .  0.000032       Brainz  0.000032\n",
      "5         Portail  0.000032           ▁…  0.000032\n",
      "6             omb  0.000032     ▁Notices  0.000032\n",
      "7           utter  0.000032         ▁etc  0.000032\n",
      "8    ▁Хронологија  0.000032  ambiguation  0.000032\n",
      "9             .).  0.000032          iat  0.000032\n",
      "10        données  0.000032          rii  0.000032\n",
      "11            ▁%.  0.000032          ují  0.000032\n",
      "12             .;  0.000032           rf  0.000032\n",
      "13  ▁bezeichneter  0.000032         znam  0.000032\n",
      "14            add  0.000032           ▁t  0.000032\n",
      "15            .):  0.000032            Ő  0.000032\n",
      "16            emp  0.000032          xes  0.000032\n",
      "17           olds  0.000032      ▁článku  0.000032\n",
      "18    ▁Einzelnach  0.000032        -----  0.000032\n",
      "19           apes  0.000032         ▁and  0.000032\n",
      "20            uff  0.000032         érez  0.000032\n",
      "21              紀  0.000032         álva  0.000032\n",
      "22             aw  0.000032         SION  0.000032\n",
      "23             .]  0.000032            ¦  0.000032\n",
      "24           ails  0.000032        ipage  0.000032\n",
      "25            ask  0.000032        creen  0.000032\n",
      "26           alet  0.000032        ▁happ  0.000032\n",
      "27             %.  0.000032       onnées  0.000032\n",
      "28    ▁exceptions  0.000032         ować  0.000032\n",
      "29            ▁$.  0.000032          ▁Py  0.000032\n",
      "30          older  0.000032           ▁&  0.000032\n",
      "31           alle  0.000032         atge  0.000032\n",
      "32           ools  0.000032        edeut  0.000032\n",
      "33            unn  0.000032         refs  0.000032\n",
      "34            att  0.000032       ategor  0.000032\n",
      "35       ▁recover  0.000032           %.  0.000032\n",
      "36            enz  0.000032            并  0.000032\n",
      "37            aff  0.000032            夢  0.000032\n",
      "38             !.  0.000032         ▁not  0.000032\n",
      "39           unch  0.000032          ▁fo  0.000032\n",
      "S 3.9427152\n",
      "      token      prob       token      prob\n",
      "0        es  0.000032           -  0.000033\n",
      "1      ages  0.000032           ,  0.000033\n",
      "2       ins  0.000032           .  0.000033\n",
      "3     Deleg  0.000032           /  0.000033\n",
      "4      ates  0.000032           (  0.000033\n",
      "5       ids  0.000032           :  0.000033\n",
      "6      ines  0.000032           ?  0.000032\n",
      "7      ives  0.000032           _  0.000032\n",
      "8      ides  0.000032           ;  0.000032\n",
      "9       ags  0.000032           !  0.000032\n",
      "10     Unis  0.000032           ▁  0.000032\n",
      "11      its  0.000032          ▁a  0.000032\n",
      "12    ▁When  0.000032          ▁(  0.000032\n",
      "13     ases  0.000032    enschaft  0.000032\n",
      "14     tout  0.000032  artifactId  0.000032\n",
      "15      als  0.000032          ▁M  0.000032\n",
      "16   ▁Where  0.000032          ▁H  0.000032\n",
      "17     ards  0.000032          -(  0.000032\n",
      "18        ы  0.000032           ￼  0.000032\n",
      "19     ings  0.000032         ▁++  0.000032\n",
      "20     ures  0.000032      <0xED>  0.000032\n",
      "21      ils  0.000032         ijk  0.000032\n",
      "22      ies  0.000032          ▁ш  0.000032\n",
      "23    ▁That  0.000032           '  0.000032\n",
      "24      ics  0.000032          ▁Ј  0.000032\n",
      "25        官  0.000032      ▁dolor  0.000032\n",
      "26     oses  0.000032          ▁−  0.000032\n",
      "27      ▁If  0.000032      ▁Aires  0.000032\n",
      "28        ツ  0.000032           め  0.000032\n",
      "29     ions  0.000032           ్  0.000032\n",
      "30    daten  0.000032      ouvern  0.000032\n",
      "31      ols  0.000032           ्  0.000032\n",
      "32     ires  0.000032           ʲ  0.000032\n",
      "33     ents  0.000032          ▁є  0.000032\n",
      "34     icks  0.000032         .~\\  0.000032\n",
      "35  AppData  0.000032       ▁denn  0.000032\n",
      "36    ▁This  0.000032           ・  0.000032\n",
      "37     ▁kle  0.000032       iture  0.000032\n",
      "38     ells  0.000032         .\\r  0.000032\n",
      "39    aries  0.000032      ▁explo  0.000032\n",
      "S 3.870231\n",
      "           token      prob           token      prob\n",
      "0              6  0.000032             ▁an  0.000032\n",
      "1              8  0.000032           ▁...)  0.000032\n",
      "2              7  0.000032            Sito  0.000032\n",
      "3              9  0.000032              ▁…  0.000032\n",
      "4             +)  0.000032          oreign  0.000032\n",
      "5              4  0.000032               ∃  0.000032\n",
      "6              0  0.000032  disambiguation  0.000032\n",
      "7              5  0.000032            ▁...  0.000032\n",
      "8         ensure  0.000032             ](#  0.000032\n",
      "9        ▁arrest  0.000032            sime  0.000032\n",
      "10         overy  0.000032              ▁C  0.000032\n",
      "11        number  0.000032           стран  0.000032\n",
      "12  ▁Хронологија  0.000032         Vorlage  0.000032\n",
      "13         lapse  0.000032         ▁tématu  0.000032\n",
      "14  ▁improvement  0.000032            adal  0.000032\n",
      "15       ▁faster  0.000032             orb  0.000032\n",
      "16            ▁&  0.000032           CLARE  0.000032\n",
      "17   ▁incomplete  0.000032               ﬁ  0.000032\n",
      "18      lacement  0.000032            </s>  0.000032\n",
      "19             +  0.000032             ▁or  0.000032\n",
      "20         istre  0.000032               ḩ  0.000032\n",
      "21        ithmet  0.000032             ▁És  0.000032\n",
      "22           ity  0.000032              ▁s  0.000032\n",
      "23       itation  0.000032            than  0.000032\n",
      "24       agement  0.000032          ▁thous  0.000032\n",
      "25       ▁lowest  0.000032             )..  0.000032\n",
      "26       closure  0.000032           ▁LCCN  0.000032\n",
      "27             3  0.000032             ...  0.000032\n",
      "28          ▁AND  0.000032          <0xD1>  0.000032\n",
      "29         ensed  0.000032            ...,  0.000032\n",
      "30        aining  0.000032            Tube  0.000032\n",
      "31          ance  0.000032            ywna  0.000032\n",
      "32      ribution  0.000032              ▁→  0.000032\n",
      "33      ▁equival  0.000032          ▁miesz  0.000032\n",
      "34         arten  0.000032             сок  0.000032\n",
      "35            )-  0.000032         inition  0.000032\n",
      "36         oding  0.000032         ▁článku  0.000032\n",
      "37    ▁expensive  0.000032            cref  0.000032\n",
      "38       ▁sooner  0.000032             fér  0.000032\n",
      "39         ionic  0.000032              ța  0.000032\n",
      "S 3.7826917\n",
      "       token      prob    token      prob\n",
      "0       ▁the  0.000032        ,  0.000033\n",
      "1         ▁a  0.000032      ▁to  0.000032\n",
      "2     ▁their  0.000032        ▁  0.000032\n",
      "3      ▁your  0.000032      ▁in  0.000032\n",
      "4          ,  0.000032        ǧ  0.000032\n",
      "5      ▁this  0.000032      ▁if  0.000032\n",
      "6       ▁and  0.000032   ▁again  0.000032\n",
      "7     ▁these  0.000032       ▁(  0.000032\n",
      "8      ▁them  0.000032    folge  0.000032\n",
      "9       ▁any  0.000032   selves  0.000032\n",
      "10       ▁it  0.000032  Constra  0.000032\n",
      "11     ▁hina  0.000032       ,(  0.000032\n",
      "12     ▁konn  0.000032       ▁å  0.000032\n",
      "13      ▁our  0.000032        ṃ  0.000032\n",
      "14       ica  0.000032     ▁for  0.000032\n",
      "15      ▁its  0.000032     ▁Оте  0.000032\n",
      "16      ▁his  0.000032     zyma  0.000032\n",
      "17       ▁an  0.000032      ▁as  0.000032\n",
      "18       ▁my  0.000032       .:  0.000032\n",
      "19       ola  0.000032      ccc  0.000032\n",
      "20       ita  0.000032   morrow  0.000032\n",
      "21   ▁länkar  0.000032        내  0.000032\n",
      "22    ▁years  0.000032     udad  0.000032\n",
      "23       oba  0.000032   ▁ahead  0.000032\n",
      "24    ▁those  0.000032     appa  0.000032\n",
      "25    ▁spole  0.000032     inal  0.000032\n",
      "26       ▁if  0.000032    ▁scen  0.000032\n",
      "27     ▁some  0.000032      sak  0.000032\n",
      "28       ▁to  0.000032        գ  0.000032\n",
      "29  ▁another  0.000032       ▁o  0.000032\n",
      "30      ular  0.000032       .,  0.000032\n",
      "31      ▁you  0.000032    ▁konn  0.000032\n",
      "32         ѐ  0.000032       ük  0.000032\n",
      "33      ▁him  0.000032   mapsto  0.000032\n",
      "34     ▁time  0.000032        (  0.000032\n",
      "35         ╬  0.000032       uw  0.000032\n",
      "36       ▁in  0.000032     прав  0.000032\n",
      "37     istan  0.000032     ════  0.000032\n",
      "38  ▁listade  0.000032        !  0.000032\n",
      "39        ya  0.000032        :  0.000032\n",
      "S 3.7666528\n",
      "     token      prob        token      prob\n",
      "0        2  0.000033            .  0.000033\n",
      "1        1  0.000032            ▁  0.000032\n",
      "2        3  0.000032          ène  0.000032\n",
      "3        5  0.000032         ének  0.000032\n",
      "4        4  0.000032         orem  0.000032\n",
      "5        0  0.000032           ▁b  0.000032\n",
      "6        6  0.000032          kbd  0.000032\n",
      "7        7  0.000032           ▁F  0.000032\n",
      "8        8  0.000032  ▁Einzelnach  0.000032\n",
      "9        ­  0.000032      ershell  0.000032\n",
      "10       9  0.000032        ▁Tout  0.000032\n",
      "11  <0xEF>  0.000032         tern  0.000032\n",
      "12       ½  0.000032       <0xE6>  0.000032\n",
      "13         0.000032      isecond  0.000032\n",
      "14       ¬  0.000032          ści  0.000032\n",
      "15  <0xC2>  0.000032          hes  0.000032\n",
      "16       ¼  0.000032         pres  0.000032\n",
      "17       ©  0.000032           .“  0.000032\n",
      "18       ³  0.000032          cdn  0.000032\n",
      "19  <0xE0>  0.000032         oust  0.000032\n",
      "20       ·  0.000032          rie  0.000032\n",
      "21       ²  0.000032        строй  0.000032\n",
      "22       �  0.000032           :@  0.000032\n",
      "23   iddle  0.000032       <0xE8>  0.000032\n",
      "24       ​  0.000032        ölker  0.000032\n",
      "25  <0xE6>  0.000032           ▁n  0.000032\n",
      "26  <0xE3>  0.000032  Wikispecies  0.000032\n",
      "27     url  0.000032           zó  0.000032\n",
      "28    utch  0.000032         ▁вос  0.000032\n",
      "29     idd  0.000032        ▁ciel  0.000032\n",
      "30       ¨  0.000032        unicí  0.000032\n",
      "31    ivel  0.000032          ßer  0.000032\n",
      "32         0.000032         eton  0.000032\n",
      "33       ▁  0.000032            Ї  0.000032\n",
      "34       «  0.000032           äg  0.000032\n",
      "35     urr  0.000032       ▁tiene  0.000032\n",
      "36   ethod  0.000032       ▁связи  0.000032\n",
      "37       ‑  0.000032         stav  0.000032\n",
      "38       ¹  0.000032         ▁Kos  0.000032\n",
      "39       ñ  0.000032    ▁circumst  0.000032\n",
      "S 3.721647\n",
      "             token      prob            token      prob\n",
      "0                ❯  0.000032              <s>  0.000032\n",
      "1               :   0.000032          ▁echter  0.000032\n",
      "2     ▁Хронологија  0.000032             ▁way  0.000032\n",
      "3           ▁zvuky  0.000032              ▁it  0.000032\n",
      "4    ▁Begriffsklär  0.000032           gesamt  0.000032\n",
      "5         férences  0.000032                ‐  0.000032\n",
      "6             card  0.000032              ;</  0.000032\n",
      "7                ▸  0.000032              sBy  0.000032\n",
      "8          ulation  0.000032            ▁Read  0.000032\n",
      "9            owner  0.000032              ppa  0.000032\n",
      "10               ✿  0.000032               ▁–  0.000032\n",
      "11      ▁assigning  0.000032           ührung  0.000032\n",
      "12         ▁determ  0.000032           icture  0.000032\n",
      "13          icture  0.000032                ¦  0.000032\n",
      "14       ▁tutorial  0.000032             !...  0.000032\n",
      "15           cycle  0.000032  ▁setContentView  0.000032\n",
      "16             ▁IV  0.000032            angol  0.000032\n",
      "17            ▁upd  0.000032            ▁down  0.000032\n",
      "18             box  0.000032                朝  0.000032\n",
      "19         ▁odkazy  0.000032            ▁spin  0.000032\n",
      "20           strip  0.000032               `-  0.000032\n",
      "21       ification  0.000032            CCESS  0.000032\n",
      "22            ▁Alo  0.000032            typen  0.000032\n",
      "23            line  0.000032               it  0.000032\n",
      "24        ▁adapter  0.000032               őd  0.000032\n",
      "25        irectory  0.000032        scription  0.000032\n",
      "26       ▁emulator  0.000032            ▁Glad  0.000032\n",
      "27        ViewById  0.000032              iva  0.000032\n",
      "28          etwork  0.000032                包  0.000032\n",
      "29              IX  0.000032             ниче  0.000032\n",
      "30           uture  0.000032             тиче  0.000032\n",
      "31           omial  0.000032            eller  0.000032\n",
      "32     ▁identifier  0.000032            ldots  0.000032\n",
      "33           ology  0.000032              ède  0.000032\n",
      "34  ActivityThread  0.000032              nah  0.000032\n",
      "35             ase  0.000032              тил  0.000032\n",
      "36               🌍  0.000032                Ε  0.000032\n",
      "37            band  0.000032             this  0.000032\n",
      "38              kę  0.000032          alement  0.000032\n",
      "39       ▁Kontrola  0.000032           stract  0.000032\n",
      "S 3.5181408\n",
      "   token      prob         token      prob\n",
      "0     ).  0.000033             -  0.000033\n",
      "1      )  0.000033             ‑  0.000032\n",
      "2     ),  0.000033            -.  0.000032\n",
      "3     .)  0.000033            -)  0.000032\n",
      "4     );  0.000033            -}  0.000032\n",
      "5    .).  0.000033             ‐  0.000032\n",
      "6    .),  0.000033            -(  0.000032\n",
      "7      ]  0.000033            ▁C  0.000032\n",
      "8     ?)  0.000032           chr  0.000032\n",
      "9     ):  0.000032             ś  0.000032\n",
      "10    )?  0.000032           ová  0.000032\n",
      "11     ）  0.000032          ...]  0.000032\n",
      "12    ].  0.000032    ▁otherwise  0.000032\n",
      "13    .]  0.000032           edi  0.000032\n",
      "14    ))  0.000032           aze  0.000032\n",
      "15    !)  0.000032        <0xBA>  0.000032\n",
      "16    ],  0.000032             +  0.000032\n",
      "17   '),  0.000032            мі  0.000032\n",
      "18    )]  0.000032          ...)  0.000032\n",
      "19  );\\r  0.000032      servable  0.000032\n",
      "20    ')  0.000032            ?\"  0.000032\n",
      "21  ...)  0.000032          idia  0.000032\n",
      "22    )\"  0.000032  MainActivity  0.000032\n",
      "23   )..  0.000032            +)  0.000032\n",
      "24   )\\r  0.000032            -,  0.000032\n",
      "25   ▁).  0.000032             ▼  0.000032\n",
      "26   ▁),  0.000032          ▁...  0.000032\n",
      "27    ▁)  0.000032             џ  0.000032\n",
      "28   )).  0.000032           CLC  0.000032\n",
      "29   )),  0.000032        ▁Reich  0.000032\n",
      "30    ];  0.000032             ネ  0.000032\n",
      "31   ));  0.000032           кої  0.000032\n",
      "32    ])  0.000032         ichte  0.000032\n",
      "33   ())  0.000032            $-  0.000032\n",
      "34   )\",  0.000032          ▁Cet  0.000032\n",
      "35    )(  0.000032           ▁LI  0.000032\n",
      "36    \")  0.000032            ?)  0.000032\n",
      "37    }.  0.000032           ▁Жи  0.000032\n",
      "38    _)  0.000032           èce  0.000032\n",
      "39   ').  0.000032           >::  0.000032\n"
     ]
    }
   ],
   "source": [
    "for i in range(20):\n",
    "    print('S', Sh[i])\n",
    "    #u, v = U[:,i], V[:,i]\n",
    "    #print('U ENTROPY', entropy(softmax(u)))\n",
    "    #print('V ENTROPY', entropy(softmax(v)))\n",
    "    print(pd.concat([topk(Uh[:,i]), topk(Vh[i])], axis=1))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "19874b0d-50e5-470a-af3c-2e1429bc4a37",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
