{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import scipy\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "from scipy.io import loadmat\n",
    "from scipy.stats import pearsonr\n",
    "from scipy.spatial import distance_matrix\n",
    "from sklearn.decomposition import PCA\n",
    "from sklearn import manifold\n",
    "import pylab\n",
    "import scipy.cluster.hierarchy as sch\n",
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 46,
   "metadata": {},
   "outputs": [],
   "source": [
    "path = os.path.join('cichy_data', 'all_noshuffle_wavenetclass_semb10_drop0.4', 'sub_emb.mat')\n",
    "data = np.array(loadmat(path)['X'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(15, 10)"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "data.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 47,
   "metadata": {},
   "outputs": [],
   "source": [
    "# pairwise distances\n",
    "dist_mat = distance_matrix(data, data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "for d in dist_mat:\n",
    "    d = [str(t) for t in d]\n",
    "    #print('\\t'.join(d))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# cluster embeddings\n",
    "mds = manifold.MDS()\n",
    "mds_data = mds.fit_transform(data)\n",
    "tsne = manifold.TSNE()\n",
    "tsne_data = tsne.fit_transform(data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<matplotlib.collections.PathCollection at 0x7fab68938ac0>"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAX8AAAD4CAYAAAAEhuazAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjMuNCwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8QVMy6AAAACXBIWXMAAAsTAAALEwEAmpwYAAAUQElEQVR4nO3dcYic933n8feniuIuzYWNayWVVsrZR3WichyiZhEud9wdF3OrllKpBoPK0QgaEA3uXQuHqFVDSzmM0xPkj7R1iriWOODUCKrKbhuf4piGUEjirKsksuxsrdQ01krYW8pSh1tcWfn2j31kj+RZaXdndmdmn/cLhn3m+8zMfn/amY9mnuc3z5OqQpLULj8y6AYkSevP8JekFjL8JamFDH9JaiHDX5Ja6F2DbmC5brvttrr99tsH3YYkjZTnnnvuH6tqy/X1kQn/22+/nenp6UG3IUkjJck/dKu72UeSWsjwl6QWMvwlqYUMf0lqIcNfklpoZGb7SN2cOjPLsdMzXJxfYNv4GEemdnFgz8Sg25KGnuGvkXXqzCxHT55l4fIVAGbnFzh68iyA/wFIN2H4a2QdOz3zVvBftXD5CsdOzxj+Q8JPZsPL8NfIuji/sKK61pefzIabO3w1sraNj62orvV1o09mGjzDXyPryNQuxjZvuqY2tnkTR6Z2DagjdfKT2XDrOfyT/GiSZ5N8O8m5JL/b1G9N8nSSl5qf7+u4z9Ek55PMJJnqtQe104E9Ezx8711MjI8RYGJ8jIfvvctNCkPCT2bDrR/b/N8A/mtV/SDJZuBvkjwF3As8U1WfSvIA8ADwm0l2AweBO4FtwJeT/PuqurLUL5CWcmDPhGE/pI5M7bpmmz/4yWyY9PzOvxb9oLm6ubkUsB94tKk/ChxolvcDj1fVG1X1MnAe2NtrH5KGi5/MhltfZvsk2QQ8B/wk8IdV9Y0kH6iqSwBVdSnJ+5ubTwBf77j7habW7XEPA4cBPvjBD/ajVUnryE9mw6svO3yr6kpVfQTYDuxN8qEb3DzdHmKJxz1eVZNVNbllyzvORSBJWqW+zvapqnngK8A+4NUkWwGan681N7sA7Oi423bgYj/7kCTdWD9m+2xJMt4sjwH3AN8FngQONTc7BDzRLD8JHExyS5I7gJ3As732IUlavn5s898KPNps9/8R4ERV/WWSrwEnknwC+D5wH0BVnUtyAngBeBO435k+krS+UtV1c/vQmZycLM/hK0krk+S5qpq8vu43fCWphQx/SWohw1+SWsjwl6QWMvwlqYUMf0lqIcNfklrI8JekFjL8JamFDH9JaiHDX5JayPCXpBYy/CWphQx/SWohw1+SWsjwl6QWMvwlqYUMf0lqIcNfklrI8JekFjL8JamFDH9JaiHDX5JaqOfwT7IjyV8neTHJuSS/3tRvTfJ0kpean+/ruM/RJOeTzCSZ6rUHSdLK9OOd/5vA/6qqnwLuBu5Psht4AHimqnYCzzTXadYdBO4E9gGPJNnUhz4kScvUc/hX1aWq+ttm+XXgRWAC2A882tzsUeBAs7wfeLyq3qiql4HzwN5e+5AkLV9ft/knuR3YA3wD+EBVXYLF/yCA9zc3mwBe6bjbhabW7fEOJ5lOMj03N9fPViWp1foW/kneA/wZ8BtV9c83ummXWnW7YVUdr6rJqprcsmVLP9qUJNGn8E+ymcXgf6yqTjblV5NsbdZvBV5r6heAHR133w5c7EcfkqTl6cdsnwB/DLxYVZ/uWPUkcKhZPgQ80VE/mOSWJHcAO4Fne+1DkrR87+rDY/wH4JeBs0m+1dR+C/gUcCLJJ4DvA/cBVNW5JCeAF1icKXR/VV3pQx+SpGXqOfyr6m/ovh0f4GNL3Och4KFef7ckaXX8hq8ktZDhL0ktZPhLUgv1Y4evpCFy6swsx07PcHF+gW3jYxyZ2sWBPV2/R6kWM/xXwBeVht2pM7McPXmWhcuLE+hm5xc4evIsgM9VXcPNPst09UU1O79A8faL6tSZ2UG3Jr3l2OmZt4L/qoXLVzh2emZAHWlY+c5/mW70ovId1cr4CWrtXJxfWFFd7eU7/2XyRdUffoJaW9vGx1ZUV3sZ/svki6o/3Cyxto5M7WJs87WnxxjbvIkjU7sG1JGGleG/TL6o+sNPUGvrwJ4JHr73LibGxwgwMT7Gw/fe5WY1vYPb/Jfp6ovHbdW92TY+xmyXoPcTVP8c2DPh81I3ZfivgC+q3h2Z2nXNVETwE5Q0CIa/1pWfoLRRjPqsNcNf685PUBp1G+HLdO7wlaQV2giz1gx/SVqhjTBrzfCXpBXaCN/7MfwlaYU2wvd+3OErSSu0EWatGf6StAqjPmvNzT6S1EKGvyS1kOEvSS3Ul/BP8idJXkvyfEft1iRPJ3mp+fm+jnVHk5xPMpNkqh89SJKWr1/v/D8H7Luu9gDwTFXtBJ5prpNkN3AQuLO5zyNJNiFJWjd9Cf+q+irwT9eV9wOPNsuPAgc66o9X1RtV9TJwHtjbjz4kScuzltv8P1BVlwCan+9v6hPAKx23u9DUJEnrZBA7fNOlVl1vmBxOMp1kem5ubo3bkqT2WMvwfzXJVoDm52tN/QKwo+N224GL3R6gqo5X1WRVTW7ZsmUNW5WkdlnL8H8SONQsHwKe6KgfTHJLkjuAncCza9iHJOk6fTm8Q5I/Bf4LcFuSC8DvAJ8CTiT5BPB94D6AqjqX5ATwAvAmcH9VXen6wJKkNdGX8K+qX1pi1ceWuP1DwEP9+N2SpJXzG76S1EKGvyS1kOEvSS1k+EtSCxn+ktRChr8ktZDhL0ktZPhLUgsZ/pLUQoa/JLWQ4S9JLWT4S1ILGf6S1EKGvyS1UF8O6Sy10akzsxw7PcPF+QW2jY9xZGoXB/Z4OmqNBsNfWoVTZ2Y5evIsC5cXz0M0O7/A0ZNnAfwPQCPBzT7SKhw7PfNW8F+1cPkKx07PDKgjaWUMf2kVLs4vrKguDRvDX1qFbeNjK6pLw8bwl1bhyNQuxjZvuqY2tnkTR6Z2DagjaWXc4SutwtWdus720agy/KVVOrBnwrDXyHKzjyS1kOEvSS00sPBPsi/JTJLzSR4YVB+S1EYDCf8km4A/BH4W2A38UpLdg+hFktpoUO/89wLnq+rvq+pfgMeB/QPqRZJaZ1DhPwG80nH9QlO7RpLDSaaTTM/Nza1bc5K00Q1qqme61OodharjwHGAycnJd6yXNNw88unwGlT4XwB2dFzfDlwcUC9agi9c9cIjnw63QW32+SawM8kdSd4NHASeHFAv6uLqC3d2foHi7RfuqTOzg25NI8Ijnw63gYR/Vb0J/BpwGngROFFV5wbRi7rzhateeeTT4TawwztU1ReBLw7q9+vGfOGqV9vGx5jt8nzxyKfDwW/4qisPWaxeeeTT4Wb4qytfuOrVgT0TPHzvXUyMjxFgYnyMh++9y529Q8KjeqorD1msfvDIp8PL8NeSfOFKG5ebfSSphTb0O3+/pCRJ3W3Y8PfbhZK0tA272ccvKUnS0jZs+PslJUla2oYNf7+kJElL27Dh75eUJGlpG3aHr19SkjTK1nq24oYNf/BLSpJG03rMVtywm30kaVStx2xFw1+Shsx6zFY0/CVpyKzHbEXDX5KGzHrMVtzQO3wlaRStx2xFw1+ShtBaz1Z0s48ktZDhL0ktZPhLUgsZ/pLUQj2Ff5L7kpxL8sMkk9etO5rkfJKZJFMd9Y8mOdus+0yS9NKDJGnlen3n/zxwL/DVzmKS3cBB4E5gH/BIkquTVj8LHAZ2Npd9PfYgSVqhnsK/ql6sqm4Hm9gPPF5Vb1TVy8B5YG+SrcB7q+prVVXA54EDvfQgSVq5tdrmPwG80nH9QlObaJavr3eV5HCS6STTc3Nza9KoJLXRTb/kleTLwE90WfVgVT2x1N261OoG9a6q6jhwHGBycnLJ20mSVuam4V9V96zicS8AOzqubwcuNvXtXeqSpHW0Vpt9ngQOJrklyR0s7th9tqouAa8nubuZ5fNxYKlPD5KkNdLrVM9fTHIB+Bngr5KcBqiqc8AJ4AXg/wH3V9XVMxN8Evi/LO4E/h7wVC89SJJWLouTbobf5ORkTU9PD7oN6S1rfY5VqR+SPFdVk9fXPaqntArrcY5VaS15eAdpFdbjHKvSWjL8pVVYj3OsSmvJ8JdWYT3OsSqtJcNfWoX1OMeqtJbc4SutwnqcY1VaS4a/tEprfY5VaS252UeSWsjwl6QWMvwlqYUMf0lqIcNfklrI8JekFjL8JamFDH9JaiHDX5JayPCXpBYy/CWphQx/SWohw1+SWsjwl6QWMvwlqYU8nn9LnDoz64lHNJR8bg5GT+/8kxxL8t0k30ny50nGO9YdTXI+yUySqY76R5OcbdZ9Jkl66UE3d+rMLEdPnmV2foECZucXOHryLKfOzA66NbWcz83B6XWzz9PAh6rqw8DfAUcBkuwGDgJ3AvuAR5JcPeHpZ4HDwM7msq/HHnQTx07PsHD5yjW1hctXOHZ6ZkAdSYt8bg5OT+FfVV+qqjebq18HtjfL+4HHq+qNqnoZOA/sTbIVeG9Vfa2qCvg8cKCXHnRzF+cXVlSX1ovPzcHp5w7fXwGeapYngFc61l1oahPN8vX1rpIcTjKdZHpubq6PrbbLtvGxFdWl9eJzc3BuGv5Jvpzk+S6X/R23eRB4E3jsaqnLQ9UN6l1V1fGqmqyqyS1bttysVS3hyNQuxjZvuqY2tnkTR6Z2DagjaZHPzcG56WyfqrrnRuuTHAJ+HvhYsykHFt/R7+i42XbgYlPf3qWuNXR15oQzKjRsfG4OTt7O61XcOdkHfBr4z1U111G/E/gCsBfYBjwD7KyqK0m+CfwP4BvAF4Hfr6ov3ux3TU5O1vT09Kp7laQ2SvJcVU1eX+91nv8fALcATzczNr9eVb9aVeeSnABeYHFz0P1VdXWX/ieBzwFjLO4jeOodjypJWlM9hX9V/eQN1j0EPNSlPg18qJffK0nqjYd3kKQWMvwlqYUMf0lqIcNfklrI8JekFjL8JamFDH9JaiHDX5JayPCXpBYy/CWphQx/SWohw1+SWsjwl6QWMvwlqYUMf0lqIcNfklrI8JekFjL8JamFDH9JaiHDX5JayPCXpBYy/CWphd416AakUXTqzCzHTs9wcX6BbeNjHJnaxYE9E4NuS1q2nt75J/nfSb6T5FtJvpRkW8e6o0nOJ5lJMtVR/2iSs826zyRJLz1I6+3UmVmOnjzL7PwCBczOL3D05FlOnZkddGvSsvW62edYVX24qj4C/CXw2wBJdgMHgTuBfcAjSTY19/kscBjY2Vz29diDtK6OnZ5h4fKVa2oLl69w7PTMgDqSVq6n8K+qf+64+mNANcv7gcer6o2qehk4D+xNshV4b1V9raoK+DxwoJcepPV2cX5hRXVpGPW8wzfJQ0leAf47zTt/YAJ4peNmF5raRLN8fX2pxz6cZDrJ9NzcXK+tSn2xbXxsRXVpGN00/JN8OcnzXS77AarqwaraATwG/NrVu3V5qLpBvauqOl5Vk1U1uWXLlpuPRloHR6Z2MbZ50zW1sc2bODK1a0AdSSt309k+VXXPMh/rC8BfAb/D4jv6HR3rtgMXm/r2LnVpZFyd1eNsH42ynqZ6JtlZVS81V38B+G6z/CTwhSSfBraxuGP32aq6kuT1JHcD3wA+Dvx+Lz1Ig3Bgz4Rhr5HW6zz/TyXZBfwQ+AfgVwGq6lySE8ALwJvA/VV1dXrEJ4HPAWPAU81FkrSOsjjpZvhNTk7W9PT0oNuQpJGS5Lmqmry+7uEdJKmFDH9JaiHDX5JaaGS2+SeZY3Gn8nLdBvzjGrWzXhzDcHAMw8ExrM6/rap3fFFqZMJ/pZJMd9vJMUocw3BwDMPBMfSXm30kqYUMf0lqoY0c/scH3UAfOIbh4BiGg2Poow27zV+StLSN/M5fkrQEw1+SWmhDhP9GOJdwkmNJvtuM48+TjHesG/oxJLkvybkkP0wyed26oe+/myT7mp7PJ3lg0P0sJcmfJHktyfMdtVuTPJ3kpebn+zrWdf17DFKSHUn+OsmLzfPo15v6yIwjyY8meTbJt5sx/G5TH84xVNXIX1g8NeTV5f8J/FGzvBv4NnALcAfwPWBTs+5Z4GdYPMHMU8DPDngM/w14V7P8e8DvjdIYgJ8CdgFfASY76iPRf5fxbGp6/XfAu5sx7B50X0v0+p+Anwae76j9H+CBZvmB5TyfBjyGrcBPN8v/Bvi7pteRGUfzPH5Ps7yZxcPW3z2sY9gQ7/xrA5xLuKq+VFVvNle/ztsnvRmJMVTVi1XV7QzmI9F/F3uB81X191X1L8DjLI5l6FTVV4F/uq68H3i0WX6Ut/9tu/491qPPG6mqS1X1t83y68CLLJ7idWTGUYt+0Fzd3FyKIR3Dhgh/WNtzCQ/Ar/D2eQ5GdQxXjWr/S/U9Kj5QVZdgMViB9zf1oR9XktuBPSy+cx6pcSTZlORbwGvA01U1tGMYmfAf5LmE++VmY2hu8yCLJ8B57GppiV7XfQzL6b/b3brUBvY3WIFh72+1hnpcSd4D/BnwG9d9on/HTbvUBj6OqrpSVR9h8ZP73iQfusHNBzqGXs/ktW5qA5xL+GZjSHII+HngY82mEBiiMazgb9BpaPpfoaX6HhWvJtlaVZeaTWyvNfWhHVeSzSwG/2NVdbIpj9w4AKpqPslXgH0M6RhG5p3/jSTZ2XH1+nMJH0xyS5I7ePtcwpeA15Pc3cww+TjwxLo2fZ0k+4DfBH6hqv5/x6qRGcMSRrX/bwI7k9yR5N3AQRbHMiqeBA41y4d4+9+2699jAP1do3kO/DHwYlV9umPVyIwjyZY0s/SSjAH3sJhFwzmGQe4d79eFxXcLzwPfAf4CmOhY9yCLe9Fn6JhNAkw29/ke8Ac033Ye4BjOs7j971vN5Y9GaQzAL7L4TuYN4FXg9Cj1v8SYfo7FWSffAx4cdD836PNPgUvA5eZv8Angx4FngJean7fe7O8x4DH8RxY3eXyn4zXwc6M0DuDDwJlmDM8Dv93Uh3IMHt5BklpoQ2z2kSStjOEvSS1k+EtSCxn+ktRChr8ktZDhL0ktZPhLUgv9KxE571IxDufhAAAAAElFTkSuQmCC\n",
      "text/plain": [
       "<Figure size 432x288 with 1 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "plt.scatter(tsne_data[:, 0], tsne_data[:, 1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {},
   "outputs": [],
   "source": [
    "# load accuracy recovery matrix\n",
    "df = pd.read_csv('emb_matrix.txt', sep=\"\\t\", header=0)\n",
    "emb_matrix = df.to_numpy()\n",
    "dist_matrix = 1 - emb_matrix\n",
    "dist_matrix = (dist_matrix + dist_matrix.T)/2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# cluster accuracy matrices\n",
    "mds = manifold.MDS()\n",
    "mds_data = mds.fit_transform(emb_matrix.T)\n",
    "tsne = manifold.TSNE()\n",
    "tsne_data = tsne.fit_transform(emb_matrix.T)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# cluster average recovered accuracies both ways matrices\n",
    "mds = manifold.MDS(dissimilarity='precomputed')\n",
    "mds_data = mds.fit_transform(dist_matrix)\n",
    "tsne = manifold.TSNE(metric='precomputed')\n",
    "tsne_data = tsne.fit_transform(dist_matrix)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<matplotlib.collections.PathCollection at 0x7fab809d46a0>"
      ]
     },
     "execution_count": 34,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAYwAAAD4CAYAAAD//dEpAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjMuNCwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8QVMy6AAAACXBIWXMAAAsTAAALEwEAmpwYAAAXEklEQVR4nO3df4xdZ33n8fdnXUcaKMKEOMGehCZbWVbTTYmzo5Q2VUlKgxNrqU20lZJWNLuLZGWXSAXtWuuoEovUP5LFopWQUlCg0YaqEHWFYyw2YEIoyi4IlDEOsUMYYrKw8Yw3GQKGsowWx/vdP+ZMejOZH+f63pk7P94v6ere+5znuefrM9fzmfOcc89NVSFJ0mL+yaALkCStDgaGJKkVA0OS1IqBIUlqxcCQJLXyS4Mu4HxcdNFFdfnllw+6DElaVY4ePfrDqtp8vuNXZWBcfvnljI6ODroMSVpVkvygl/FOSUmSWjEwJEmtGBiSpFYMDElSKwaGJKmVVXmWlFa2Q8fGOXBkjIkzU2zdNMS+ndvZs2N40GVJ6pGBob46dGycuw4eZ+rsOQDGz0xx18HjAIaGtMr1ZUoqyf1JXkhyYp7lSfKRJCeTPJnkmo5lNyUZa5bt70c9GpwDR8ZeDosZU2fPceDI2IAqktQv/TqG8V+AmxZYfjOwrbntBT4KkGQDcG+z/ErgtiRX9qkmDcDEmamu2iWtHn0JjKp6DPjRAl12A5+saV8HNiXZAlwLnKyqZ6vqF8CDTV+tUls3DXXVLmn1WK6zpIaB5zqen2ra5mt/lSR7k4wmGZ2cnFyyQtWbfTu3M7RxwyvahjZuYN/O7QOqSFK/LFdgZI62WqD91Y1V91XVSFWNbN583tfO0hLbs2OYu2+5iuFNQwQY3jTE3bdc5QFvaQ1YrrOkTgGXdTy/FJgALpinXavYnh3DBoS0Bi3XHsZh4E+as6XeCvykqk4DjwPbklyR5ALg1qavJGmF6cseRpJPA9cDFyU5BfwnYCNAVX0MeBjYBZwEfg7862bZS0nuBI4AG4D7q+qpftQkSeqvvgRGVd22yPIC3jvPsoeZDhRJ0grmtaQkSa0YGJKkVgwMSVIrBoYkqRUDQ5LUipc3lwT4PSZanIEhye8xUStOSUnye0zUioEhye8xUSsGhiS/x0StGBiS/B4TteJBb0kvH9j2LCktxMCQBPg9JlqcU1KSpFYMDElSKwaGJKkVA0OS1EpfAiPJTUnGkpxMsn+O5fuSPNHcTiQ5l+TCZtn3kxxvlo32ox5JUv/1fJZUkg3AvcCNwCng8SSHq+rbM32q6gBwoOn/TuD9VfWjjpe5oap+2GstkqSl0489jGuBk1X1bFX9AngQ2L1A/9uAT/dhvZKkZdSPwBgGnut4fqppe5UkrwFuAj7T0VzAF5McTbJ3vpUk2ZtkNMno5ORkH8qWJHWjH4GROdpqnr7vBL46azrquqq6BrgZeG+S351rYFXdV1UjVTWyefPm3iqWJHWtH4FxCris4/mlwMQ8fW9l1nRUVU009y8ADzE9xSVJWmH6ERiPA9uSXJHkAqZD4fDsTkleD7wN+GxH22uTvG7mMfAO4EQfapIk9VnPZ0lV1UtJ7gSOABuA+6vqqSR3NMs/1nR9F/DFqvo/HcMvAR5KMlPLp6rqC73WJEnqv1TNd7hh5RoZGanRUT+yIUndSHK0qkbOd7yf9JYktWJgSJJaMTAkSa0YGJKkVgwMSVIrBoYkqRUDQ5LUSs8f3JMkde/QsXEOHBlj4swUWzcNsW/ndvbsmPO6rSuGgSFJy+zQsXHuOnicqbPnABg/M8VdB48DrOjQcEpKkpbZgSNjL4fFjKmz5zhwZGxAFbVjYEjSMps4M9VV+0phYEjSMtu6aair9pXCwJCkZbZv53aGNm54RdvQxg3s27l9QBW140FvSVpmMwe2PUtKkrSoPTuGV3xAzOaUlCSplb4ERpKbkowlOZlk/xzLr0/ykyRPNLcPtB0rSVoZep6SSrIBuBe4ETgFPJ7kcFV9e1bX/15V/+I8x0qSBqwfexjXAier6tmq+gXwILB7GcZKkpZRPwJjGHiu4/mppm2230ryrSSfT/LrXY6VJA1YP86SyhxtNev5N4FfqaqfJdkFHAK2tRw7vZJkL7AX4M1vfvN5FytJOj/92MM4BVzW8fxSYKKzQ1X9tKp+1jx+GNiY5KI2Yzte476qGqmqkc2bN/ehbElSN/qxh/E4sC3JFcA4cCvwR50dkrwJeL6qKsm1TAfVi8CZxcZKamc1Xi5bq0vPgVFVLyW5EzgCbADur6qnktzRLP8Y8C+Bf5vkJWAKuLWqCphzbK81SevNar1ctlaXTP/eXl1GRkZqdHR00GVIK8Z193yZ8TmudDq8aYiv7v+9AVSklSjJ0aoaOd/xftJbWgNW6+WytboYGNIasFovl63VxcCQ1oDVerlsrS5erVZaA1br5bK1uqybwPCUQ611q/Fy2Vpd1kVgeMrhymegSyvfujiGceDI2MthMWPq7DkOHBkbUEXqNBPo42emKP4x0A8dGx90aZI6rIvA8JTDlc1Al1aHdREYnnK4shno0uqwLgLDUw5XNgNdWh3WRWDs2THM3bdcxfCmIcL05RLuvuUqD6quEAa6tDqsi7OkwFMOVzI/QyCtDusmMLSyGejSyrcupqQkSb0zMCRJrRgYkqRWDAxJUit9CYwkNyUZS3Iyyf45lv9xkieb29eSvKVj2feTHE/yRBK/Rk+SVqiez5JKsgG4F7gROAU8nuRwVX27o9v/BN5WVT9OcjNwH/CbHctvqKof9lqLJGnp9GMP41rgZFU9W1W/AB4Ednd2qKqvVdWPm6dfBy7tw3olScuoH4ExDDzX8fxU0zaf9wCf73hewBeTHE2yd75BSfYmGU0yOjk52VPBkqTu9eODe5mjrebsmNzAdGD8TkfzdVU1keRi4JEk36mqx171glX3MT2VxcjIyJyvL0laOv3YwzgFXNbx/FJgYnanJL8BfALYXVUvzrRX1URz/wLwENNTXJKkFaYfgfE4sC3JFUkuAG4FDnd2SPJm4CDw7qr6bkf7a5O8buYx8A7gRB9qkiT1Wc9TUlX1UpI7gSPABuD+qnoqyR3N8o8BHwDeCPxVEoCXqmoEuAR4qGn7JeBTVfWFXmuSJPVfqlbf4YCRkZEaHfUjG5LUjSRHmz/Wz4uf9JYktWJgSJJaMTAkSa0YGJKkVgwMSVIrBoYkqRUDQ5LUioEhSWrFwJAktWJgSJJaMTAkSa0YGJKkVgwMSVIrBoYkqRUDQ5LUioEhSWql52/ck6R+OnRsnANHxpg4M8XWTUPs27mdPTuGB12W6NMeRpKbkowlOZlk/xzLk+QjzfInk1zTdqyk9ePQsXHuOnic8TNTFDB+Zoq7Dh7n0LHxQZcm+hAYSTYA9wI3A1cCtyW5cla3m4FtzW0v8NEuxkpaJw4cGWPq7LlXtE2dPceBI2MDqkid+jEldS1wsqqeBUjyILAb+HZHn93AJ2v6C8S/nmRTki3A5S3GakCcGtBymzgz1VW7llc/pqSGgec6np9q2tr0aTMWgCR7k4wmGZ2cnOy5aC3MqQENwtZNQ121a3n1IzAyR1u17NNm7HRj1X1VNVJVI5s3b+6yRHXLqQENwr6d2xnauOEVbUMbN7Bv5/YBVaRO/ZiSOgVc1vH8UmCiZZ8LWozVADg1oEGYmfJ0KnRl6kdgPA5sS3IFMA7cCvzRrD6HgTubYxS/Cfykqk4nmWwxVgOwddMQ43OEg1MDWmp7dgwbECtUz1NSVfUScCdwBHga+LuqeirJHUnuaLo9DDwLnAQ+Dvy7hcb2WpN659SApNkyfeLS6jIyMlKjo6ODLmPN8ywpaW1JcrSqRs53vJ/01rycGpDUyWtJSZJaMTAkSa0YGJKkVgwMSVIrBoYkqRUDQ5LUioEhSWrFwJAktWJgSJJaMTAkSa0YGJKkVgwMSVIrBoYkqRUDQ5LUioEhSWrF78OQpFVgJXyhWU97GEkuTPJIkmea+zfM0eeyJH+f5OkkTyX5045lH0wynuSJ5rarl3okaS06dGycuw4eZ/zMFAWMn5niroPHOXRsfFnr6HVKaj/waFVtAx5tns/2EvDvq+rXgLcC701yZcfyv6yqq5vbwz3WI0lrzoEjY0ydPfeKtqmz5zhwZGxZ6+h1Smo3cH3z+AHgK8B/7OxQVaeB083jf0jyNDAMfLvHdUtdWwm79VK3Js5MddW+VHrdw7ikCYSZYLh4oc5JLgd2AN/oaL4zyZNJ7p9rSqtj7N4ko0lGJycneyxb69FK2a2XurV101BX7Utl0cBI8qUkJ+a47e5mRUl+GfgM8L6q+mnT/FHgV4Grmd4L+fB846vqvqoaqaqRzZs3d7NqCVg5u/VSt/bt3M7Qxg2vaBvauIF9O7cvax2LTklV1e/PtyzJ80m2VNXpJFuAF+bpt5HpsPjbqjrY8drPd/T5OPC5boqXurFSduulbs1Mmw56OrXXYxiHgduBe5r7z87ukCTAXwNPV9VfzFq2ZWZKC3gXcKLHeqR5bd00xPgc4bDcu/XS+dizY3jgx9t6PYZxD3BjkmeAG5vnJNmaZOaMp+uAdwO/N8fpsx9KcjzJk8ANwPt7rEea10rZrZdWq572MKrqReDtc7RPALuax/8DyDzj393L+qVurJTdemm18pPeLXk65tqwEnbrpdXKwGhh5nTMmTNsZk7HBPzlI2nd8OKDLXg6piQZGK14OqYkGRitrJRPWUrSIBkYLXg6piR50LsVT8eUJAOjNU/HlLTeOSUlSWrFwJAktWJgSJJaMTAkSa0YGJKkVgwMSVIrBoYkqRUDQ5LUioEhSWqlp8BIcmGSR5I809y/YZ5+32++ivWJJKPdjpckDV6vexj7gUerahvwaPN8PjdU1dVVNXKe4yVJA9RrYOwGHmgePwDsWebxkqRl0mtgXFJVpwGa+4vn6VfAF5McTbL3PMaTZG+S0SSjk5OTPZYtSerWolerTfIl4E1zLPqzLtZzXVVNJLkYeCTJd6rqsS7GU1X3AfcBjIyMVDdjJUm9WzQwqur351uW5PkkW6rqdJItwAvzvMZEc/9CkoeAa4HHgFbjJUmD1+uU1GHg9ubx7cBnZ3dI8tokr5t5DLwDONF2vCRpZej1C5TuAf4uyXuA/wX8IUCSrcAnqmoXcAnwUJKZ9X2qqr6w0HhJWmqHjo37LZpd6ikwqupF4O1ztE8Au5rHzwJv6Wa8JC2lQ8fGuevgcabOngNg/MwUdx08DmBoLMBPektadw4cGXs5LGZMnT3HgSNjA6podTAwJK07E2emumrXNAND0rqzddNQV+2aZmBI4tCxca6758tcsf+/cd09X+bQsfFBl7Sk9u3cztDGDa9oG9q4gX07tw+ootWh17OkJK1y6/EA8My/y7OkumNgSOvcQgeA1/Iv0D07htf0v28pOCUlrXMeAFZbBoa0znkAWG0ZGNI65wFgteUxDGmd8wCw2jIwJHkAWK04JSVJasXAkCS1YmBIklrxGMY64bX/JfXKwFgH1uOlHyT1X09TUkkuTPJIkmea+zfM0Wd7kic6bj9N8r5m2QeTjHcs29VLPZqb1/6X1A+9HsPYDzxaVduAR5vnr1BVY1V1dVVdDfxz4OfAQx1d/nJmeVU93GM9moOXfpDUD70Gxm7ggebxA8CeRfq/HfheVf2gx/WqC176QVI/9BoYl1TVaYDm/uJF+t8KfHpW251Jnkxy/1xTWuqdl36Q1A+LBkaSLyU5McdtdzcrSnIB8AfAf+1o/ijwq8DVwGngwwuM35tkNMno5ORkN6te9/bsGObuW65ieNMQAYY3DXH3LVd5wFtSV1JV5z84GQOur6rTSbYAX6mqOf9sbQLmvVX1jnmWXw58rqr+2WLrHRkZqdHR0fOuW5LWoyRHq2rkfMf3OiV1GLi9eXw78NkF+t7GrOmoJmRmvAs40WM9kqQl0mtg3APcmOQZ4MbmOUm2Jnn5jKckr2mWH5w1/kNJjid5ErgBeH+P9UiSlkhPH9yrqheZPvNpdvsEsKvj+c+BN87R7929rF+StHy8lpQkqRUDQ5LUioEhSWrFwJAktWJgSJJaMTAkSa0YGJKkVvwCJalP/FZDrXUGhtQHfquh1gOnpKQ+8FsNtR4YGFIf+K2GWg8MDKkP/FZDrQcGhtQHfquh1gMPekt9MHNg27OktJYZGFKf7NkxbEBoTXNKSpLUioEhSWrFwJAktWJgSJJaMTAkSa2kqgZdQ9eSTAI/mNV8EfDDAZTTDWvsD2vsD2vsj9VU469U1ebzfZFVGRhzSTJaVSODrmMh1tgf1tgf1tgf66lGp6QkSa0YGJKkVtZSYNw36AJasMb+sMb+sMb+WDc1rpljGJKkpbWW9jAkSUvIwJAktbKqAiPJHyZ5Ksn/SzLvKWJJbkoyluRkkv0d7RcmeSTJM839G5agxkXXkWR7kic6bj9N8r5m2QeTjHcs2zWIGpt+309yvKljtNvxS11jksuS/H2Sp5v3xZ92LFuy7Tjf+6tjeZJ8pFn+ZJJr2o5dxhr/uKntySRfS/KWjmVz/twHUOP1SX7S8TP8QNuxy1jjvo76TiQ5l+TCZtmSb8ck9yd5IcmJeZb3971YVavmBvwasB34CjAyT58NwPeAfwpcAHwLuLJZ9iFgf/N4P/Cfl6DGrtbR1Pu/mf5ADcAHgf+wxNuxVY3A94GLev03LlWNwBbgmubx64Dvdvysl2Q7LvT+6uizC/g8EOCtwDfajl3GGn8beEPz+OaZGhf6uQ+gxuuBz53P2OWqcVb/dwJfXubt+LvANcCJeZb39b24qvYwqurpqhpbpNu1wMmqeraqfgE8COxulu0GHmgePwDsWYIyu13H24HvVdXsT64vpV63w4rYjlV1uqq+2Tz+B+BpYKm/kGKh99eM3cAna9rXgU1JtrQcuyw1VtXXqurHzdOvA5cuQR091bhEY5eyxtuATy9BHfOqqseAHy3Qpa/vxVUVGC0NA891PD/FP/4SuaSqTsP0Lxvg4iVYf7fruJVXv8nubHYf71+K6Z4uaizgi0mOJtl7HuOXo0YAklwO7AC+0dG8FNtxoffXYn3ajF2uGju9h+m/QmfM93Pvp7Y1/laSbyX5fJJf73LsctVIktcANwGf6Wheju24mL6+F1fcN+4l+RLwpjkW/VlVfbbNS8zR1tdzhxeqscvXuQD4A+CujuaPAn/OdM1/DnwY+DcDqvG6qppIcjHwSJLvNH/R9EUft+MvM/0f9X1V9dOmuS/bca7VzdE2+/01X58lf28usv5Xd0xuYDowfqejeUl/7l3U+E2mp2p/1hyDOgRsazm2H7pZzzuBr1ZV51/7y7EdF9PX9+KKC4yq+v0eX+IUcFnH80uBiebx80m2VNXpZrfshX7XmKSbddwMfLOqnu947ZcfJ/k48LlB1VhVE839C0keYno39jFW0HZMspHpsPjbqjrY8dp92Y5zWOj9tVifC1qMXa4aSfIbwCeAm6vqxZn2BX7uy1pjR/hTVQ8n+askF7UZu1w1dnjVTMEybcfF9PW9uBanpB4HtiW5ovkL/lbgcLPsMHB78/h2oM0eS7e6Wcer5jybX44z3gXMefZDjxatMclrk7xu5jHwjo5aVsR2TBLgr4Gnq+ovZi1bqu240Purs/Y/ac5QeSvwk2Zarc3YZakxyZuBg8C7q+q7He0L/dyXu8Y3NT9jklzL9O+rF9uMXa4am9peD7yNjvfoMm7HxfT3vbiUR/D7fWP6P/4p4P8CzwNHmvatwMMd/XYxfcbM95ieypppfyPwKPBMc3/hEtQ45zrmqPE1TL/5Xz9r/N8Ax4Enmx/glkHUyPTZE99qbk+txO3I9DRKNdvqiea2a6m341zvL+AO4I7mcYB7m+XH6Tijb7735hJsv8Vq/ATw447tNrrYz30ANd7Z1PAtpg/M//ZK247N838FPDhr3LJsR6b/4DwNnGX6d+N7lvK96KVBJEmtrMUpKUnSEjAwJEmtGBiSpFYMDElSKwaGJKkVA0OS1IqBIUlq5f8D+QAFnXxQPMQAAAAASUVORK5CYII=\n",
      "text/plain": [
       "<Figure size 432x288 with 1 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "plt.scatter(mds_data[:, 0], mds_data[:, 1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 48,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/var/folders/nv/wjmf18wd5_j38vg9v0cthl5h0000gn/T/ipykernel_3012/672112163.py:6: ClusterWarning: scipy.cluster: The symmetric non-negative hollow observation matrix looks suspiciously like an uncondensed distance matrix\n",
      "  Y = sch.linkage(D, method='centroid')\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<matplotlib.colorbar.Colorbar at 0x7fab68f40c10>"
      ]
     },
     "execution_count": 48,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAYYAAAD+CAYAAAA+hqL9AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjMuNCwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8QVMy6AAAACXBIWXMAAAsTAAALEwEAmpwYAAAUhUlEQVR4nO3dW3DdV3XH8d/SxZJlW3Zi+SLkGBOSmIpLnODcSAsNlxICxNMZGCADnfQy4aFloNOZAg+lLS8t0xnaPtAWD9cOOIQJpA6UhFIuk1KCG9uIkMg2Do7jWFZiK44t2Ypk6ZzVB118jqRzkdbf52xb38/Mf6Ij7bPO1pGjpb33f69t7i4AAKY01LsDAIC0kBgAAEVIDACAIiQGAEAREgMAoAiJAQBQhMQAAChCYgAAFCExAACKNJX7YkdHh2/atKlGXVlc9uzZM+Dua6YeN69c6q3rVoZiNjXkw/2aiJMLx2hpGA/HaFQ234/LwjFG8s3hGEss/p5I0sDI8nCM1a1nwzHGPZu/K8e8MRxjPB/vy+hY/GcsSS1PD4eeP6KzOuej0/9o337bMn/hZPn/J/c8Pvp9d7899MIFyiaGTZs2affu3Vm9FgqY2TOFj1vXrdR1//KhUMyOpWdCz5+yuiX+S+OqtuPhGCsbXwrHkKTRDH6pHxheH45xRevJcAxJ+vK+m8MxPviqx8IxBsbiCUqSjo+sCMd4YWRZOMbBvrXhGJJ09R/sDT1/l/+w6PELJ3P6v+9vLPucxs6DHaEXnaFsYgAA1JdLymc0eq4WiQEAkubKOYkBADDJJY0rvu43H9yVBAAJc7lyXv6qxMw2m1lPwTVoZh8r1Z4RAwAkLq/YuTnufkDSFkkys0ZJfZIeKNW+bGI4dOKs3vf5R0MdulRt29Klu24qf6cAAES5pFwwMczwFkm/cfdnSjVgKmkBevsHtbOnr97dALBI5OVlr3l6v6R7yzUoO2K4cs0y3ffhW+b7opc8RlEAasWlatYROsyscNPZdnffPrORmS2RdKekT5YLxhoDACSuiptVB9x9axWh3iFpr7s/X64RiQEAEubyLNcYPqAK00gSiQEA0uZSLoO8YGZtkt4m6cOV2pIYACBhLtNYBoUg3X1Y0upq2pIYACBhLimf6d2qlZEYFqi3f1A7dh3JbC/D0qYxve7y2C2wb165L5O+PPHShnCM/Wc6wzFaGrMpU53z+F9bPz+2KRzj3Zti5ZinrF81FI7x9QM3hGOsaBsJx5CkoeHWcIx8Pv4zjlZFnXLw368PPX/0U7PvesxlMGKYD/YxLNDQyDh7GQBccBMb3KzslTVGDAu0opW3DkBt5DMY9c4Hv90AIGFTI4ZaIjEAQMJcplyNZ/1JDACQOKaSAADTkptKouz23Hr7B+vdBQCLhMs05rX9G54RwwJ0d7br+NBovbsBYJFIasRA2e3SGEkBqAV3U85ZfAYAFMinNGLAeTt2HSna6dzbP6juzvY69gjAYjCx+FzbEQMlMaq0s6ePRWcAdTAxlVTuyhojhnno7myfXnNhjQFALbikPBvcAACFsqgQPB8kBgBIGCUxFrGRXJN+Pbg2FOOTa3+cSV/+/uDt4Rivvvy5cIzXLz8cjiFJJ3PLwjFe9orT4Ri/PN0VjiFJb12/PxzjqwM3h2OcHVkSjiFJDQ1VHHVfwcb3PhmOcfi+14VjSNLVHcdDzz/ZPFb02CU2uAEAznMZU0kAgGIsPgMAprmLnc8AgELGzmcAwHmu2o8Y2PkMAInLqaHsVQ0zW2Vm95vZfjPbZ2YlK6RyHkOVpsphTL0f1EoCUAsuy+oEt3+W9LC7v8fMlkhqK9WQqaQF6u5s17Yt2dyXDgDlRDe4mVm7pDdKuluS3P2cpHOl2nMeQwWFVVULayUBQC1MnODWGA1zpaQTkr5sZtdK2iPpo+5+dq7GrDFUQFVVAPXkkvLeUPaS1GFmuwuue2aEaZJ0vaR/dffrJJ2V9IlSr8lUUhVYSwBQT1Uc7Tng7lvLfP2opKPuvmvy8f0qkxgYMQBAwtytmhFDhRj+nKRnzWzz5KfeIqm3VHtGDACQuIz2MXxE0tcn70g6JOkPSzUkMQBAwiYO6onfruruPZLKTTdNIzEk4qrWU9q5+T9CMR4dyWYt5E2dT4VjjObj/7SOnFsdjiFJjxy/KhxjSUMuHGPwXEs4hiR96fAbwjG6N/aHYxwbzObf25o7D4RjHP3Wq8MxGvIejiFJq1vnvNGnak2zypAbtZIAAOdN3JVErSQAQAFOcAMATHOZxuMb3OaFxAAACZs4j4GpJABAAdYYAADTJqqrJrTGQNltFdVJojQGgHqooiRGpiiJUYXh0XFJ0vGhUe3YdaTOvQGwmEzdrlruyhpltyt43+cfnT6Up7d/UDt7+nTXTRvr3S0Ai0btp5IYMVRh6hwGppIA1ENeVvbKGovPAJAwblcFABRxmcbzbHADABS4ENNF5ZAYACBhFNEDAMyS1AY31M5ArkVfOH1lKMbp8bZM+nJqbGk4xm8ti9f7H803h2NIUkvjeDjGu9c/Ho7xPy9eHY4hSbetPxiO0dXyYjjGg7+bzXkZJx7cXLlRJWPxECvaRuJBJK1tHQo9v9lmnP1xgfYqlENiAICEZXWC23yQGAAgcYwYAADTWHwGAMxCYgAATJs4wY27kgAAUzyxEQPnMWi6suqOXUemPwaAWslqjcHMDksakpSTNO7uW0u1ZcRQQXdnu7Zt6dLOnj4NjcTvhweA+cpwxHCbuw9UasR5DFXa2dOnFa3kUQC1NXG0Jye4AQAKuFvZS1KHme0uuO6ZK4yk/zKzPSW+Po0/gQEgcVXsfB4ot2Yw6VZ3P2ZmayX9wMz2u/sjczVkxAAACXPP5sxndz82+d/jkh6QdGOptiQGAEhcFVNJZZnZMjNbMfWxpN+T9ESp9kwlAUDSTLl8+G/4dZIeMDNp4vf+Dnd/uFRjEkMiTo8t1X8+/9pQjLu7/jeTvjx4NNYPSbql/TfhGPefeH04hiStXRorgyxJj556ZTjG0aFV4RiS9MzgZeEY7e+I/3zu7H0hHEOSHjo+GI5x4Ni6cIx8/JevJKmj+Uzo+U2WL3qcxT4Gdz8k6dqq+xB6NQDAheUT6wy1RGIAgMRxHgMAYJpLVS0wZ4nEAABJ42hPAMAMrDEAAIokNZVE2W3p+OCIBs6e0/AolVUB1J57YokBmkgK53KSpLaWJm3b0lXnHgFYbHL5hBIDZbc1a8R0100b69QTAIsVIwYAwDRXdfWQskRiAIDE1fimJBIDACSNxWcAwCzsYwAAFGLEsFiZ1GCxPwt+eKo7k660NsX3bLTaWDjGkwc3hGNI0uZXHgvHyHm8JPPJM23hGJJ0xXtKnq9StcGH4mXE+0bzlRtVofdIZzjGH235WTjGfz/3qnAMSfra/htCz39hZO+sz7HzGQAwjSJ6AIBiLnlKG9wAAAlgKgkAcB4b3AAAMzFiAABMS22DG2W3pd7+wemPuzvb69gTAItWjUcM8ZuzF4nuznZKbgOoE6twVRnFrNHMfmFm3y3XjrLbFUyNmBb7+wCgjrIbMXxU0j5JZac/GDEAQOq8wlUFM9sg6Z2SvlCpLYvPVejtH5y11rJtSxeH9gC48LLb4PZPkv5S0opKDRkxLEBv/6B29vTVuxsAFovKI4YOM9tdcN1T+HQze5ek4+6+p5qXY8RQhe7O9qI1hsV+pxaAGqt8u+qAu28t8/VbJd1pZndIapXUbmZfc/cPztWYEQMAJM68/FWJu3/S3Te4+yZJ75f0o1JJQWLEAABpm8cCc1ZIDIlosrxWLXkpFOPw0OpM+nL3xnht+799/F3hGM3Lz4VjSNKSxlw4xpN7rwjHuOrPfx6OIUnP3v+acIzLbTgc49BwRziGJK1bczocY++p+M/nt9f+JhxDklZ0joSe/7nWMzM+Y9VMJVXN3X8i6Sfl2pAYACB1jBgAAEVIDACAIiQGAMA0l4wT3AAARaiuCgCoJ85jKIMy2wBSUM0mtiwxlVRC4QE9AFBXKZ3gtpjPY1jMIyUACWHnMwBgFhIDAKAQawwAgGIkBgDAFHPJ8rV9TRJDGVN3JnV3lj03GwAurJTuSsJEUqjFfoaVTcO6s+MXoRjLGkYz6cumphfDMW7Y8Ew4xkiuORxDkvrOrAzHyKJk9lP/eHM4hiRdeVn8WNl1S4fCMW5ZlU2Z6hdHrg3HuHZl/D359tPxfkjS73QdCj3/nM/xa5mppHTMPNJTknbsOqLe/kFGEQBqhsXnxO3s6dPQyHi9uwFgMSExpG9FK28bgBqp8lznLPEbDgBSR2IAABQhMQAACiU1lbSYy25z5xGAZKSUGBazWu1fAICyUlt8XsxltwEgGcHEYGatkh6R1KKJ3/v3u/tfl2rPiAEAUhcfMYxKerO7nzGzZkk/NbOH3H3OLf0kBgBImCk+leTuLunM5MPmyatk1IbYywEALjivcFXBzBrNrEfScUk/cPddpdqSGAAgZZOLz+UuSR1mtrvgumdWGPecu2+RtEHSjWb2mlIvyVQSAKSu8qhgwN23VhXK/ZSZ/UTS7ZKemKsNIwYASF1wKsnM1pjZqsmPl0p6q6T9pdozYkjEyoYx3dH2fCjGWx//YCZ9+ZtrvhOO0dk6GI7xwP5s6uO/4gO/DMc48/CV4RivXno4HEOSzuUawzEaMjgS7DvPvS4cQ5LO5ePfT1tj/CySm192OBxDkja3PRd6fmvD2KzPZfDj6pT0VTNr1MSA4Jvu/t1SjUkMAJCyeSwwlwzh/rik66ptT2IAgMQltfMZcxseHVdv/+CsOlLbtnTprps21qlXAC5ZNU4MLD5npLd/UDt74ufOAsBMVdyumilGDAvQ1tI06zzoxVqFFkANpDSVtJjLbpfS2z+o4VHOfAZQIxksPs8XI4YFaGtpoiQ3gJqwyauWKLs9T1MjKBaZAdQMIwYAQKEMNrjNC4kBAFLHiAEAMC21oz0BAAkgMQAACjFiAAAUIzEsTifGl+pzL742FGMsl02Fk0eGNodjPHAgXpI5i3LZkvT0vfHy3VuWHw3H6Hl2QziGJI2dWRKO0XR1/Pu5bc2vwzEkaTgf/34ubzwbjtGY0Z/lLXOUzZ4PmyMLMGIAAJzHzmcAwCwkBgDAFBMb3AAAM5jXdshAYsjQzMN7OLgHQFgd1hg4qOcC4eAeAFlJ6qAezmOYrbd/UN2d7XN+rfDwHt43AJlh8Tlt3Z3tnMUAoKaS2sfAeQwAkADWGAAA0yqsL1QzmjCzK8zsx2a2z8yeNLOPlmvPVBIApC4+YhiX9BfuvtfMVkjaY2Y/cPfeuRqTGAAgYRMb3GKZwd37JfVPfjxkZvskdUkiMQDAxaiK6aIOM9td8Hi7u2+fM5bZJknXSdpVKhiJAQBSVt0GtwF331qpkZktl/QtSR9z98FS7UgMiVjfNKqPrz4YinHf09dn0pePryn5h0TV9lwXv6/h6W/ES3dL0u9vjpfv7h+Ze+/KfDQ2ZVPw5tNvvD8cY8SbwzFO5drCMSSp/9zKcIyfvXRVBj3Jxunc0tDzc3PcE5RFrSQza9ZEUvi6u3+7XFsSAwCkLrj4bGYm6YuS9rn7Zyu153ZVAEhcBiUxbpX0IUlvNrOeyeuOUo0ZMQBAylxSsLqqu/9UEzc4VYXEAACJS6okBgAgAZTEuHRMnc+wY9eRencFwEXK3GX58lfWKLudkVLluHv7J24V5sAeAAvFVNJFaq5y3KXObQCAeUkpMVB2GwDqjxEDAOA8l3QB1hHKITEAQOoYMQAACjGVBAAoFtz5PF8kBgBIHCMGAMA08/gJbvNFYkjEc7kW/cPJV4ZiPPb6ezPpyx1d8VuUv3k0vjHyMyeyOb/gjSsOhGNccdmpcIzHLnt5OIYk/dszbwrHGBmP/69/bUdfOIYkrWp+KRzj5yfXh2O8a8MT4RiS9NTw2tDzR/Nz/Gyy+V+haiQGAEicscYAAJhW3dGemSIxAEDSnLuSAADFuCsJAFAspREDZbcXrlQZbgCYF5esxnclcVDPBTJVhru3f3D6TAYAWBD38lfGKLt9gf3dQ/vq3QUAFzk2uAEAitV4jYGpJABImWti53O5qwIz+5KZHTezqrZ3kxgAIGEml3n5qwpfkXR7ta9JYgCA1AUXn939EUknq3051hgAIHUp7WMAANTZ1BpDeR1mtrvg8XZ3377QlyQxJGJ5w4je0HYwFOOOrusz6cv3+vaGY9yw5+5wDMuoDsCPGq8Jx/ira74bjnFv343hGJK0edXz4RhvWdUbjvHUSLzUtSS9YVns370kfWz1T8Mxdo1m8/30nN4Qev54vnHW56pYRxhw962hFy5AYgCA1HG7KgBgmruUz5e/KjCzeyU9KmmzmR01sz8u154RAwCkLlgryd0/MJ/2JAYASBwnuAEAipEYAADTXFJKRfQ4jyFueHRcbS3kXwALxdGel5y2liZ1LG+pdzcAXMxSSgycxxDHiAtAWEqJAQBQZ6mtMQAA6s2lfK6mr0hiAICUMWIAAMzCGgMAoAiJAQBwHvsYFq1jv1qmT18ZO0/hU4fi5yhI0mdfvDocY+/W+8IxPvNCvB+S9KeX/Soc43vD68Ix1iw9E44hSX3Dq8IxvnL21nCMd66Lv6+SdEvraDjGtgPvC8e4pv14OIYkDby0PPT88fyMoteuqiqoZonEAACpY8QAAChCYgAAnOfcrgoAKOCS59jgBgAolNJUEmW343r7B9Xd2V7vbgC4WE2d+VxDjBgusO7Odm3b0lXvbgC4mKU0YqDsNgDUnzNiAACcx85nAEChOlRXbajcBABQV54vf1XBzG43swNm9pSZfaJcW0YMAJAwl+TBEYOZNUr6nKS3SToq6TEze9Dde+dqT2IAgJS5Z7HB7UZJT7n7IUkys29I2iZpzsTAVBIApC4+ldQl6dmCx0cnPzcn8zKr3WZ2QtIzVXYd8/Nyd18z9YD3GsCkmb8bHpbUUeE5rZJGCh5vd/ftBTHeK+nt7v4nk48/JOlGd//IXMHKTiUVdg4XFu81gLm4++0ZhDkq6YqCxxskHSvVmKkkALj0PSbpajN7hZktkfR+SQ+WasziMwBc4tx93Mz+TNL3JTVK+pK7P1mqfdk1BgDA4sNUEgCgCIkBAFCExAAAKEJiAAAUITEAAIqQGAAARUgMAIAiJAYAQJH/Bw+gmbaFghdFAAAAAElFTkSuQmCC\n",
      "text/plain": [
       "<Figure size 432x288 with 3 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "D = dist_mat\n",
    "\n",
    "# Compute and plot dendrogram.\n",
    "fig = pylab.figure()\n",
    "axdendro = fig.add_axes([0.09,0.1,0.2,0.8])\n",
    "Y = sch.linkage(D, method='centroid')\n",
    "Z = sch.dendrogram(Y, orientation='right')\n",
    "axdendro.set_xticks([])\n",
    "axdendro.set_yticks([])\n",
    "\n",
    "# Plot distance matrix.\n",
    "axmatrix = fig.add_axes([0.3,0.1,0.6,0.8])\n",
    "index = Z['leaves']\n",
    "D = D[index,:]\n",
    "D = D[:,index]\n",
    "im = axmatrix.matshow(D, aspect='auto', origin='lower')\n",
    "axmatrix.set_xticks([])\n",
    "axmatrix.set_yticks([])\n",
    "\n",
    "# Plot colorbar.\n",
    "axcolor = fig.add_axes([0.91,0.1,0.02,0.8])\n",
    "pylab.colorbar(im, cax=axcolor)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "PCA(n_components=10)"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "pca = PCA(10)\n",
    "pca.fit(data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [],
   "source": [
    "data_pca = pca.transform(data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(15, 10)"
      ]
     },
     "execution_count": 16,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "data_pca.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [],
   "source": [
    "losses = np.array([0.388252169, 0.289999992, 0.061253563, 0.112696148, 0.471509963, 0.464949936, 0.428164989,\n",
    "                   0.318116993, 0.705128193, 0.212553501, 0.490662158, 0.52285713, 0.637268841, 0.454415947,\n",
    "                   0.159771755])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(-0.08441318130106498, 0.7648621656323589)\n",
      "(0.170553174848983, 0.5433706006163662)\n",
      "(0.037797839719343196, 0.8936106239588107)\n",
      "(0.42059076259824796, 0.11850791273365809)\n",
      "(0.0026670686163731694, 0.9924734383175551)\n",
      "(-0.25837123580578414, 0.3524852418745564)\n",
      "(-0.26461697238872334, 0.34054633704712595)\n",
      "(-0.3453863787426796, 0.20735519379301923)\n",
      "(0.22293371353859237, 0.4244984108063906)\n",
      "(0.6135417814038514, 0.014989626602006968)\n"
     ]
    }
   ],
   "source": [
    "for i in range(10):\n",
    "    R = pearsonr(data_pca[:, i], losses)\n",
    "    print(R)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {},
   "outputs": [],
   "source": [
    "dist_mat = distance_matrix(data_pca[:, :9], data_pca[:, :9])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "13\n",
      "9\n",
      "4\n",
      "3\n",
      "10\n",
      "7\n",
      "6\n",
      "8\n",
      "2\n",
      "14\n",
      "11\n",
      "0\n",
      "12\n",
      "1\n",
      "5\n"
     ]
    }
   ],
   "source": [
    "a = np.argsort(trans[:, 1])\n",
    "for i in range(15):\n",
    "    print(a[i])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "-2.7713237\n",
      "-1.5848564\n",
      "-1.2942537\n",
      "-1.1458896\n",
      "-0.96686363\n",
      "-0.8512446\n",
      "-0.6140935\n",
      "0.27170765\n",
      "0.27438506\n",
      "0.3201905\n",
      "1.0133637\n",
      "1.0717618\n",
      "1.2812381\n",
      "1.8232166\n",
      "3.1726623\n"
     ]
    }
   ],
   "source": [
    "a = np.sort(trans[:, 1])\n",
    "for i in range(15):\n",
    "    print(a[i])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "3.1475883\n",
      "4.669107\n",
      "3.3961842\n",
      "3.4729512\n",
      "3.7277327\n",
      "4.6251507\n",
      "4.637158\n",
      "3.6892009\n",
      "4.107788\n",
      "3.6550326\n",
      "3.6904097\n",
      "4.046842\n",
      "3.725337\n",
      "3.4583468\n",
      "3.2108207\n"
     ]
    }
   ],
   "source": [
    "# vector length\n",
    "for a in data:\n",
    "    print(np.linalg.norm(a, 2))"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
