{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "import torch\n",
    "from transformers import PegasusForConditionalGeneration, PegasusTokenizer\n",
    "from datasets import load_dataset\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "from nltk import sent_tokenize\n",
    "from utils import get_summary_indices, get_overlap_scores, visualize_summary\n",
    "from summa.summarizer import summarize\n",
    "from tqdm import trange"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "model_name = 'tuner007/pegasus_paraphrase'\n",
    "torch_device = 'cuda' if torch.cuda.is_available() else 'cpu'\n",
    "tokenizer = PegasusTokenizer.from_pretrained(model_name)\n",
    "model = PegasusForConditionalGeneration.from_pretrained(model_name).to(torch_device)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_response(input_text,num_return_sequences,num_beams):\n",
    "  batch = tokenizer(input_text,truncation=True,padding='longest',max_length=60, return_tensors=\"pt\").to(torch_device)\n",
    "  translated = model.generate(**batch,max_length=60,num_beams=num_beams, num_return_sequences=num_return_sequences, temperature=1.5)\n",
    "  tgt_text = tokenizer.batch_decode(translated, skip_special_tokens=True)\n",
    "  return tgt_text"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [],
   "source": [
    "df = pd.read_csv('~/user/textrank_test.csv').dropna().reset_index(drop=True)\n",
    "bart_df = pd.read_csv('~/user/bart_test.csv', index_col=0).dropna().reset_index(drop=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['James Best was best known for his portrayal of bumbling sheriff Rosco P. Coltrane on TV\\'s \"The Dukes of Hazzard\" He died in hospice in Hickory, North Carolina, of complications from pneumonia, a friend says.']"
      ]
     },
     "execution_count": 34,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "[sent_tokenize(bart_df.summary[0])[0]]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 50,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([ 0,  2, 11, 15, 16])"
      ]
     },
     "execution_count": 50,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "get_summary_indices(sent_tokenize(bart_df.article[2]), sent_tokenize(bart_df.summary[2]), top_k=2, tolerance=0.01)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 49,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['President Barack Obama took part in a roundtable discussion this week on climate change.',\n",
       " 'Obama: \"No challenge poses more of a public threat than climate change\" Obama encouraged ordinary citizens, doctors and nurses to start putting some pressure on elected officials \"to reduce the impacts of climate change.\"',\n",
       " 'He also issued a presidential proclamation declaring April 6-12 as National Public Health Week']"
      ]
     },
     "execution_count": 49,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "sent_tokenize(bart_df.summary[2])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 1000/1000 [13:51<00:00,  1.20it/s]\n"
     ]
    }
   ],
   "source": [
    "paraphrases = []\n",
    "idxs = []\n",
    "\n",
    "for i in trange(1000):\n",
    "    summ = df.summary[i]\n",
    "    summ = sent_tokenize(summ)\n",
    "    article = df.article[i]\n",
    "    article = sent_tokenize(article)\n",
    "    idx = get_summary_indices(article, summ, top_k=2, tolerance=0.1)\n",
    "    sentences = [article[x] for x in idx]\n",
    "    paraphrase = get_response(sentences, 1, 10)\n",
    "    paraphrased_article = article\n",
    "    \n",
    "    for j, k in enumerate(idx):\n",
    "        paraphrased_article[k] = paraphrase[j]\n",
    "\n",
    "    new_summ = summarize(' '.join(paraphrased_article), words=75)\n",
    "    new_summ = sent_tokenize(new_summ)\n",
    "    new_idx = get_summary_indices(paraphrased_article, new_summ, top_k=2, tolerance=0.1)\n",
    "\n",
    "    paraphrases.append((' '.join(paraphrased_article), ' '.join(new_summ)))\n",
    "    idxs.append((idx, new_idx))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "paraphrase_df = pd.read_csv('./paraphrase_df.csv', index_col=0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [],
   "source": [
    "different = [i for i in range(len(idxs)) if idxs[i][0].tolist() != idxs[i][1].tolist()]\n",
    "equal = [i for i in range(len(idxs)) if idxs[i][0].tolist() == idxs[i][1].tolist()]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(<Figure size 1296x288 with 2 Axes>, <AxesSubplot:>)"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAA70AAAD4CAYAAAAgoIHuAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/YYfK9AAAACXBIWXMAAAsTAAALEwEAmpwYAAAjMUlEQVR4nO3de7RkVX3g8e/vXh6iBFsRsniKUXonLsUEUWSCiYmChEmEJBrpaFrja9A1JB2HlVEjpIMJywRjCNoOCCa0GFsjMfgYJsQkGmPiC6EFFLYNtDY2Kj2Ea5xkRbHZ88fZV6qKqupz+97b93D4ftY6q6r22eecX+1bder+au+zK0opSJIkSZLURzMrHYAkSZIkScvFpFeSJEmS1FsmvZIkSZKk3jLplSRJkiT1lkmvJEmSJKm39lrpAJba+ohOT0d97tW/u9IhTLf//isdwXQHH7bSEeza9/5jpSN4cJvt+GkpZlc6gunuu3elI5gqDjhypUPYpXL3bSsdwlTx6KNWOoSpynfuXOkQpor9D1npEKYq3/vOSocwXcfPMQDM7rPSEUwV+65a6RCmigMeu9IhTLfvo1Y6gukedmCsdAhLpW1etb6Uzj/njv93KUmSJEna0/o0JNikV5IkSZI0pPPdtwtg0itJkiRJGmJPryRJkiSpt0x6JUmSJEm91fGpOxfEpFeSJEmSNMRreiVJkiRJveXwZkmSJElSby1X0ptSWg1sBA4E7gbW5py3jNQ5GTgfeDLwtpzz2SPrfwU4h6ZDugDPyTl/a9Ix+5TAS5IkSZKWQLRcdsPFwIac82pgA3DJmDq3A68ALhhdkVI6DlgPnJRzfhJwIvDtaQe0p1eSJEmSNKRt72hKaRWwasyquZzz3Ejdg4FjgZNq0Sbg7Smlg3LOO+br5ZxvrfVPH7Pf3wLeknP+Zq07NeEFe3olSZIkSSNmWy7AOmDrmGXdmN0eAWzPOe8EqLd31vK2ngj8SErpkyml61JKb0wpTe10tqdXkiRJkjRkAb2jFwKXjymfW5JAHmgWOIamt3gf4G+AbcC7J21g0itJkiRJGtL2et06hHmuZfU7gMNSSrM5550ppVng0Fre1jbgypzzd4HvppQ+BDydKUmvw5slSZIkSUNmWi4LkXO+C9gMrKlFa4DrB6/nbeG9wMkppUgp7Q08G/jitA3s6ZUkSZIkDVnG3tEzgY0ppXOBe4C1ACmlq4Fzc87XppROBN4HHABESukM4OU552tq+XHAl4H7gGuAd007oEmvJEmSJGnI7DLtN+d8C3D8mPJTB+5/Cjh8wvb3Aa+tSysmvZIkSZKkIX26DtakV5IkSZI0pO1EVg8GJr2SJEmSpCH29EqSJEmSesukV5IkSZLUWw5vliRJkiT11nLN3rwSTHolSZIkSUMc3ixJkiRJ6i2TXkmSJElSb3lNryRJkiSpt+zplSRJkiT1lkmvJEmSJKm3Zmb6M8DZpFeSJEmSNCTCpFeSJEmS1FP29EqSJEmSesueXkmSJElSb4U9vZIkSZKkvpqZ7c/8zSa9kiRJkqQhDm+WJEmSJPXWcg1vTimtBjYCBwJ3A2tzzltG6pwMnA88GXhbzvnsMftJwPXAO8atH9SfPmtJkiRJ0pKIiFbLbrgY2JBzXg1sAC4ZU+d24BXABeN2kFKardtd1eaAJr2SJEmSpCEzM9FqWYiU0sHAscCmWrQJODaldNBgvZzzrTnnzcD3J+zqdcBHga+0Oa7DmyVJkiRJQ9r24qaUVgGrxqyayznPjZQdAWzPOe8EyDnvTCndWct3tDzeU4DnAj8DnNNmG3t6JUmSJElDZmZnWi3AOmDrmGXdUseUUtobeCdw5nzi3IY9vZIkSZKkIQuYyOpC4PIx5XNjyu4ADkspzdZe3lng0FrexiHA44Grm3msWAVESumAnPOrJm1k0itJkiRJGtJ2eHMdwjzXsu5dKaXNwBrgPfX2+pxzq6HNOedtwGPmH6eU1gP772r2ZpNeSZIkSdKQ5frJIuBMYGNK6VzgHmAtQErpauDcnPO1KaUTgfcBB9D05J4BvDznfM3uHNCkV5IkSZI0ZDd/jmiXcs63AMePKT914P6ngMNb7Gt9m2Oa9EqSJEmShiz054i6zKRXkiRJkjSkzszcCya9kiRJkqQhyzW8eSWY9EqSJEmShkR/OnpNeiVJkiRJw+zplSRJkiT11jL+ZNEeZ9IrSZIkSRoy60RWkiRJkqS+cnizJEmSJKm3HN4sSZIkSeote3olSZIkSb1lT68kSZIkqbfs6ZUkSZIk9dbMXrMrHcKSMemVJEmSJA2zp1eSJEmS1Fde0ytJkiRJ6q2YmVnpEJaMSa8kSZIkaYgTWUmSJEmS+svhzZIkSZKkvpqZdfZmSZIkSVJPLddEViml1cBG4EDgbmBtznnLSJ2TgfOBJwNvyzmfPbDuHOAMYCdwL/CGnPM1047Zn6uTJUmSJElLYybaLQt3MbAh57wa2ABcMqbO7cArgAvGrPsc8LSc8zHAy4D3p5T2m3ZAe3olSZIkSUMi2vWPppRWAavGrJrLOc+N1D0YOBY4qRZtAt6eUjoo57xjvl7O+dZa//TRnY706t4ABE2v8dcnxWhPryRJkiRpSMxEqwVYB2wds6wbs9sjgO05550A9fbOWr471gK35ZwnJrxgT68kSZIkaUS0n8jqQuDyMeVzSxTKWCmlnwbexP29xhOZ9EqSJEmShrSdyKoOYZ5ruds7gMNSSrM5550ppVng0FreWkrpBOA9wGk557yr+g5vliRJkiQNWcDw5tZyzncBm4E1tWgNcP3g9by7klJ6GvB+4Pk55+vabGNPryRJkiRpSMTy/GQRcCawMaV0LnAPzXW5pJSuBs7NOV+bUjoReB9wABAppTOAl9dJrN4B7AdcklKa3+ev5ZxvnHRAk15JkiRJ0rCZ5RkUnHO+BTh+TPmpA/c/BRw+YfunLfSYJr2SJEmSpCELHbrcZSa9kiRJkqQhM+1nb+48k15JkiRJ0hB7eiVJkiRJ/bV8E1ntcSa9kiRJkqQh9vRKkiRJknorlmn25pVg0itJkiRJGrKMv9O7x5n0SpIkSZKGxF7O3ixJkiRJ6il7eiVJkiRJveVEVpIkSZKk/rKnV5IkSZLUV/b0SpIkSZL6y6RXkiRJktRXPRrdbNIrSZIkSRphT68kSZIkqa/s6ZUkSZIk9VePsl6TXkmSJEnSsJmVDmDpmPRKkiRJkobEzPJkvSml1cBG4EDgbmBtznnLSJ2TgfOBJwNvyzmfPbBuFrgIOAUowJtzzpdNO2aP8ndJkiRJ0lKIaLfshouBDTnn1cAG4JIxdW4HXgFcMGbdi4AnAEcDJwDrU0pHTTugSa8kSZIkadhMtFsWIKV0MHAssKkWbQKOTSkdNFgv53xrznkz8P0xu3khcGnO+b6c8w7gKuAF047r8GZJkiRJ0rCW+WxKaRWwasyquZzz3EjZEcD2nPNOgJzzzpTSnbV8R8vIjgS+NvB4W91+Int6JUmSJElDIqLVAqwDto5Z1q1U7KPs6ZUkSZIkDYnZ1kOXLwQuH1M+N6bsDuCwlNJs7eWdBQ6t5W1tAx4LfL4+Hu35fQCTXkmSJEnSsJY5bx3CPNey7l0ppc3AGuA99fb6em1uWx8AXplS+iDNDNCnA8+ctoFJryRJkiRp2G5OzdzCmcDGlNK5wD3AWoCU0tXAuTnna1NKJwLvAw4AIqV0BvDynPM1wBXA8cD8zxydl3PeOu2AJr2SJEmSpCHLlfPmnG+hSVpHy08duP8p4PAJ2+8EXr2QY5r0SpIkSZKGLfDniLrMpFeSJEmSNGT5RjfveSa9kiRJkqQhYU+vJEmSJKm3THolSZIkSb3Vo/HNJr2SJEmSpCE9ynmZWaodRcTVEbFqF3XOi4jn7Ob+nxURH92t4CRJkiRJ7UW0Wx4EFt3TGxEBRCnl1F3VLaWcu9jjSZIkSZKWVyxZ9+jKa/VUIuK1EXFTXdZFxFERkSPi3cBNwBER8dWIeEytf05d/6mI2BQRZ9fyyyPi+fX+VyPi9yLiuoi4MSJ+tJY/PSI+HRHXR8S/RERanqcuSZIkSRprJtotDwK77OmNiKcCvw4cDwTwWeAfgaOBl5RSPlPrzdd/GvDLwFOAvYHrgC9M2P3/LaUcGxGvAc4GXgHcAjyzlPL9OhT6/Lo/SZIkSdIeEA+SoctttBnefCLw16WUfweIiA8CzwS+Np/wjvhJ4EOllP8E/jMiPjJl3x+st18AfqnefySwMSKOBgpN4jxVRLwKeBXAzwNP3eVTkiRJkiRN9CDpxW1jMSO1/30Jjv/deruT+xPwNwEfL6U8CfgF4GG72kkp5Z2llONKKceZ8EqSJEnSIvVoIqs2Se8/AadHxMMj4hHAL9aySf4Z+IWIeFhE7E/T+boQjwS21/svXeC2kiRJkqTFeihd01tKuS4iLgc+V4suA+6ZUv/zEfFh4AbgW8CNwLcXENMf0QxvfiPwvxewnSRJkiRpKczMrnQES6bVTxaVUt4KvHWk+EkjdY4aePiWUsr6iHg48EnqRFallJeOq19KuRZ4Vr3/aWD1wL7eWMs/AXyiTbySJEmSpEV4kPTitrHo3+md4J0R8USa63E3llKuW6bjSJIkSZKWWo9+qHdZkt5Syq8ux34lSZIkSXuAPb2SJEmSpN56kMzM3IZJryRJkiRp2IzDmyVJkiRJfTW7PLM3p5RWAxuBA4G7gbU55y0jdWaBi4BTgAK8Oed8WV13MPDnwBHA3sDHgd/IOX9/0jH7k75LkiRJkpZGRLtl4S4GNuScVwMbgEvG1HkR8ATgaOAEYH1K6ai67g3AzTnnY4BjgKcCvzTtgPb0SpIkSZKGtUxoU0qrgFVjVs3lnOdG6h4MHAucVIs2AW9PKR2Uc94xUPWFwKU55/uAHSmlq4AXABfQ9Pz+UEppBtgX2AfYPi1Ge3olSZIkScNmZtotsA7YOmZZN2avRwDbc847AertnbV80JHA1wYebxuo8yZgNfAN4JvANTnnf576VFo+ZUmSJEnSQ0X74c0XAo8bs1y4TJG9ALgBOAQ4DPiplNLzp23g8GZJkiRJ0pBo+Tu9dQjzXMvd3gEcllKazTnvrBNWHVrLB20DHgt8vj4e7Pk9C3hZHfr87ZTSh4CfAa6cdFB7eiVJkiRJw2Zn2y0LkHO+C9gMrKlFa4DrR67nBfgA8MqU0kxK6SDgdO5ParfSzOpMSmkf4DnATdOOa9IrSZIkSRq2fLM3nwmclVL6Ck2v7ZkAKaWrU0rH1TpXALcDW4DPAOflnLfWdeuAZ6aUbqRJoL8CXDrtgA5vliRJkiQNm1me/tGc8y3A8WPKTx24vxN49YTtb+P+2Z9bMemVJEmSJA3bvV7cTjLplSRJkiQNM+mVJEmSJPXWAiep6jKTXkmSJEnSsJY/WfRgYNIrSZIkSRoW/fmhH5NeSZIkSdIwe3olSZIkSb3lRFaSJEmSpN5apt/pXQkmvZIkSZKkYSa9kiRJkqTeciIrSZIkSVJv9eeSXpNeSZIkSdIIJ7KSJEmSJPWWSa8kSZIkqbdMeiVJkiRJvWXSK0mSJEnqLZNeSZIkSVJvmfRKkiRJknrLpFeSJEmS1F/Lk/SmlFYDG4EDgbuBtTnnLSN1ZoGLgFOAArw553zZwPpfAc6pQRbgOTnnb0065sxSPwlJkiRJ0oPcTLRbFu5iYEPOeTWwAbhkTJ0XAU8AjgZOANanlI4CSCkdB6wHTso5Pwk4Efj2tAPa0ytJkiRJGtZyeHNKaRWwasyquZzz3Ejdg4FjgZNq0Sbg7Smlg3LOOwaqvhC4NOd8H7AjpXQV8ALgAuC3gLfknL8JkHOemvCCPb2SJEmSpAeIlgvrgK1jlnVjdnoEsD3nvBOg3t5ZywcdCXxt4PG2gTpPBH4kpfTJlNJ1KaU3ppSmZuj29EqSJEmShrWfyOpC4PIx5XNLFMmoWeAYmt7ifYC/oUmK3z1pA5NeSZIkSdKwlklvHcI813KvdwCHpZRmc84764RVh9byQduAxwKfr48He363AVfmnL8LfDel9CHg6UxJeh3eLEmSJEka1np0c3s557uAzcCaWrQGuH7kel6ADwCvTCnNpJQOAk4Hrqzr3gucnFKKlNLewLOBL047rkmvJEmSJGlYzLRbFu5M4KyU0leAs+pjUkpX15mZAa4Abge2AJ8Bzss5b63r3gfcBXyZJoH+EvCuaQd0eLMkSZIkaVj7a3oXJOd8C3D8mPJTB+7vBF49Yfv7gNfWpRWTXkmSJEnSsGVKeleCSa8kSZIkaVh/cl6TXkmSJEnSCHt6JUmSJEm9tXuTVHWSSa8kSZIkaZg9vZIkSZKk3upR0tufPmtJkiRJkkbY0ytJkiRJGtajnl6TXkmSJEnSMJNeSZIkSVJvOXuzJEmSJKm37OmVJEmSJPWWPb2SJEmSpP6yp1eSJEmS1FcOb5YkSZIk9ZbDmyVJkiRJvWXSK0mSJEnqL5NeSZIkSVJfeU2vJEmSJKm3THolSZIkSf21PElvSmk1sBE4ELgbWJtz3jJSZxa4CDgFKMCbc86XjdRJwPXAO3LOZ087Zn8GakuSJEmSlsbMbLtl4S4GNuScVwMbgEvG1HkR8ATgaOAEYH1K6aj5lTUpvgS4qs0B7emVJEmSJI1o19ObUloFrBqzai7nPDdS92DgWOCkWrQJeHtK6aCc846Bqi8ELs053wfsSCldBbwAuKCufx3wUWD/ukxlT68kSZIkaVjMtFtgHbB1zLJuzF6PALbnnHcC1Ns7a/mgI4GvDTzeNl8npfQU4LnAn7R9Kvb0SpIkSZKGRPuJrC4ELh9TPrdEofxASmlv4J3Ar+ecdzaX9e6aSa8kSZIkaUS7pLcOYZ5rudM7gMNSSrM1aZ0FDq3lg7YBjwU+Xx/P9/weAjweuLomvKuASCkdkHN+1aSDmvRKkiRJkobF0l8Jm3O+K6W0GVgDvKfeXj9yPS/AB4BXppQ+SDPL8+nAM3PO24DHzFdKKa0H9nf2ZkmSJEnSwrS/pnehzgTOSil9BTirPialdHVK6bha5wrgdmAL8BngvJzz1t19Kvb0SpIkSZKGLUNPL0DO+Rbg+DHlpw7c3wm8usW+1rc5pkmvJEmSJGlE64msOs+kV5IkSZI0rP3szZ1n0itJkiRJGrZMw5tXgkmvJEmSJGmEPb2SJEmSpL6K2ZWOYMmY9EqSJEmShnlNryRJkiSpt0x6JUmSJEn95URWkiRJkqS+sqdXkiRJktRb/mSRJEmSJKm/7OmVJEmSJPWVw5slSZIkSf3l8GZJkiRJUl/Z0ytJkiRJ6i+TXkmSJElSXzl7syRJkiSptxzeLEmSJEnqL5NeSZIkSVJfLVNPb0ppNbAROBC4G1ibc94yUmcWuAg4BSjAm3POl9V15wBnADuBe4E35JyvmXbM/gzUliRJkiQtkZmWy4JdDGzIOa8GNgCXjKnzIuAJwNHACcD6lNJRdd3ngKflnI8BXga8P6W037QD2tMrSZIkSRrWsqc3pbQKWDVm1VzOeW6k7sHAscBJtWgT8PaU0kE55x0DVV8IXJpzvg/YkVK6CngBcMFIr+4NNOOwDwS+PilGe3olSZIkSSNa9/SuA7aOWdaN2ekRwPac806AentnLR90JPC1gcfbxtQBWAvclnOemPCCPb2SJEmSpBHR/preC4HLx5TPLVEoY6WUfhp4E/f3Gk9k0itJkiRJGtEu6a1DmOda7vQO4LCU0mzOeWedsOrQWj5oG/BY4PP18VDPb0rpBOA9wGk557yrgzq8WZIkSZI0LKLdsgA557uAzcCaWrQGuH7kel6ADwCvTCnNpJQOAk4HrgRIKT0NeD/w/JzzdW2Oa0+vJEmSJGnEsv1O75nAxpTSucA9NNflklK6Gjg353wtcAVwPDD/U0bn5Zy31vvvAPYDLkkpze/z13LON046oEmvJEmSJGlYzC7LbnPOt9AktKPlpw7c3wm8esL2T1voMU16JUmSJEnDFjh0uctMeiVJkiRJI0x6JUmSJEl9ZU+vJEmSJKm/THolSZIkSX1lT68kSZIkqbeWafbmlWDSK0mSJEkaYU+vJEmSJKmvHN4sSZIkSeqv/iS9UUpZ6Rg6LSJeVUp550rHMYnxLU7X44Pux2h8i2N8i9P1+KD7MRrf4hjf4nU9RuNbHONTF8ysdAAPAq9a6QB2wfgWp+vxQfdjNL7FMb7F6Xp80P0YjW9xjG/xuh6j8S2O8WnFmfRKkiRJknrLpFeSJEmS1FsmvbvW9TH+xrc4XY8Puh+j8S2O8S1O1+OD7sdofItjfIvX9RiNb3GMTyvOiawkSZIkSb1lT68kSZIkqbdMeiVJkiRJvfWQTHoj4qsRcWNEbI6Ia8esj4i4KCJujYgbIuLYWp4i4gu17IRatldE/F1EPHwR8fxZRNwVETcNlD06Ij4WEVvq7aMmbPuSWmdLRLyklu0bEX8TETdFxGsG6r5z/rksUYzrI2J7bcfNEXHqhG1PiYhc2/N1A+V/Udvy/IGyN0bE6QuM7YiI+HhEfDkivhQRv1nLO9OGU2LsShs+LCI+FxFfrPH9Xi1/XER8th73/RGxz4TtX1/r5Ih4bi07KCI+Vdvw9IG6H4qIQ5covssjYutA+/34hO331PtkNiKuj4iP1sedaL8p8XWt/R5wbu7Y+3hcfJ14D9ftVkXElRFxS0TcHBEndKz9xsXXifaL5vN988DybxGxrivtNyW+TrRf3e63ojk/3xQRm6I5bz8uunUOHBdjZ86DEfGbdV9fioh1tawTr8Ep8a3oazAW8D90NB7w//2YfT41mnP9rbV+1PI/rNu9e6Dui+fbQh1XSnnILcBXgcdMWX8q8H+AAJ4BfLaWvxU4ETgc+Ktadhbw0kXG81PAscBNA2V/BLyu3n8d8Idjtns0cHu9fVS9/yjgecAbab7U+HSt+xTgXUsc43rg7F1sNwvcBvwIsA/wReCJwDHAZbXOx4BHAocAH9mN2A4Bjq33fwj4Sj1GZ9pwSoxdacMA9q/39wY+W1/7fwmcUcsvBl49Ztsn1pj2BR5XY50FfgN4MfBw4BO17i8A65cwvsuB5+9i2z35Pnkt8F7go/VxJ9pvSnxda7+vMnJuplvv43HxracD7+G6j43AK+r9fYBVHWu/cfF1pv1GjvdN4LFdar8J8XWi/YDDgK3AfvXxXwIvpUPnwCkxXk4HzoPAk4Cb6vPdC/g74AldeQ1OiW9FX4Ms4H9oJvx/P2afn6vro9b/uRrbx+r6y4AnA/sBfw/svZj3tMueWR6SPb0tnAa8uzQ+A6yKiEOAe2ne7A8H7o2IVTQn4HdP3FMLpZRPAv86JoaN9f5G4PQxmz6X5g34r6WUe2hOGKcMxLk3zRsW4E3AOUscYxtPB24tpdxeSvke8D6a53YvsF9EzNQ4dwLnAb+7G7F9o5RyXb3/HeBmmg+3zrThlBjb2BNtWEop/68+3LsuBfhZ4MpaPqkNTwPeV0r5billK3BrjXm+DfcFdkbEXsA6mg+jpYqvjT3yN46Iw4H/SvNhSP1muBPtNy6+Bdhj55kJOvM+XoRlfw9HxCNp/vl7F0Ap5XullDk60n5T4mtj2dtvxLOB20opX6Mj7Tclvjb2VPvtVfe3F83z/gYdOgdOiPHOltvtib/xj9EkYf9RSvk+8I/AL9Gd1+Ck+NpYttfgAv+HnvT//Q/UxweUUj5TSik0/+OfDtwH7F0/2x9eYz8beFsp5d628WrlPFST3gL8bTRDlV81Zv1hwB0Dj79eyzYAb6B5A51Pc9I4v5Ry3zLE+MOllG/U+98EfngBcX4MOAr4DHBRRDwPuK6U0vbkvhD/vQ71+LMJQ27GxlhKuRnYAVwHfITm28KZ+cRwd0XEUcBP0PQEdrINR2KEjrRhNENfNwN30Tz/24C5+uH2g+O2jY+mR/G0uq/zgdcAV5RS/mMp4iulzLffH9T2+5OI2HcB8S313/hC4LdpPhgBDqRD7TcmvnldaT8Yf27u0vt40mdHF97Dj6v7+vNohrBfFhGPoDvtNyk+6Eb7DToD2FTvd6X9JsUHHWi/Usp24C3ANppk99vAF+jQOXBcjKWUv62ru3AevAl4ZkQcGM0lc6cCR9Cd1+Ck+KADr8ERk9psUjuNxvr1MbF+B7gauJ77X+PHl1KuWmSs2kP2WukAVsiJpZTtEXEw8LGIuKV+UzRVKWUb8CyAiHgCzTDnmyPiCprhGueUUr6y1MGWUkpEtO3Von7A/GqNc2/gGuC0iHgrcCTNt1wfXoLQ/hfNN4al3v4x8LIFxLlu/n5EfAT4bxHxOzRDbz5WSrl0IcFExP7AXwHrSin/Vi/BmD9WJ9pwTIydacNSyk7gx+sIhr8GfrTtthP2922ankXqh+DrgF+MiEtphl39cSnl07sbX0Q8CXg9zQfaPjS/s/c/ab4lbrO/JfsbR8TPA3eVUr4QEc9q+5x2Ed+Std+U+DrRfgMecG4eOeZKv4/HxdeV9/BeNEP8ziqlfDYi/pTmNTN4rJVsv0nxvZ1utN/8PvahGRL6+jHHWunX37j4OvH6q+eo02i+3JgDPkDT07jblvozZFyMEfFiOnIeLKXcHBF/CPwt8O/AZpqez8E6K/YanBJfJ16DU/a/oDbbxb7+iDrSICIuA86NiFcAJwM3lFJ+fymOo+XxkOzprd/2UUq5i+af+6ePVNnO/d9eQZPcbh+p8wc010n8Bs1wwd9m8UOqBn0r6pCLenvXmDpt4nwNzdCMZ9B8K/VC4H8sRYCllG+VUnbWnu5LeWA7tooxIk6j+UZ4f+DxpZRfAZ4fC5gcrJ7M/wr4i1LKB2txp9pwXIxdasN5pRly+HHgBJqhP/Nfjo1rm1bx0YyK+ANgDfAp4CU01wEt2EB8p5Rm2HgppXwX+HN2s/1Y/N/4J4HnRcRXaYZt/Szwp3Sn/R4QX0S8p0PtB0w8N3fmfTwuvg69h78OfL3cPwLiSpoksyvtNza+DrXfvJ+j6Qn7Vn3clfYbG1+H2u85wNZSyo7SDPX8IM15pyvnwEkx/pcunQdLKe8qpTy1lPJTwD0083905jU4Lr4OvQYHTWqzNu20vZZPi/UnaIaLZ+AFNdbHR8TRuxGr9pCHXNIbEY+IiB+av0/z7cxNI9U+DKyNxjNohsB8Y2AfPw3cWUrZQjOu/7667M4bc5IP05zUqbcfGlPnGuDkiHhU/Qbz5Fo2H+ejgJ+nOcnNx1loLrxftBi+DuIXeWA7AnweODqaGRz3oRmW9YNvFWsiuI7mm7P9uP86zVmab13bxBE014ndXEp568CqzrThpBg71IYH1R5UImI/4CSa644/Djy/VpvUhh8GzohmlsjHAUfTTAIxv++jgcNLKZ9gN9twQny3DHyoBc01N+Pab9n/xqWU15dSDi+lHEXz9/mHUsqL6Ej7TYjvxV1pv7qfSefmTryPJ8XXlfdwKeWbwB0RkWrRs4Ev05H2mxRfV9pvwBqGhw53ov0mxdeh9tsGPCMiHl7PJ/Ovv06cA6fEeHPHzoMH19sjaa6XfS8deg2Oi69Dr8FBk9ps6v/30MzBAvxbRDyjvibW8sA2n78ueu8aIyx9HqClVjowm9aeXGhmjvtiXb4E/E4tPxM4s94Pmut3bwNuBI4b2D5orpF4dH38YzTXItwA/ORuxrSJ5vqAe2m+DX85zfWAfw9soZkhb/54x1FnuquPX0Yz6cOtwK+P7PdPgGfV+w+jGZLyJZrhZUsR4xW1fW6gOZEcUuseClw9sO2pNN9W3jbf3gPr1lFnv65tu6nu8wGzE06J7USaE+QNNMNtNtdjdqYNp8TYlTY8huY6lRtoPrDOHXi/fK62zQeAfWv584DzBrb/nRpbBn5uZN9/CRxd7x8M/Ettw19egvj+oT7Xm4D3cP8MzyvyPqn7eBb3z47cifabEl9n2o/J5+ZOvI+nxNeJ93Dd9seBa2ssV9EMAe1E+02Jr0vt9wjgbuCRA2Vdar9x8XWp/X4PuIXmfHIFzQRUnToHToixS+fBf6L5suCLwLM7+BocF9+KvgZZ2P/Q0/6/3zxw/7j6eriN5hKMGFh3OgMziNNcJ34jzSi+Bb0eXfbsEvUPJkmSJElS7zzkhjdLkiRJkh46THolSZIkSb1l0itJkiRJ6i2TXkmSJElSb5n0SpIkSZJ6y6RXkiRJktRbJr2SJEmSpN76/6++NUHp3L0BAAAAAElFTkSuQmCC",
      "text/plain": [
       "<Figure size 1296x288 with 2 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "visualize_summary(df.article.iloc[:1000], [df.summary.iloc[:1000]], summary_labels=['original'], num_bins=20, tokenize=True, amortize=True, figsize=(18,4))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [],
   "source": [
    "paraphrase_df = pd.DataFrame(paraphrases, columns=['article', 'summary'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(<Figure size 1296x288 with 2 Axes>, <AxesSubplot:>)"
      ]
     },
     "execution_count": 26,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAA9IAAAD4CAYAAAAATN4TAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/YYfK9AAAACXBIWXMAAAsTAAALEwEAmpwYAAAgQ0lEQVR4nO3df5QlZX3n8fenZ5iRHwaQRBcBAyvEDWrWKCJujCGyIrgJQxJI0HjEDcloXEzYxDUYlSAxnkN+SH7IZjMKESERCcY4xkkQRdfEReSH/BqQMCArAyoqiEFX+fXdP6pars3t21XTPberzft1Tp2u+9ynqr799L11+3ufp55KVSFJkiRJkrqZWe4AJEmSJElaSUykJUmSJEnqwURakiRJkqQeTKQlSZIkSerBRFqSJEmSpB5WL3cAK9GpyeCnOn/Tu1+z3CFMlB/cZ7lDmGzN2uWOYLJVq5Y7gsm+cd9yR7Cwx37fckcw2dqBvwbvG/bfOP/uycsdwkR167XLHcJkP/jDyx3Bwr70ueWOYLLdv3+5I1hAljuAyR741nJHMNnA73qTXfda7hAWtvOeyx3BRHnsk5Y7hMkes8fA38Td9MmrTq0a1O9sIi1JkiRJmrqVPDzaRFqSJEmSNHWD6mLuyURakiRJkjR19khLkiRJktSDibQkSZIkST0MfPrciUykJUmSJElT5zXSkiRJkiT14NBuSZIkSZJ6MJGWJEmSJKkHh3ZLkiRJktSDPdKSJEmSJPXgrN2SJEmSJPVgj7QkSZIkST14jbQkSZIkST3YIy1JkiRJUg8m0pIkSZIk9eBkY5IkSZIk9WCPtCRJkiRJPTjZmCRJkiRJPdgjLUmSJElSDybSkiRJkiT14NBuSZIkSZJ6cNZuSZIkSZJ6cGi3JEmSJEk9mEhLkiRJktSD10hLkiRJktSDPdKSJEmSJPVgIi1JkiRJUg8zMyt3cLeJtCRJkiRp6pKVm0iv5N50SZIkSdIKNTOTzksXSY5IclOSLUlOHvP885NcleTBJMeMlD8jyaVJNie5NskvLHQse6QlSZIkSVO3lD3SSVYBZwIvBLYClyfZWFU3jFT7PPAK4LVzNv8m8PKqujnJE4Erk1xUVV+b73gm0pIkSZKkqcvSXiN9MLClqm4FSHI+sA74TiJdVbe1zz08umFV/cvI+p1J7gJ+APjafAczkZYkSZIkTd3Mqu5XGidZD6wfKdpQVRtGHu8F3D7yeCvwnL4xJTkYWAPcMqmeibQkSZIkaer6DO1uk+YNC1ZchCR7AucCx1fVw5PqmkhLkiRJkqZuiYd23wHsM/J477asWyzJ9wEfAt5QVZ9aqL6zdkuSJEmSpi5J56WDy4EDkuyXZA1wHLCxYxxrgPcD766qC7tsYyItSZIkSZq6pbz9VVU9CJwIXATcCFxQVZuTnJbkKIAkz06yFTgW+Iskm9vNfx54PvCKJFe3yzMmHc+h3ZIkSZKkqVvK218BVNUmYNOcslNG1i+nGfI9d7vzgPP6HMtEWpIkSZI0dX1m7R4aE2lJkiRJ0tQt8WRjU2UiLUmSJEmauqUe2j1NJtKSJEmSpKmzR1qSJEmSpB7skZYkSZIkqYcut7UaKhNpSZIkSdLUOWu3JEmSJEk9OLRbkiRJkqQesnI7pE2kJUmSJEnTZ4+0JEmSJEk9ePsrSZIkSZJ6WOVkY5IkSZIkdefQbkmSJEmSenBotyRJkiRJPdgjLUmSJElSD/ZIS5IkSZLUgz3SkiRJkiT1MLN61XKHsM1MpCVJkiRJ02ePtCRJkiRJ3XmNtCRJkiRJPWRmZrlD2GYm0pIkSZKkqXOyMUmSJEmS+nBotyRJkiRJ3c2sctZuSZIkSZI6W8mTja3cq7slSZIkSSvXTLovHSQ5IslNSbYkOXnM889PclWSB5McM+e545Pc3C7HL3Qse6QlSZIkSVOXLF2/bpJVwJnAC4GtwOVJNlbVDSPVPg+8AnjtnG0fB/wOcBBQwJXttvfMdzx7pCVJkiRJU5eZdF46OBjYUlW3VtX9wPnAutEKVXVbVV0LPDxn2xcBF1fV3W3yfDFwxKSD2SMtSZIkSZq69JhsLMl6YP1I0Yaq2jDyeC/g9pHHW4HndNz9uG33mrSBibQkSZIkaer6TDbWJs0bFqw4JQ7tliRJkiRN3RIP7b4D2Gfk8d5t2XbZ1kRakiRJkjR1STovHVwOHJBkvyRrgOOAjR1DuQg4PMnuSXYHDm/L5mUiLUmSJEmavpmZ7ssCqupB4ESaBPhG4IKq2pzktCRHASR5dpKtwLHAXyTZ3G57N/C7NMn45cBpbdm8vEZakiRJkjR1fa6R7qKqNgGb5pSdMrJ+Oc2w7XHbng2c3fVYJtKSJEmSpKmb6TFr99CYSEuSJEmSpm6pe6SnyURakiRJkjR93SYRGyQTaUmSJEnS1NkjLUmSJElSD+kwG/dQmUhLkiRJkqau4/2hB8lEWpIkSZI0dVntrN2SJEmSJHVmj7QkSZIkST042ZgkSZIkSX3YIy1JkiRJUnf2SEuSJEmS1IeJtCRJkiRJ3a3gkd0m0pIkSZKkZWCPtCRJkiRJ3dkjLUmSJElSHys4kzaRliRJkiRN38xyB7DtTKQlSZIkSVOXmZWbSZtIS5IkSZKmbgWP7DaRliRJkiQtA2ftliRJkiSph5WbR5tIS5IkSZKmLyt4bLeJtCRJkiRp6rLKRFqSJEmSpO5Wbh5tIi1JkiRJWgYreGj3yr1xlyRJkiRpxUq6L932lyOS3JRkS5KTxzy/Nsl72+cvS7JvW75DknOSXJfkxiSvX+hYJtKSJEmSpOmbSfdlAUlWAWcCRwIHAi9JcuCcaicA91TV/sAZwOlt+bHA2qp6OvAs4JWzSfa8off5PSVJkiRJWgpL3CN9MLClqm6tqvuB84F1c+qsA85p1y8EDkszdXgBOydZDewI3A98fdLBTKQlSZIkSVOXmXRfkvVJrhhZ1s/Z3V7A7SOPt7ZlY+tU1YPAvcAeNEn1N4AvAJ8H/rCq7p4Uu5ONSZIkSZKmr8OQ7VlVtQHYsJ0iORh4CHgisDvwT0k+UlW3zreBPdKSJEmSpOlb2rHddwD7jDzeuy0bW6cdxr0r8FXgpcA/VtUDVXUX8EngoEkHM5GWJEmSJE3dEl8jfTlwQJL9kqwBjgM2zqmzETi+XT8GuKSqimY49wuamLIzcAjw2UkHG1wineTQJH+/jMd/V5Jjluv4kiRJkvRvwhJm0u01zycCFwE3AhdU1eYkpyU5qq12FrBHki3AbwCzt8g6E9glyWaahPwvq+raScfbrtdIJ1nd/kLbY9+rquqh7bFvSZIkSdL2lSXu1q2qTcCmOWWnjKx/i+ZWV3O3u29c+SQLhp5k3ySfTfJX7c2pL0yyU5JTklye5PokG9ppw0ny8SR/nOQK4NeT/HR7s+vPJPlIkie09U5Ncm6SS5PcnORXRg67S3uc2ePO7vu2JKcnuQo4NsmvtDFck+R9SXZq6x3bxnVNkk+0ZauS/EFb/9okr2zLk+Tt7Y27PwI8vk8DSpIkSZK2wRLeR3rauvZIPwU4oao+meRs4NXA26vqNIAk5wI/BXywrb+mqg5qn9sdOKSqKskvA68DfrOt9yM04893Bj6T5ENt+Y8CTwXupLnQ+8eAf26f+2pVPbPd9x5V9Y52/S00N9j+M+AU4EVVdUeS3drtTgDurapnJ1kLfDLJh9tjPYXmpt1PAG4Azu7YLpIkSZKkbZCOFz8PUdfO9Nur6pPt+nnA84CfbHuar6O5MPupI/XfO7K+N3BRW+9/zKn3gar6f1X1FeBjNNOOA3y6qrZW1cPA1cC+8+z7aUn+qd33L47s+5PAu9pe7lVt2eHAy5NcDVxGc7+wA4DnA++pqoeq6k7gknENMHrfsivHt5EkSZIkqasV3CPdNZGuMY//J3BMVT0deAfwmJHnvzGy/mc0vddPB145p964/QJ8e6TsIb6753x03+8CTmz3/ebZfVfVq4A30kxtfmWSPYAAr6mqZ7TLflX14fl/5TmBVW2oqoOq6qBndd1IkiRJkjTeEk/bPU1dE+knJXluu/5SHhlm/ZUku9BMHT6fXXnk/l3Hz3luXZLHtInuoTQzpPXxWOALSXag6ZEGIMmTq+qy9sLyL9Mk1BcBv9rWJckPtVObfwL4hfYa6j2Bn+wZgyRJkiSprxXcI931GumbgP/WXh99A/DnwO7A9cAXmZwAnwr8TZJ7aIZN7zfy3LU0Q7q/H/jdqrozyQ/1iP9NNMO0v9z+fGxb/gdJDqDphf4ocE17rH2Bq9rJy74MHA28n2Zo+g009w+7tMfxJUmSJEnbYmbVwnUGqmsi/WBVvWxO2Rvb5btU1aFzHn8A+MA8+722ql4+p/7HgY+PPD5xZH3fOXX/nCapnxvDz445VgG/3S5znTimTJIkSZK0vQywp7mr7XofaUmSJEmSxlrqG0lP0YKJdFXdBjxtqQ9cVacu9T4lSZIkSSuEPdKSJEmSJPUwwNm4uzKRliRJkiRN38z38NBuSZIkSZKW3Krv/Vm7JUmSJElaOg7tliRJkiSpBxNpSZIkSZJ68BppSZIkSZJ6sEdakiRJkqTu4n2kJUmSJEnqwVm7JUmSJEnqwaHdkiRJkiT14GRjkiRJkiT1YI+0JEmSJEk9mEhLkiRJktSDk41JkiRJktSDt7+SJEmSJKmHrNzJxlZu5JIkSZKklWsm3ZcOkhyR5KYkW5KcPOb5tUne2z5/WZJ9R577kSSXJtmc5Lokj5kYet/fVZIkSZKkRUu6LwvuKquAM4EjgQOBlyQ5cE61E4B7qmp/4Azg9Hbb1cB5wKuq6qnAocADk45nIi1JkiRJmr6Zme7Lwg4GtlTVrVV1P3A+sG5OnXXAOe36hcBhSQIcDlxbVdcAVNVXq+qhiaH3+DUlSZIkSVoaS5tI7wXcPvJ4a1s2tk5VPQjcC+wB/BBQSS5KclWS1y10MCcbkyRJkiRNX4/JxpKsB9aPFG2oqg1LFMlq4HnAs4FvAh9NcmVVfXTSBpIkSZIkTVePu1+1SfOkxPkOYJ+Rx3u3ZePqbG2vi94V+CpN7/UnquorAEk2Ac8E5k2kHdotSZIkSZq+JZxsDLgcOCDJfknWAMcBG+fU2Qgc364fA1xSVQVcBDw9yU5tgv0TwA2TDmaPtCRJkiRp+rolyJ1U1YNJTqRJilcBZ1fV5iSnAVdU1UbgLODcJFuAu2mSbarqniRvo0nGC9hUVR+adDwTaUmSJEnS9C1hIg1QVZuATXPKThlZ/xZw7DzbnkdzC6xOTKQlSZIkSdO3xIn0NJlIS5IkSZKmz0RakiRJkqQeTKQlSZIkSerBRFqSJEmSpD5MpCVJkiRJ6m7GRFqSJEmSpO4c2i1JkiRJUh8m0pIkSZIkdWePtCRJkiRJPZhIS5IkSZLUw8rNo02kJUmSJEnLIDPLHcE2M5GWJEmSJE2fQ7slSZIkSerBRFqSJEmSpB5Wbh5tIi1JkiRJWgb2SEuSJEmS1IOTjUmSJEmS1IM90pIkSZIk9bCCE+mV25cuSZIkSdIysEdakiRJkjR9K7hH2kRakiRJkjR9JtKSJEmSJPXgrN2SJEmSJPVgj7QkSZIkST3YIy1JkiRJUh8rt0d65X4FIEmSJElauZLuS6fd5YgkNyXZkuTkMc+vTfLe9vnLkuw75/knJbkvyWsXOpaJtCRJkiRp+jLTfVloV8kq4EzgSOBA4CVJDpxT7QTgnqraHzgDOH3O828D/qFL6CbSkiRJkqTpW8JEGjgY2FJVt1bV/cD5wLo5ddYB57TrFwKHJU13d5Kjgc8Bm7sczERakiRJkrQMZjovSdYnuWJkWT9nZ3sBt4883tqWja1TVQ8C9wJ7JNkF+C3gzV0jd7IxSZIkSdL09bj9VVVtADZsp0hOBc6oqvvSMSYTaUmSJEnS9C3tfaTvAPYZebx3WzauztYkq4Fdga8CzwGOSfL7wG7Aw0m+VVVvn+9gJtKSJEmSpGWwpIn05cABSfajSZiPA146p85G4HjgUuAY4JKqKuDHvxNRcipw36QkGkykJUmSJEnLYWbVku2qqh5MciJwEbAKOLuqNic5DbiiqjYCZwHnJtkC3E2TbG8TE2lJkiRJ0jJY0h5pqmoTsGlO2Skj698Cjl1gH6d2OZaJtCRJkiRp+rrd1mqQTKQlSZIkSVPXdYbsITKRliRJkiQtAxNpSZIkSZK6c2i3JEmSJEk9mEhLkiRJktSDibQkSZIkSX14jbQkSZIkSd05a7ckSZIkST04tFuSJEmSpD7skZYkSZIkqbusWu4ItpmJtCRJkiRp+rxGWpIkSZKkHkykJUmSJEnqw8nGJEmSJEnqzh5pSZIkSZJ68PZXkiRJkiT1YY+0JEmSJEndObRbkiRJkqQ+HNotSZIkSVJ39khLkiRJktSHibQkSZIkSd05a7ckSZIkST04tFuSJEmSpD5MpCVJkiRJ6m4F90iv3EHpkiRJkqQVbKbHsrAkRyS5KcmWJCePeX5tkve2z1+WZN+2/IVJrkxyXfvzBV0ilyRJkiRpupLuy4K7yirgTOBI4EDgJUkOnFPtBOCeqtofOAM4vS3/CvDTVfV04Hjg3IWOZyItSZIkSVoGS9ojfTCwpapurar7gfOBdXPqrAPOadcvBA5Lkqr6TFXd2ZZvBnZMsnahyCVJkiRJmqokfZb1Sa4YWdbP2d1ewO0jj7e2ZWPrVNWDwL3AHnPq/BxwVVV9e1LsTjYmSZIkSVoG3Scbq6oNwIbtFwskeSrNcO/DF6prj7QkSZIkafqW8Bpp4A5gn5HHe7dlY+skWQ3sCny1fbw38H7g5VV1y0IHM5GWJEmSJC2D9FgWdDlwQJL9kqwBjgM2zqmzkWYyMYBjgEuqqpLsBnwIOLmqPtnlYCbSkiRJkqTpy6ruywLaa55PBC4CbgQuqKrNSU5LclRb7SxgjyRbgN8AZm+RdSKwP3BKkqvb5fGTjuc10pIkSZKk6es2ZLuzqtoEbJpTdsrI+reAY8ds9xbgLX2OZSItSZIkSVoGS5tIT5OJtCRJkiRp+pa4R3qaTKQlSZIkScvARFqSJEmSpO7skZYkSZIkqYcOs3EPlYm0JEmSJGkZ2CMtSZIkSVJ3Du2WJEmSJKmPlZtIp6qWOwYBSdZX1YbljmM+xrc4xrc4Q48Phh+j8S2O8S3O0OOD4cdofItjfIs39BiNT9M2s9wB6DvWL3cACzC+xTG+xRl6fDD8GI1vcYxvcYYeHww/RuNbHONbvKHHaHyaKhNpSZIkSZJ6MJGWJEmSJKkHE+nhGPo1E8a3OMa3OEOPD4Yfo/EtjvEtztDjg+HHaHyLY3yLN/QYjU9T5WRjkiRJkiT1YI+0JEmSJEk9mEhLkiRJktSDifR2lOS2JNcluTrJFWOeT5I/TbIlybVJntmWPyXJlW3Zc9uy1Uk+kmSnRcRzdpK7klw/Uva4JBcnubn9ufs82x7f1rk5yfFt2dok/5jk+iSvHqm7YfZ3WYL4Tk1yR9uGVyd58TzbHpHkprYtTx4p/6u2Hd86UvbGJEdvQ3z7JPlYkhuSbE7y6235INpwQnyDaMMkj0ny6STXtPG9uS3fL8ll7XHfm2TNPNu/vq1zU5IXtWU/kOSf2/Y7eqTuB5I8sU98C8T4riSfG2nDZ8yz/XZ/n7TbrkrymSR/3z4eTBvOE99g2i9jzstDeQ9PiG8Q7+F2u92SXJjks0luTPLcIbXfhBgH0YZpPt+vHlm+nuSkobThhPgG0X7tdv89zfn5+iTvSXPe3i8DOQfOE9+QzoG/3u5rc5KT2rJBvP4WiHHZXoPp8f9zGo/6337MPp+V5ly/pa2ftvz0drt3j9R92Ww7aGCqymU7LcBtwPdPeP7FwD8AAQ4BLmvL3wY8D9gbeF9b9hrgFYuM5/nAM4HrR8p+Hzi5XT8ZOH3Mdo8Dbm1/7t6u7w4cBbyR5guZS9u6/xE4awnjOxV47QLbrQJuAf49sAa4BjgQ+BHgnW2di4FdgT2BD25jfHsCz2zXHwv8S3ucQbThhPgG0Ybt63yXdn0H4LL2dX8BcFxb/r+AXx2z7YFtTGuB/dpYVwG/BrwM2An4eFv3p4FTt/FvPF+M7wKOWWDbqbxP2u1/A/hr4O/bx4Npw3niG0z7Mea8zEDewxPiO5UBvIfbfZwD/HK7vgbYbUjtNyHGwbThnON9EfjBobXhmPgG0X7AXsDngB3bxxcAr2Ag58AJ8b2LAZwDgacB17e/62rgI8D+Q3r9TYhx2V6D9Pj/mXn+tx+zz0+3z6etf2Qb18Xt8+8Eng7sCHwU2GEx72eX7bPYI7281gHvrsangN2S7Ak8QHMC2Ql4IMluNCf1d8+7pw6q6hPA3WNiOKddPwc4esymL6J5Y99dVffQnISOGIlzB5oTAcDvAm9awvi6OBjYUlW3VtX9wPk0v9cDwI5JZtoYHwJOA35nG+P7QlVd1a7/K3AjzYfmINpwQnxdbPc2bF/n97UPd2iXAl4AXNiWz9d+64Dzq+rbVfU5YEsb82z7rQUeSrIaOInmA663CTF2MZX3SZK9gf9C8yFL+y32YNpwbnw9TKX95jGI9/Aibff3cJJdaf6hPAugqu6vqq8xoPabEGMXU/ksGXEYcEtV/V8G1IbzxNfFtNpvdbu/1TS/9xcY0DlwTHx3dtxuGn/fH6ZJ7L5ZVQ8C/xv4WYb1+psvxi62y2uw5//P8/1v/x3t4++rqk9VVdH8f3808DCwQ/u5vlMb92uBP6uqB7o1gabJRHr7KuDDaYZprx/z/F7A7SOPt7ZlZwK/TfPGfCvNyeitVfXwdojxCVX1hXb9i8ATesR5MbAv8CngT5McBVxVVV0/NLo6sR3mcvY8w43GxldVNwJfBq4CPkjzjebMbLK5GEn2BX6UpsdycG04Jz4YSBumGfJ7NXAXze9+C/C19sPyO8ftGh9Nr+e6dl9vBV4NnFtV39yW+MbFWFWzbfh7bRuekWRtjxiX+m/8x8DraD5wAfZgWG04N75ZQ2m/ceflIb2H5/vcGMJ7eL92X3+ZZuj+O5PszLDab74YYRhtOOo44D3t+pDacFx8MID2q6o7gD8EPk+TQN8LXMlAzoHj4quqD7dPD+EceD3w40n2SHOp4IuBfRjW62++GGEAr8ER87XZfO00N86tY+L8V2AT8BkeeX0/p6r+bhFxajtavdwBfI97XlXdkeTxwMVJPtt+qzVRVX0eOBQgyf40Q7xvTHIuzVCVN1XVvyx1sFVVSbr2vtF+aL20jXMH4CJgXZK3AU+i+UZu4yLD+nOabzar/flHwC/1iPGk2fUkHwRemeQNNMOOLq6qd/QNKMkuwPuAk6rq6+1lLbPHW/Y2HBPfYNqwqh4CntGOsng/8B+6bjvP/u6l6f2k/VA9GfiZJO+gGXL2R1V1ac99fleMSZ4GvJ7mg3INzX0gf4vm2+wu+1uyv3GSnwLuqqorkxza49eaFN+SteGE+AbRfq1HnZfnHG+538Pj4hvKe3g1zfDG11TVZUn+hOb1Mnqs5W6/+WJ8O8Now9l9rKEZEvv6Mcda7jYcF98gXoPtOWodzRcmXwP+hqZXdJst8TnwUfEleRkDOQdW1Y1JTgc+DHwDuJqmd3a0zrK+/ibEOIjX4Dz77tVmC+zr92lHQyR5J3BKkl8GDgeuraq3LMVxtDTskd6O2m8mqaq7aJKGg+dUuYNHvmWDJmG+Y06d36O59uTXaIZKvo7FDycb9aW0Q07an3eNqdMlzlfTDE05hOYbtF8AfnOxwVXVl6rqobY3/h08ug07xZdkHc231rsAT66qnweOSc/J29oPifcBf1VVf9sWD6YNx8U3tDZsY/oa8DHguTTDnma/1BvXLp3ioxm58XvAS4B/Bo6nuaZqm4zEeEQ1w+arqr4N/CXb2IYs/m/8Y8BRSW6jGbL2AuBPGE4bPiq+JOcNqP3mOy8P5j08Lr4BvYe3AlvrkVEaF9IkrYNpv/liHFAbzjqSptfuS+3jIbXho+IbUPv9Z+BzVfXlaoa6/i3NeWco58Bx8f2ngZ0Dz6qqZ1XV84F7aOZTGdTrb1yMA3oNzpqvzbq00x1t+aQ4f5RmqPxNwLFtnE9OckDPOLUdmUhvJ0l2TvLY2XWab5Kun1NtI/DyNA6hGQL0hZF9/ARwZ1XdTHOtxMPt0jtxmWAjzQcF7c8PjKlzEXB4kt3bb1sPb8tm49wd+Cmak+dsnEUzQcKi5LuvK/kZHt2GAJcDB6SZtXMNzXC073z72SaXJ9F8w7cjj1zzuorm2+GusYTmursbq+ptI08Nog3ni28obZhmZtTd2vUdgRfSXMf9MeCYttp87bcROC7N7KD7AQfQTNQxu+8DgL2r6uMs4jU4T4yfHfmwDM11TOPacLv/javq9VW1d1XtS/M3uqSqfpGBtOE88b1sKO034bw8lPfw2PiG8h6uqi8Ctyd5Slt0GHADA2m/STEOpQ1HvITvHjY9mDYcF9+A2u/zwCFJdmrPJ7OvwUGcA+eJ78ahnAPb/Ty+/fkkmmuP/5qBvf7GxTig1+Cs+dps4v/20MxpA3w9ySHta+LlPLrNZ68z36GND5Y+B9Bi1QBmPPteXGhmDLymXTYDb2jLXwW8ql0PzfXQtwDXAQeNbB+a604e1z7+YZprO64FfmwbY3oPzTUXD9B8a38CzfWVHwVuppkZcfZ4B9HOcNg+/iWaiTm2AP91zn7PAA5t1x9DMxxnM83QusXGd27bNtfSnJz2bOs+Edg0su2Lab5VvWW2rUeeO4l2xvO2Xd/T7vNRs1IuEN/zaE6619IMNbq6Pe4g2nBCfINoQ5pZMz/TxnE9cMrIe+XTbbv8DbC2LT8KOG1k+ze0sd0EHDln3xcAB7Trjwf+T9t+P9fzbzxfjJe0v+/1wHk8MrP31N8nI/s7lEdmxR5MG84T3yDaj/nPy0N5D88X3yDew+22zwCuaGP5O5qhr4NovwViHFIb7gx8Fdh1pGwwbThPfENqvzcDn6U5n5xLM0nYYM6B88Q3iHNgu+0/0Xz5cA1w2NBefxNiXLbXIP3+f570v/3VI+sHta+HW2guPcnIc0czMms8zXX319GMNuzVli7bd0n7B5IkSZIkSR04tFuSJEmSpB5MpCVJkiRJ6sFEWpIkSZKkHkykJUmSJEnqwURakiRJkqQeTKQlSZIkSerBRFqSJEmSpB7+P50uq0GWGoOAAAAAAElFTkSuQmCC",
      "text/plain": [
       "<Figure size 1296x288 with 2 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "visualize_summary(paraphrase_df.article, [paraphrase_df.summary], summary_labels=['paraphrased'], tokenize=True, num_bins=20, amortize=True, figsize=(18,4))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "interpreter": {
   "hash": "9464976d858fa45bf8197a005399e2ab173edbfe73eaf93acf0f6ea5a30bc6d6"
  },
  "kernelspec": {
   "display_name": "Python 3.9.7 ('summarization')",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.7"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
