{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import seaborn as sns"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "summarizers = ['textrank', 'matchsum', 'presumm_ext', 'azure', 'pegasus', 'bart']\n",
    "sort_order = {k:i for i, k in enumerate(summarizers)}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "match_percents_df = pd.read_csv('~/Data/paraphrasing/targeted/no_sample_overlap_percent.csv', index_col=0)\n",
    "match_percents_df.groupby('summarizer').head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "match_percents_df = match_percents_df.sort_values(by='summarizer', key=lambda x: x.map(sort_order))\n",
    "sns.set(rc={'figure.figsize':(10,6)})\n",
    "sns.boxenplot(data=match_percents_df, y='percent_overlap', x='summarizer')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "overlap_df = pd.read_csv('../data/paraphrasing/untargeted/no_sample_overlap_percent.csv')\n",
    "overlap_df = overlap_df.sort_values(by='summarizer', key=lambda x: x.map(sort_order))\n",
    "sns.set(rc={'figure.figsize':(10,6)})\n",
    "sns.boxenplot(data=overlap_df, y='percent_overlap', x='summarizer')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3.9.7 ('summarization')",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.7"
  },
  "orig_nbformat": 4,
  "vscode": {
   "interpreter": {
    "hash": "fb9173d43df76b287d1b53052eec4ff84d0ee52790be7057998c9269beecf529"
   }
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
