{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import pandas as pd\n",
    "import matplotlib.pyplot as plt\n",
    "import statsmodels.api as sm\n",
    "from sklearn.linear_model import LogisticRegression\n",
    "from sklearn.model_selection import train_test_split\n",
    "import seaborn as sns"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "data = pd.read_csv('../dataset_final.csv')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "# convert decision to binary classes accept, reject\n",
    "decision_to_binary = {'Accept (Poster)': 1, 'Accept (Oral)': 1, 'Accept (Talk)': 1, 'Accept (Spotlight)': 1, 'Invite to Workshop Track': 0, 'Withdrawn': 0, 'Reject': 0}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "scores = []\n",
    "citations_per_paper = []\n",
    "top_10_indicator = []\n",
    "\n",
    "y = []\n",
    "\n",
    "for ratings, rankings, cits, pubs, decision, year, in zip(data['ratings'], data['csranking'], data['authors_citations'], data['authors_publications'], data['decisions'], data['year']):\n",
    "    if year == 2020 and pd.notnull(rankings):\n",
    "        # get decision\n",
    "        binary_decision = decision_to_binary.get(decision)\n",
    "        \n",
    "        # get distinct rankings\n",
    "        ranks = rankings.split(';')\n",
    "        ranks = [int(x) for x in ranks]\n",
    "        ranks_set = set(ranks)\n",
    "        ranks_set.discard(-1)\n",
    "        \n",
    "        # get mean reviewer score\n",
    "        rates = ratings.split(';')\n",
    "        rates = [int(x) for x in rates]\n",
    "        rating_avg = np.average(rates)\n",
    "        \n",
    "        # get author citatins and publications\n",
    "        cits_last = int(cits.split(';')[-1])\n",
    "        pubs_last = int(pubs.split(';')[-1])\n",
    "        \n",
    "        # discard papers with no last author data\n",
    "        if cits_last == -1:\n",
    "            continue\n",
    "        if pubs_last == -1:\n",
    "            continue\n",
    "            \n",
    "        # for each distinct rank\n",
    "        for rank in ranks_set:\n",
    "            scores.append(rating_avg)\n",
    "            citations_per_paper.append(cits_last/pubs_last + 1)\n",
    "            y.append(binary_decision)\n",
    "                \n",
    "            if 1 <= rank <= 10:\n",
    "                top_10_indicator.append(1)\n",
    "            else:\n",
    "                top_10_indicator.append(0)\n",
    "        \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2.948196187247188 1.2797669207629767\n"
     ]
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAZEAAAEPCAYAAACDTflkAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4yLjIsIGh0dHA6Ly9tYXRwbG90bGliLm9yZy+WH4yJAAAgAElEQVR4nO3dd3wUdfrA8c8TCCGVXkINEgQFFCQixVMUFAQFgbMgRWx4lrtTRMU7C3iInqKcBVHwTkTlByhwKCiKNJVDEVCpFpAuQqjB0ELy/P6YiS7Lpuwmm0l53q9XXpud+c7Ms5PNPjvfNqKqGGOMMaGI8DoAY4wxJZclEWOMMSGzJGKMMSZklkSMMcaEzJKIMcaYkFkSMcYYE7LyXgdQlKpXr65JSUleh2GMMSXKypUr96pqjUDrylQSSUpKYsWKFV6HYYwxJYqIbM1pnVVnGWOMCZklEWOMMSGzJGKMMSZklkSMMcaEzJKIMcaYkFkSMcYYEzJLIsYYY0JmScQYY0zIytRgQ2OKUpv7J+e6fuUzg4ooEmPCx65EjDHGhMySiDHGmJBZEjHGGBMySyLGGGNCZknEGGNMyCyJGGOMCZl18TUmF9ZN15jc2ZWIMcaYkFkSMcYYEzJLIsYYY0LmeZuIiHQB+gB7AFXVkX7rrwN6Ad8A5wOTVfV9d90WYItbdKeq9i+isI0xxuBxEhGRGOAVoLmqHheRGSLSWVUX+BSLBoar6jYRaQ1MB953101S1RFFG7UxxphsXl+JtAe2qupx9/lSoAfwWxJR1Uk+5ZOB9T7PLxKRB4B44ENV/V94wzXGGOPL6yRSEzjs8zzNXXYKEYkGRgCdAN8qq+Gquty9olklIleq6ka/bYcAQwAaNGhQqMEbY0xZ53US2YNzFZEtwV12ClU9CjwoIsnAIhE5Q1UzVHW5u/6IiHwDdAQ2+m07AZgAkJKSouF5GaYky2ssiDEmZ173zloGNBSRKPd5R2CuiFQVkQQAERkmIuKu3wFUB6JFpLOIdPPZVzKwqagCN8YY4/GViHsFcQfwgoikAqtVdYGIPA3sB54CooBxIrINOAv4q6qmicgeYISInAfUAWao6ucevRRjjCmTvK7OQlXnA/P9lj3g8/sTOWy3Bugb3uiMMcbkxuvqLGOMMSWYJRFjjDEhsyRijDEmZJZEjDHGhMySiDHGmJB53jvLmJJAVTm2dwcZ6QepWK0ukXFV+H34kjFllyURY3KhWVnsWTGPfWs/49j+n39bXi46jmotLmLnzs7UrVvXwwiN8ZZVZxmTA9Usts2fxM5Pp1E+Jo76XW6kybXDqd95IPH1z2LPig9JSkri9ttvZ9euXV6Ha4wn7ErEmABUlR0L3mLfmiXUbteTOhf+Pq41vsFZ1GjdheMHU+kUtZkJEybw1ltvMWzYMO6//37i4uI8jNyYomVXIsYEkLpqPqnfLKBmyhUkduwTsExU5Rq89NJLbNiwgR49evD444+TnJzMK6+8wsmTJ4s4YmO8YUnEGD8njxxm1/9mkZDUkroXX5dnA3rjxo2ZPn06X3zxBU2aNOGOO+6gTZs2/LrjhyKK2BjvWBIxxs+uZf8l88Qx6nbqF1QPrAsuuIBPP/2Ud999lwMHDvDD1CfY+vF/yDp5IozRGuMtSyLG+Di272dSv1lI9XM6EV09+F5XIkLfvn3ZsGEDtc7vzr7VS/hh6pOcOLw/DNEa4z1LIsb42PnpdCIio0js0LtA+4mNjaXuxddxRq+/cGzfz3z31giO7f+lcII0phixJGKM69iB3Rza9DU123QlMjahUPZZuUkbmvZ/BLKy2DRrLCePpRfKfo0pLiyJGOPa++0ikAiqn9upUPcbXb0ejXrezfFDqWyZMx7NyirU/RvjJUsixgBZGSfYt/ZTKiefR4W4KoW+//j6zWjQZRBpW9aw63//LfT9G+MVSyLGAAd+WE7msXRqtO4ctmNUP6cTVc5qz+6vPuD4odSwHceYomRJxBhg7zcLiaqaSFz9s8J6nLoXXQsi/PzZO2E9jjFFxZKIKfOO7NlG+q5N1Dj3krDPzFshviq1zr+CA999ybJly8J6LGOKgudzZ4lIF6APsAdQVR3pt/46oBfwDXA+MFlV33fXDQBaA5nAJlV9tShjN6XDge++AImg6lkdiuR42eNHLus7kDNveCTHxLXymUFFEo8xBeFpEhGRGOAVoLmqHheRGSLSWVUX+BSLBoar6jYRaQ1MB94XkXrAMKC1qqqIfCUiC1X1x6J/JaakUlUOfL+chIbNKR8TXyTHLFehIrU7XM32+ZNI3/kjcfXOLJLjGhMOXldntQe2qupx9/lSoIdvAVWdpKrb3KfJwHr3967ASlVV9/ky4Iowx2tKmZUrV3LiUCqVm7Yt0uNWO7sD5aJiSP3mkyI9rjGFzeskUhM47PM8zV12ChGJFpF/4lx53BfktkNEZIWIrEhNtR4x5lTTpk1DIspRuUmbIj1uRGQU1Vr8gQM/rCDj14NFemxjCpPXSWQP4FuHkOAuO4WqHlXVB4H+wCIRiQxi2wmqmqKqKTVq1CjU4E3JpqpMnz6d+IYtKF8xtsiPX71VZ8jKZO/qxUV+bGMKi9dJZBnQUESi3OcdgbkiUlVEEgBEZJj83vK4A6iO007yEdDGZ1174MOiC92UdMuXL2fbtm1UKeKqrGwVq9QiIakle79dhGba/UdMyeRpw7qqHhGRO4AXRCQVWK2qC0TkaWA/8BQQBYwTkW3AWcBfVTUNSBORMcBYEckEXrNGdROMadOmUaFCBSolt/Yshhqtu7Bp1lgObvyaKk3P9ywOY0LleRdfVZ0PzPdb9oDP70/ksu1bwFvhi86UVllZWbzzzjt07dqVnR5UZWVLaHQOkbGV2f/dMksipkTyujrLGE988cUX7Nixg2uvvdbTOCQigspN25L202oyjx/xNBZjQmFJxJRJ06ZNIyoqip49e3odClWbXYBmZnDwx1Veh2JM0CyJmDInuyrriiuuICGhcO4bUhAxiY2pkFDdGTlvTAljScSUOUuXLmXXrl2eV2VlExGqNLuAtK3rOHnkcN4bGFOMWBIxZc60adOoWLEiV111ldeh/KZKs3agWRz44SuvQzEmKJZETJmSmZnJu+++S48ePYiLi/M6nN9E16hPVNVEDnz3pdehGBMUSyKmTPn000/ZvXt3sanKyiYiVDmzLb/u/J6MI2leh2NMvlkSMWXK9OnTiYmJoUePHnkXLmKVm5wHqhza9I3XoRiTb5ZETJlx8uRJZsyYwZVXXklsrHcDDHMSXbMhFRKqc/DHlV6HYky+WRIxZcbixYtJTU0tdlVZ2USESsnncXjrOjJPHPU6HGPyxZKIKTOmT59ObGws3bt39zqUHFVu0gbNzCBt81qvQzEmXyyJmDIhIyODmTNn0rNnT6Kjo70OJ0dxdc+kfHQ8BzdalZYpGSyJmDJh4cKF7Nu3r9hWZWWTiAgqNW5N2k/fcuLECa/DMSZPlkRMmTBlyhQSEhLo1q2b16HkqVKT88g8foRFixZ5HYoxefJ8Knhjwi09PZ0ZM2bQr18/KlasWKj7bnP/5ELdH0BCw+ZEREYxa9YsunbtWuj7N6Yw2ZWIKfVmzZpFeno6AwcO9DqUfIkoX4GERucwe/ZssrKyvA7HmFwFlURE5KdwBWJMuLz55ps0bNiQCy+80OtQ8q1ykzb88ssvfPmlTYNiirdgr0SSRGSkiDQISzTGFLJdu3bxySefMGDAACIiSs6Fd6UzziUyMpJZs2Z5HYoxuQrlv+pM4DsR+UBEeolIyfnPNGXOlClTyMrKKjFVWdnKRcVw6aWXMmvWLFTV63CMyVHQCUBV+wENgIXAU8B2ERklIkmhBCAiXUTkZREZISKPBVj/oIiMdR+ni0gzn3VbRGSx+/N2KMc3pZeqMnnyZM4//3yaNm3qdThBu/rqq9m4cSPr1q3zOhRjchRU7yxVjXAf9wJjgDEi0gm4DVgnIp8BrwLvqWpmXvsTkRjgFaC5qh4XkRki0llVF/gUiwOGqqqKyHXAM0D2jSAmqeqIYF6DKX1y6iGVvmsT369ezSuvvFLEERWOXr16ceeddzJr1ixatGgR1La59Rpb+cyggoZmzG8KXBWlqouBG4F7gYuAd3GuTkaLSKM8Nm8PbFXV4+7zpcAp06uq6iP6+/V8BPCrz+qLROQBEfmHiHQo4EsxpczebxcREVmRG264wetQQpKYmEi7du2sXcQUa8H2zhrk97yBiPwD2AqMByoCq3GuFhKBb0VkqohUy2GXNQHf+4GmucsCHbsCTrJ62GfxcFV9GngS+I+IJAfYboiIrBCRFampqfl5maYUOHksnf3ffUnVs9oRHx/vdTgh6927N19//TVbt271OhRjAgr2SuR1cfQSkQ+An4C/AwnA60A7VW2tqmNV9SactpMDwJQc9rcH8P0PT3CXncJNIOOBv6vqpuzlqrrcfTwCfAN09N9WVSeoaoqqptSoUSPIl2tKqv3r/4eePEH1cy/xOpQC6d27NwD//e9/PY7EmMCCTSICbAdmAt2Ab4E7gTqqemv2h3o2VT2IU8112oe7axnQUESi3OcdgbkiUlVEEgBEJBqnneU5VV0pIn3d5Z1FxHcOi2RgE6bMU1X2rl5MTK1GxNRK8jqcAklOTqZFixZWpWWKrVCmPUkA/g1MUNUVuRUUkcrAMCAj0HpVPSIidwAviEgqsFpVF4jI08B+nN5fbwMtgEYiAhALzMC5YhkhIucBdYAZqvp5CK/HlDLpO3/k2N4dNLj8JiA8U5MUpauvvprRo0eTmpqKXU2b4iaUJJKoqun5LFsPaIpTFRWQqs4H5vste8Dn9z45bLcG6JvPOEwZsnvlPMpVjKXqWe29DqVQ9O7dm1GjRvH+++9z8803ex2OMacItjrrptwSiIhc4tsjS1XXquo1qvq3kCM0JgjHDuzm0I+rqNHqUiIio/LeoARo3bo1DRs2tHYRUywFm0ROGwzo5wXgexG5KcR4jCmQ1JUfIeXKUaN1F69DKTQiQu/evfn44485ePCg1+EYc4pgk0jDPNanAH/C6bFlTJE6efRX9q39jCrN2hEZW9nrcApV//79OX78ONOmTfM6FGNOUajzXrmDBqfhjBExpkjtXb2IrJMnqJVS/G88Faw2bdrQokULJk2a5HUoxpwi14Z1EbkI6OS37BGcrr6BVAQ6AJsLIzhj8isr8ySpqz4hPqkF0TXqex1OoRMRBg8ezLBhw9iwYQNnnXWW1yEZA+TdO+sSTm0HUWBkHtscBGxyHlOkDmz4goz0gzS84lavQwmbAQMG8OCDD/LGG2/w1FNPeR2OMUDeSWQSsNj9XYAFOIklEMUZnb5RVY8WRnDG5IeqsmflPCpWr0d8w+AmKixJatWqRffu3XnzzTd54oknKFeunNchGZN7ElHVrTjzYgEgIttUdUnYozImCIe3redo6nYadr0Fd0BqqTV48GDef/995s2bR48ePfLewJgwC6phXVXzmpXXmCK356sPKR9biSqlZHBhbq688koSExN54YUXvA7FGKCQe2dlE5E87yViTGFYt24daVvWUKN1FyLKR3odTthVqFCBP//5z3z88cesWbPG63CMyT2JiEg13/upi8hF+fkJf9jGOMaOHYuUr0CNcy/1OpQic/vttxMTE8Nzzz3ndSjG5NmwvgKoLiL13Rl5F+M0oBvjud27d/Pmm29SrfmFlI+O8zqcQpfbxJE33XQTEyZMYPTo0SQm2rAs4528ksgGIAnw7W31eB7bCPBIAWIyJl/GjRtHRkYGNVO6eh1Kkbvnnnt4+eWXGTduHKNGjfI6HFOG5dU7q3uAZXmNE0FEHi1IUMbk5ciRI7z88sv07NmT7VVqex1OkUtOTqZ379689NJLDB06lKpVq3odkimjgm1Yz+9t4kr27eRMsTd58mT27dvH0KFDvQ7FMyNGjCAtLY1//vOfXodiyrBgu/jma4yIjSUx4ZSVlcXYsWNJSUnhD3/4g9fheKZly5bccMMNvPjii/z8889eh2PKqKCSiIhUFpFB7k+suyxSRCaIyH4R2Skiw8ITqjGOuXPn8sMPP3DfffeV+sGFeRk5ciQZGRnWLmI8E2x11gCcqVBuAaLdZSOAW4E4IAb4p4j0LqT4jDnNs88+S4MGDfjjH//odSiea9y4MbfddhsTJ05k48aNXodjyqBgk8jVwAhVvVhV94pINHAnkAokq2oV4HngL4UcpzEArFy5kiVLlvCXv/yF8uVDubtz6fPII48QFRXFgw8+6HUopgwKNok0A172eX4FUAl4WVW3ucvGADZPtQmL5557jvj4eG69tfTO1husxMREhg8fzsyZM1myxJojTdEKNolUAnzvsX4tzuDDt32W7QXi87tDEekiIi+LyAgROe32uyLyoIiMdR+ni0gzn3UDRORZEXlaRG4P8rWYEmb79u1MmzaN2267jUqVKnkdTrFy3333Ub9+fYYOHUpWVpbX4ZgyJNj6gK3AxcA8dzqUnsDXqupbGZsM5KuriIjEAK8AzVX1uIjMEJHOqrrAp1gcMFRVVUSuA54BrhKResAwoLW77isRWaiqPwb5mkwJ0Ob+yexYPJXMLOWjw3VZnMto7rIoOjqap556iv79+zN58mTCNC2eMacJ9p32NjBVRKYDnwNRwG/Tibo9tp4Evsnn/toDW93b6gIsBU6Z31pVH1HV7KlWIoBf3d+7Ait91i3DqV4zpVDm8aPsXb2YKmeeT1Sl6l6HUyz169ePtm3b8uijj5J18oTX4ZgyItgkMhbnxlR9gXrAf1R1MoCIdMW5KdWVwNR87q8mcNjneZq77DQiUgG4EXg4mG1FZIiIrBCRFampqfkMyxQ3+9Z+StaJo9QshfdPLywiwlNPPcX27dtJ/XpB3hsYUwiCHWx4TFX7AlWBSqp6m8/qT4EmwBnAf/O5yz2c2n6S4C47hZtAxgN/V9VNwWyrqhNUNUVVU2rUqJHPsExxcvLkSfas/Ji4emcSm3iG1+EUa5dccgndunXjly/f5+Sx9Lw3MKaAQqo4VdVDqnrYb9lRVd3q3g2xYz53tQxoKCJR7vOOwFwRqSoiCQBuN+JXgedUdaWI9HXLfgS0kd9Hm7UHPgzl9Zji7Z133uFE2l5qplhtZX48+eSTZB5LZ/dXH3gdiikDwtXRfhGQ5w2gVfWIiNwBvCAiqcBqVV0gIk8D+4GncNphWgCN3HwRC8xQ1R0iMgYY694E6zVrVC99srKyGD16NBWr1qFS41Zeh1MitGrViipntSd15cfUatON8jH57ixpTNCCTiIiUhenTaQJzgj1As07oarzgfl+yx7w+b1PLtu+BbxVkOOb4m3u3LmsXbuWhlcMQcR6HOVX7Quu4sCGZaR+8wmJHWwCCRM+QSUREekMzMZJHrmxG1eZAlNVnnjiCZKSkqjS7AKvwylRoqvXpVLjVuz5+hNqnd+diMiovDcyJgTBXok8A2zGuTHVBpzutv4JQ4BNGFNAixYt4ssvv2T8+PFM3GRTnPjK7a6H2Wqd34NDU59g39rPqNG6SxFEZcqiYOsHzgKuVdV3VHWtqm7Jbkz3+dmC01PLmJCpKo899hi1a9dm8ODBXodTIsXWbUJsnWR2r5iHZmV6HY4ppYJNIvuAnXkVUlW7KZUpkDlz5vD555/z6KOPUrFiRa/DKZFEhFrnd+fEoVQO/rjS63BMKRVsEnkDyHP+bRFZGFo4xjjjQoYPH86ZZ55pEy0WUKXGrakQX429a2xiRhMewVY0vw48JyItgfdw5sg66ldGcObXMiYkkydPZv369bz77rtERkZ6HU6JJhERVG3xB35ZNpvjh1KJqmQDbk3hCjaJ/MDvDel2zxBT6A4fPsyjjz7KBRdcQJ8+OfbuNkGo5iaRfWs/o05HO6emcIXS5SWvbiECDAxhv8bw4IMP8vPPP/POO++U+VvfFpaoStVJSGrBvrWfkdj+aq/DMaVM0ElEVW/Kq4yIDAotHFOWLV68mPHjx3PvvffSvn17r8MpVaq1vIjN748jbetar0MxpUywDev98lnOemeZoKSnp3PLLbfQuHFjRo0a5XU4pU6lxq0pHx3PvjXW+94UrqCuRFR1Wj7LWVcQk2+qypAhQ/jpp59YvHgxMTF5TYhgghVRPpIqzdqxd/Vi0tLSSEhI8DokU0qENAxYRM7EafdIAWqqahu3x9a5wP+pqo1sKoPyGkW98pnAtZyjRo1iypQpPPHEE1x8sXXsC5cqzdqS+vV83nvvPQYMGOB1OKaUCHpGOxH5G7AW+DvO3QWzp1aNASYC7/tM7W5MrqZOncqjjz7KoEGDeOihh7wOp1SLrZNMZHxVpk3LV4WCMfkS7ASM1wKjgM9w7l64A/cGVKr6pYgkAx8Ad+LcBdGYHL355pvcdNNN/OEPf2B11YtIeeBNr0Mq1UQiqNK0LR999BEHDhygSpUqXodkSoFgr0T+Ajyhqher6nhVfd93parudMtY7yyTq+eff55BgwZx8cUXM3fuXCLK26DColClWTsyMjKYNWuW16GYUiLYJNISeC6PMsuBRqGFY0q7jIwM7r77bu655x769OnD3LlziY+3myYVlZhaSZxxxhlWpWUKTbBJpByQlUeZ2iHs15QBe/bsoUuXLowbN4777ruPadOm2eSKRUxEuP7661mwYAGpqaleh2NKgWA/7NcAw/IoczvwTWjhmNLqyC+bSUlJYfny5bz11luMGTOG8uXtHiFeuOaaa8jMzGT27Nleh2JKgWCTyHjg7yKySET6i0gLABFpJCKXishknCQzrrADNSXX/g3L+H7qEwAsXbqU/v37exxR2XbuuedyxhlnMGPGDK9DMaVAsIMNJ4tIW5zeVxf5rNroPgrwr/wOSgQQkS5AH2CPcwgdGaDMtcCTwF9VdY7P8i3AFvfpTlW1T6diZs+qj9mx8G3i6jVjxYol1KxZ0+uQyjwRoW/fvvzrX//i4MGDVK5c2euQTAkWdNuFqt4N9AI+AvYDmTg3q/oA6KGqQ/O7LxGJAV4B7lXVEcA57n3cfcs0AlKB7QF2MUlVO7k/lkCKmV++nMuOhW9TuUkKydfcbwmkGOnTpw8ZGRnMmTMn78LG5CKkBnBVfV9Vu6tqDVWtoKo1VfUqVf0wyF21B7aq6nH3+VKgh9+xNqvqohy2v0hEHhCRf4hIhyCPbcJo94p5/PzZdKo0a0ejq+4kopy1fxQnbdu2pW7dulalZQos3//ZIhIJXA90A5KBSsAh4Hucq5JpqnoyyOPXBA77PE9zl+XXcFVd7l7RrBKRK1V1o28BERkCDAFo0KBBkOGZUBzcuIqdi6dSuUkKSd1vRyKss15xExERQe/evXnttddIT08nNjbW65BMCZWv/24RaY9zQ6pJODP5ng+c6T4OwLnHyA8i0i7I4+8BfAcJJLjL8kVVl7uPR3B6hHUMUGaCqqaoakqNGnZXt3A7snsrW+aMJ6Z2Ekndh1gCKcb69u3LsWPH+PDDYCsQjPldnv/hbjXRAqAhzlXHS8C9wG3AUJw2jU1AErDQTTj5tQxo6DPXVkdgrohUFZFcpxkVkc4i0s1nUbIbh/HIyWPp/DT7BcpFx9G49z1ERNoUasXZhRdeSPXq1a1KyxRIrtVZIlIB+D+cKqfrVfW9XMpei9MFeIqInKmqGXkdXFWPiMgdwAsikgqsVtUFIvI0TqP9U+Lc3u7vOEnsOhHJUNWPcK5YRojIeUAdYIaqfp6fF20Kn6qyff4bnPj1AE37/Z3IWOvxU9yVL1+eq6++mqlTp3Ls2DEb+GlCklebSH+gGtBOVXO9JZqqTheRjTiTM/bHqfrKk6rOB+b7LXvA53fFmfRxlF+ZNUDf/BzDhN/kyZM58P2X1Lnwj8QmNvY6HJNPffv25bXXXuOTTz7hyiuv9DocUwLlVZ11JfBSXgkkm6quAl4GehY0MFNybN68mbvvvpu4es2o1bZH3huYYuPSSy+lUqVKzJw50+tQTAmV15VIG2B0kPucBrwbWjimpFFV/vSnPwHk2ZCe102rTNGrUKECV111FbNnzyYjI4PISJtN2QQnryuRaji9soLxPVA9tHBMSfPWW2/x8ccf89RTT1EhoZrX4ZgQ9OnTh/3797Nkid3V2gQvryQSo6qH8yhzCrd8dOghmZIiNTWVe++9l/bt23PHHXd4HY4JUdeuXYmJibEqLRMS68RvQjZs2DDS0tKYOHEiETYepMSKiYnhiiuuYObMmWRmZnodjilh8moTERGxd5UBTm3T+HXnD/zwf5OpdcGVDJq0EljpXWCmwK677jpmzJjBokWL6NKli9fhmBIkP18fJYQfU4ppVibbP3mTyPiq1L7AOuKVBldeeSUJCQm8/fbbXodiSpi8koiqakSwP0USufFM6jcLOZq6jXqdbqBcBRuVXhpER0fTt29fZsyYwdGjR70Ox5QgeX3gbwtxv6FuZ4q5jPQ0di2dSXyDs6l8ZorX4ZhC1L9/fw4fPsz777/vdSimBMk1iahqo1B2Gup2pvj7+bN3yMw4Tr3OA3FmpDGlRadOnahTp45VaZmgWNWTybf0nzeyb+2n1GzTlehqdbwOxxSycuXK0a9fPz744AP27dvndTimhLAkYvIlMzOTbQsmExlXmcT21pheWg0YMICTJ08yZcoUr0MxJYQlEZMvr776Kkd3b6Vup36Uq2BjSUurVq1a0bZtW8aNG4cz96kxubMkYvK0a9cuHnroIeIbnE2Vphd4HY4Js7vvvpvvv/+eBQsWeB2KKQEsiZg83XPPPRw/fpz6l91ojellwDXXXEP16tUZN26c16GYEsCSiMnVBx98wPTp03n44YepWKW21+GYIlCxYkVuu+023nvvPbZts976JneWREyOjhw5wl133UWzZs24//77vQ7HFKHs6f3Hjx/vcSSmuLMkYnL0+OOPs2XLFl599VWiomxkelnSoEEDevfuzcsvv8z+/fu9DscUY5ZETEBr1qzh2Wef5eabb+aiiy7yOhzjgREjRnD48GGefvppr0MxxZglEXOarKwshgwZQuXKle0DpAxr0aIFN9xwAy+88AK7du3yOhxTTOU1FXzYiUgXoA+wB0AlRRIAACAASURBVGfCx5EBylwLPAn8VVXn+CwfALQGMoFNqvpq0URduj3//PN88cUXvPHGG1SrZncrLG3yuk3xymcG/fb7iBEjmDp1KqNHj+bFF18Md2imBPI0iYhIDPAK0FxVj4vIDBHprKoLfMo0AlKB7X7b1gOGAa1VVUXkKxFZqKo/FuVrKG3Wr1/PQw89xFVXXcXAgQO9Dsd4LDk5mZtvvplXX32Vv/zlLzRp0iTXJOSbgEzZ4HV1Vntgq6oed58vBXr4FlDVzaq6KMC2XYGV+vuw2mXAFWGLtAzIyMhg4MCBxMfHM3HiRBsTYgAYOXIkMTEx3HbbbWRlZXkdjilmvE4iNQHfe7inucsKbVsRGSIiK0RkRWpqasiBlgUjR45k1apVvPLKK9SqVcvrcEwxkZiYyJgxY1iyZAkTJ070OhxTzHjdJrIHiPd5nuAuy++2yX7bbvQvpKoTgAkAKSkpNhlQDhYsWMDo0aOp2vxCRn+Rzugvcq83N2XLLbfcwpQpU3jggQdo0G8kFeKreh2SKSa8vhJZBjQUkexBCB2BuSJSVUQS8tj2I6CN/F7n0h74MExxlmq7d+9mwIABNG3alPqdrU7bnE5EmDhxIhkZGWz9cCJq1VrG5WkSUdUjwB3ACyIyCljtNqoPB+4EEMfDQEPgOhHp6m67AxgDjBWRZ4HXrFE9eJmZmQwcOJCDBw8yffp0u92tyVHjxo158cUXObxtPb988Z7X4ZhiQsrSdM8pKSm6YsUKr8PwlH/Pmp2fTmf38rk0uPwmqp/TyZugTLGSWw8rVaV6iwvZv34ZTa59gPgGZ+d7W1NyichKVQ14P2yvq7OMh/ZvWMbu5XOpfu6llkBMvogI9bvcSFTV2mye8woZ6Qe9Dsl4zJJIGXXkl81s/ejfxNVrSr1L+3sdjilBylWoyBlX3U3miaNsmfuqtY+UcZZEyqCM9ENsmv0CkdEJNLrqbiLKed1Jz5Q00TXq0aDzQA5vW8+uZbO9Dsd4yJJIGZOVeZKf3nuJk0d/5Yyr/0pkbF6d4IwJrFrLi6ja/EJ+WTabtK3rvA7HeMS+ghZDwcxtFAxVZfuCyaTv/IGkK+8kplbDkPZjTLb6nQdx5Jef2DL3Fc4a9A+vwzEesCuRMmT06NHsW72E2u2uomozu1e6KbhyFaJodNXdZJ04xua548nMzPQ6JFPELImUEW+88QYPP/wwVc/uQGLHvl6HY0qR6Op1qd/lRn7d/h2PP/641+GYImbVWaWQf3VY2pY1bJw5lviGzWnQ9RabWNEUumotLuTwtvU88cQT9OrVi/POO8/rkEwRsSuRUu7Inq38NPsloqvV4Yyef7aeWCZs6l3an5o1a3LTTTdx4sQJr8MxRcQ+UUqx44f2smnGc5SrGEPjPkMpFxXtdUimBMirY0dOyleMJfqCa1n93+dJuuR6EjtcfVoZG9Fe+tiVSCl14tcDbHznn2SdPEFy3/ts1lVTJConn0eVZu345Yv3OJq6Pe8NTIlnSaQUykg/xI/T/0lGehrJfe8juno9r0MyZUj9SwdQLiqGrfNeQ7Ost1ZpZ0mklNm7dy8/vvM0GWn7SO47lNg6yXlvZEwhKh8TT/0ugziyewu7v7K7M5R2lkRKkQMHDnD55Zdz/OBuzuh9D3H1mnodkimjqjRtS+UmKez63385uu9nr8MxYWRJpJQ4dOgQ3bp1Y926dZzR6y8kNGzudUimjKvfZRARkRXY9tG/bZLGUsySSCmwa9cuLr74YlatWsX06dOp1Ogcr0MyhsjYStS7pD/pP28k9etPvA7HhIklkRLuxx9/pGPHjmzcuJE5c+bQq1cvr0My5jdVz+5AQqNz+fmzdzh+cI/X4ZgwsCRSgq1YsYKOHTty+PBhFi5cSNeuXb0OyZhTiAgNLrsRIiLY9vHrZFm1VqljSaSEmj9/Pp06dSImJoalS5fStm1br0MyJqAKCdWo16kfh7et5/nnn/c6HFPIbMR6CTRlyhQGDx5Ms2bNmDdvHnXq1PE6JGNyVa3lxRz66VuGDx9O586dOeec09vtwnULBBNenl+JiEgXEXlZREaIyGMB1lcUkZdE5CER+Y+InOmzbouILHZ/3i7ayL2x+6sP6d+/Px06dODTTz+1BGJKBBGh4eU3U7VqVW644QaOHj3qdUimkHiaREQkBngFuFdVRwDniEhnv2L3ANtU9UlgLPBvn3WTVLWT+1OqbxSumsWORVPYuWQq11xzDfPmzaNy5cpeh2VMvpWPiWfSpEmsW7eOP/3pT6iq1yGZQuB1dVZ7YKuqHnefLwV6AAt8yvQA/gagqmtE5FwRSVDVNOAiEXkAiAc+VNX/FWHsRSbrZAZb503kwHdfUuO8y9jYoDsdH5nudVjGBK1r166MHDmSxx57jHPPPZehQ4d6HZIpIK+TSE3gsM/zNHdZfsqkAcNVdbl7RbNKRK5U1Y2+G4vIEGAIQIMGDQo5/PDLyjjOpln/4vC29dS96Dpqnn+F3Q/ElGgPP/wwq1ev5v777+fss8+mW7duXodkCsDrNpE9OFcR2RLcZfkqo6rL3ccjwDdAR/8DqOoEVU1R1ZQaNWoUYujhl3XyBJtmv8DhbRto2O02arXtbgnElHgRERFMmjSJli1b0rdvXz7//HOvQzIF4HUSWQY0FJEo93lHYK6IVBWRBHfZXJxqL0SkJfCtqqaJSGcR8f0KkwxsKqrAwy0r8yQ/vTeOw1vW0rDrzVRrcaHXIRlTaOLi4pg3bx716tWje/fufPnll16HZELkaRJxryDuAF4QkVHAalVdAAwH7nSLPY+TaB4G7gNucZfvAW4Tkb+JyEvADFUtFV9pVJVtH79O2k/fUL/LjVRreZHXIRlT6GrXrs3ChQupWbMmXbt25fD277wOyYTA6zYRVHU+MN9v2QM+vx8F7gqw3Rqgb9gD9MDu5XPZv+5zarfvRY1Wl3odjjFhU7duXRYtWkTXrl357p2nadjtVqqe3cHrsEwQvK7OMn5mzpzJz5+9Q5VmF5DYobfX4RgTdvXr12fp0qXE1m3Clg9e5eelM1G16VFKCksixcjGjRu58cYbiUlsTMNut1ojuikzqlSpQnLfYVRtfiG/LJvNpln/4uSxdK/DMvlgSaSYOH78ONdddx3ly5fnjKvuIqJ8Ba9DMqZIRZSPpGG3W6nfeRBpW9by/Vsj7D7tJYAlkWLioYceYtWqVbz++utUSKjmdTjGeEJEqNG6M2de9xBZGSf4/u3H2f/dF16HZXJhSaQYmDNnDmPHjuXuu+/m6quv9jocYzwXV7cJzQaOJLpWElvmjGfHov/j5MmTXodlArAk4rEdO3YwePBgzj33XJ555hmvwzGm2IiMq0yTax+kRuvL2LNyHpdddhl79tiNrYobz7v4lmWZmZn079+fY8eOMW3aNCpWrOh1SMYUKxHlylO/8wBiajdiyfzXqZd8Fmf0vJvYxManlbWp4r1hVyIeGjVqFJ9++ikvv/wyTZs29TocY4qtas070rTfI4hE8MPU0exdvdjrkIzLkohHlixZwuOPP87AgQMZNMi+QRmTl5haDWk2cCRx9Zux7ePX2b7gTTQr0+uwyjxLIh7Yu3cvN9xwA40bN2bcuHFeh2NMiVE+Oo7kPvdRM6UbqV9/wsZ3x3Dy6K9eh1WmWRIpYllZWQwePJi9e/cybdo04uPj897IGPMbiYigXqd+NOx6C7/u+J7v336cY/t+9jqsMsuSSBF7/PHHmTt3Ls899xytW7f2OhxjSqxqLS+iyXXDyTxxlO+n/IN58+Z5HVKZZEmkCL333nuMHDmSG2+8kTvvvDPvDYwxuYqreyZN+z9GhYTqdO/enREjRpCZae0kRcmSSBFZu3YtAwYMoE2bNowfP97mxTKmkERVqs6Z/R5m0KBBjBw5kssvv5ydO3d6HVaZYeNEisDGjRu57LLLiIuLY+bMmURHR3sdkjGlSrkKUUyaNImLL76Yu+66i+bNm/Pcc89x0003FfgLW5v7J+e6vqyPT7ErkTDbsWMHXbp0ISMjg/nz55fI+7wbU1LcdNNNrF69mlatWnHLLbdwySWX8NVXX3kdVqlmVyJh9O2339KrVy8OHDjAwoULad68udchGeOpvL7VF4bk5GQWLlzIxIkTeeSRR2jbti1//OMfGTp0KO3atbOq5EJmVyJhMnPmTDp06MDJkydZuHAhbdq08TokY8qMiIgIbr/9djZt2sSjjz7Kxx9/TIcOHWjTpg1jxozhu+++Q1W9DrNUkLJ0IlNSUnTFihVhPcaOHTsYNmwY06ZN44ILLmDWrFkkJiYGtY+i+LZmTGmTW9vEr7/+yttvv82rr77K119/DUC9evVo1aoVLVu2pG7dutSsWZO4uDgiIpzv1unp6aSnp/P3yQvIyjh+yk+m+ygREfS9sCWVK1emYcOGNGrUiKSkJJKSkoiNjS2S110URGSlqqYEWud5dZaIdAH6AHsAVdWRfusrAmOAnUAT4ClV/cFdNwBoDWQCm1T11aKM3deGDRuYOHEiEyZMIDMzk8cee4zhw4fbpIrGFAMXj5wJRCOd76HF+fs49NM3/LrzRz5Z9jVz5n4A+bwdr5SLJCKyAhGRUURERoFmMXfuNvbv38/x48dPKZuYmMjZZ59N8+bNf3ts3rw5VapUCcMr9I6nVyIiEgOsBpqr6nERmQG8rKoLfMoMB7JU9WkRaemu/4OI1APmAK1VVUXkK+AGVf0xp+MV1pVIRkYGW7duZcOGDXz22WcsWrSIFStWEBkZSd++fRk9ejSNGjUKef92JWJM0dGsTD58oDu7d+/m6NGjv40ziY2NJTY2lj7PfuAmjQpIRLnTtl/5zCBUld27d7NlyxY2b97M5s2b+fHHH1m3bh3r168nPf33W/0mJibSrFkzGjRoQP369alfvz4NGjSgdu3aVKlShSpVqhAfH1+s2m6K85VIe2Crqman8KVAD2CBT5kewN8AVHWNiJwrIglAV2Cl/p4FlwFXADkmkVDt3buXvn37sn//fvbt28eePXt+e6NVqFCBtm3b8vTTT3PjjTdSs2bNwj68MSaMJKIc3cd8lOP6yLjKee9DhNq1a1O7dm3atWt3yrrzhk3iRNp+ju3bybG9Ozm6byfLv9/O5yu+JTP9IFlZp18FRUREULlyZWJjY4mKiqJixYqnPUZGRiIiv/1EREQEfJ6ZmUlmZibJyck8+eSTwZ+gvF67x1ci/YDrVPVq9/mtQCdVHeBT5nu3zDfu8x1AJ+AaoJaq3uMuHwWgqg/7HWMIMMR92hT4PpyvqZBUB/Z6HUQxY+fkdHZOTmXn43SFdU4aqmqNQCu8vhLZA/jOQJjgLstPmT1Ast/yjf4HUNUJwITCCLaoiMiKnC4dyyo7J6ezc3IqOx+nK4pz4nUX32VAQxGJcp93BOaKSFW3ygpgLk61F26byLeqmgZ8BLSR3ysO2wMfFl3oxhhjPL0SUdUjInIH8IKIpAKrVXWBiDwN7AeeAp4HxojIwzhXHre42+4QkTHAWBHJBF7LrVHdGGNM4StT40RKChEZ4lbDGZedk9PZOTmVnY/TFcU5sSRijDEmZF63iRhjjCnBLIkYY4wJmdddfI2fvKaBKWtEpDEwClgF1AP2qerj3kblPRGJBr4EPlbVYV7H4zURaQr0A44CFwMjVHW5t1F5R0TuB5Jwxog0AW5R1aNhOZa1iRQf+ZkGpqwRkfOBOqo6232+Hhioqiu9jcxbIvIszkCy1LKeRESkHPAecJWqZolIInBSVVM9Ds0TIlIbWA9Ud8/HbGC6qr4djuPZlUjxkp9pYMoUVfW/o1AEkB6obFkhIgNx3hvnAHEeh1McnA8I8Gf3i9g+YKK3IXnqCHACZwD2QZz3yLpwHcySSPFSEzjs8zzNXWYAEekNfKSq33kdi1dE5GzgLFX9m4ic43U8xURDnC9g/VT1kIi8hfMhOsnTqDyiqmluddY0EdkF7CDAbB6FxRrWi5f8TANTJonIJcAlwL1ex+Kx3sAxd3brC4G2InKPxzF5LQ34TlUPuc8/x5lfr0wSkVbA/UAPVR2M0y7yaLiOZ1cixctv08C4VVodgZc9jslzItID+APwVyBRRBqq6jKPw/KEqj6R/bt7r504Vf2XhyEVB18C1USknKpm4lyZ/OBxTF6qC+xX1ZPu811Ag3AdzBrWixkRuQz4I5AKZFjvLGkDLAGybwQTC4xT1UmeBVUMiEhf4C6gAs75+D+PQ/KUW9V5Kc7/TQPgz+HqjVTcuR0NXgCO4bSJtADuUdVdYTmeJRFjjDGhsjYRY4wxIbMkYowxJmSWRIwxxoTMkogxxpiQWRIpgUSkoohc73UcxpjiSURiROS6ojiWJZF8EJHBIqI+P0kextIAWI4zbiLUfVwiIgdF5KEA6waLyIgChOi/v6tFZISIVM5h/UNuLJcU1jHDSUTquu+BIpuvyu+9NyIf5ZP8thnst76GiGwWkQ/CFXMucY0QkU45rD9bRPaIyPiijKukEZFzReTrPD6LMoCHRGSaO54obCyJ5IOqTlJVAd7wMg4RqQR8DGwA/lyAXdUEKhF4ANJg4LEC7Nvf1e7+AiYRN4ZKlJzpXXq6j+8X1QHd916+k6yqbnG3uSmHIrFALaBRIYQXjCSc90KnHNZXBqq65YwfESkvIo8AnwLNciurqhlAZ6AVYZ7+xZJIyfIEzmjce1U1K9SdqOo0oA7OYDWv3YUzS+80rwPJp57AD6r6vdeBhEpVt+BMq3+ex6GcQlX/h/O+7JlX2ZJERBaLyJZC2NXbwJXABcDuvAqr6j7gb8B1IvLHQjh+QJZESggRqQXcBkxV1Z8Luj9V3VWQRFRYVDUrXCNpC5uIxOFcEbzndSwFpar7i+OIblXd436LNqd7A+gQ5ASkM4HNwN/DE5IlkUIjIg1E5DUR2SEiJ9zHiSJSP4fyHURkkYiki8ghEZkvIm3dby3ZddmLfTa5FmeKi09yiaGdiLwnIvtF5IiIfC8i/yciPdypEMhp/9ntPjg39PGvhx/sLisnIgNFZLaIbBGR4yKyS0TeFufmUb6xdHL3d6O7aLN/vX5edf0iEisij4nIdyJyzH1d74tIe79yw/32FS8ir4hIqogcFZHPROS0b90iUlVE/ikiP7jna5uIfCAiN4szpbi/rkAUbhLxP5cicoGIfOL+PdNFZKGItPU7ZsC2ChEZ5rN8S4Bj++7jChFZ5h5jv3v+6+a2jc+2I3xjyKFMnu8jt1yKiLwoImtE5FcROSwiS0XkmgD73AIscp8+5v9aRWRSXq9fRK50z+kh9+/6jYj81S+m2v7nWEQGich69/26RXKYsFJE+rnndb+IHBCRr0TkHyLSJD/nNtxU9QN3brBgtlGc895KRJqHKzD7yecPTt2iAkl+y5vjzNmzFkjB+aBJwZnDfzfO1N2+5TsBx4FvcOoso3AmW1wNbMv+2/ttM9M9duscYrsOpzHtHZw65RjgIpz2EwVa+ZVXYHGA/SwOdHx3XXV3uynAGUBFN/6FODOFNsjvOfM7F4pzJzrf5bHAV8AhnDs9Rruv6133dV6XU+xumd44syC3B3YCvwCxPmXF3f8OnNlwo3GqeF5x99EpwP7fcF9nuQDncpv792zv/j3Pc98PR3G+PfqWH+xuMzjAMbYAW3I5T0tw2mMau+f/KuAAsBWoFcRxAv6dg3kfAXPc43Zyz18izjdeBe7K7986n6//QXfbl4DaOPfIuM2N9b9ARA6vfT7wPE41WSIw1V3+R7/yf3aXP4DTLhMPXINza4ZJBfzcWBzoNRVwn1vI5f/Kr+xQt+yfCzOG3/Yfjp2W1h9yTiKrgCygmd/ys9zlX/ksi8CZ2z8TONOv/GXu/jXAsb9z19UKsK42zo2aNgORfutS/P/53eWhJJHKwBdAlN/yqu7reTG/58xnfcAPFmCsu3yI3/IK7gfXr/7ngt+TyFC/5Q+4y6/2WXaOu2yMX9kId/+dAixPBd4I8BrU/bnEb3lLd/k6v+WDCT2JHAYq+a271V33nyCOc9rfOdj3Ec4kfz0D7HsWsD/APgL+rfN6/UBr9/31vwDln3T3eXcOr3213/Ja7vL/+i1fBewNsP9/UPKTyPVu2ZcLM4bsH6vOKiARuQDnTf61+tVVquoGnG+nKT7VGh1xvkV+rao/+JWfj/NBFUgd9/FggHWDcL4xzlC/+mRVXQG8iHO3twJR1YOq2k5/v/Ni9vL9ON/2Oxb0GOD0QgFuwXnjn9LgrqongBk4Vyo35rCL2X7PN7iPvtUS6j52EZFqPvvPAjrgTC/uqyPOlVhO7SF7VHWRX6xrcG5TeraIpOSwXbA+1N/vm5FtOs7ruV5EKhRg30G9j1T1L6oa6HysAargfIkqDENwknigmYqzl92Zw7anvBdUdTdOgvOvolKgqjizaPt6GudLSEmW/X6pk2upEFkSKbjz3cecGru+8yvX2n3MqXfP9hyWZ9fRn8glhoD7dP/Zc9pvUESkpYhMEZFN4rT9ZNet18f54CgMzXCqE3YF+MCE08+pP/+OB7+6j77tHGtx2pfOxWmv+bfb1hCpqjv19Ebnq3DO/Uc5HDOn85v9N2mVw/pgbfNfoKppONV10cCZBdh3UO8jEUkQkb+LyLduO0X2e+ERt0hhvR9y+x/LXnaWiMQGWB+oE8qvnPpeAKfKC+Ajt33rTyJSS1UPq2q+bgwnbjug/w9OO2PDQOskhzEzhSz7S1+g81NglkQKrpL7mNN9v7OXZ4+TSMij/OEclmffYKZcgHXZ+w7rvcfdN/xKnKqNm4HKqirqjEnYitPOUBiCPaenCJAAsq86xKeMAt1x7pS4C+f1fABsF5H7RMT/tfQEFqnqrwSW0/LsWCvlsD5Y4TxOvt9H4gxg+xynuuffQBOf90L2PXDC/n5wr0yz/zcCvR8C9UBT/GJT1ck41W0f4rSRjQd2iDNYr3Y+4zyCk4D9f466MQZadySf+y6I7M+Mk7mWCpHd2bDgsquXcsry2csPuI+H/Jb7i89h+SGcAXkVOf2DJK8YCsvfgEhgmKouCeNxgj2nIXGrbP4F/EtEWgMDgNuBMTjf6kcBuL1zmuK0AeQkLo9Yfa+oNFBBVwy5f7AEc5xgBfM+6oPT5jNLVXM7L4Uhx7jc6rvyfuVCoqqfAp+KSA2cG8PdjdMr8hwROce/ii/A9ssJMAhQnF6QSaqa6wDBMIp2Hwvy3siRXYkU3HL3Maf637P8yq1yH3N6QwXsEgz85D7WyCWGQG9gEZG7JUAX1xzk9gGX5D7+GGBddIBlee0vJ9/h3Dc7UZxR+v78z2nQRKS6iFyU/VxVv1bV+4Bu7iLfwVm93MfcRqnn9HfL/pt87bMs+9vxKR+KIhKF0+6Sm9NmGXDPUW1+/yYcqmDeR0nuY7jfC75xBfofy162TlVDvhIXkcvFGQeEqqaq6nicquf1OOcjPN1ji0b2e+qnXEuFyJJIAanqVzi3bm0lIqf884nIWTh17ivchkmA/+H847UWkTP9yl9G4CQBv98eNtBUFZNxLvX7iEik37pLcBpE83spe8CNpaL7OFREZrjrsuvjz/GLuwk5T1uSfbWQvb/rReSL3AJQpy/8RJwqh1MmmnS/efbBeb1v5uP15KQFMNV3jIFrnfvoWw3SE6cjRG7tSjVF5FK/WFvifMitUdWVPquyP3ib+u2jF3lXAV0RILFe6243Ja9vy3kI5n0U8L3gyqmDhf97oaKIrBWRznnE9SpOL8dAk45mLyvofFsT8JuPzq0q2+g+LXYDM4Nwhvu4ItdSIbIkUjgG4YwfeFecAVgV3N4477jLB2UXdOvib8VppJ0uzmRqFUSkIzAC55tPINmT5Z3Wy8ftcXILzjiHKeJMdBcjIl2A14FXVHV1Pl9L9huti4hUx+kBld1O8y+cb5PPiEhncQYDnofTgyqnb5nZ++ssIvE4XS+P5SOOR3G+gT4tIn3cD5wGOFM/1AFucV93QSQCE0WksYhEicgZOOMQwG1odXtudSDvUerrgZEi0t79e7bG6Tl0FKd3ka9vcJLVQBG5TETixJmA8mac9pncbMf5G2fHfCVOD6KtONWNIQvyfTQLp5tpNxH5m3tlV0tExuCcr0A24lQ5dXC/9d+A8y1/Sx5xrcYZJ9JeRF5yjxMrIrcB9+H8bQpj0saxbuN4nIhUFmcwaDdgnpbgaW6ANjiN6wvDsvdw9BsubT/83ufc92eLX5n6ON+ed+AkiJ3Aa0D9HPbZzv2jHsH5hjYbSMZprDwRoHwEsAnnqianONvjVLnsx/lGuRpnEFU5nzKLA7yWET7r43E+qPfi1KHOwZnbKnv9ZcBnOB8G6TjjRq7n937r/vsrj/PB/AtOW84S3MGXAeJQfMZn4LQPPIpTvXXcfV1zgPb5+PtMctdtCbAuCafKZTBOct6Ck9h+xmlY7eyz70HuNuflct7VPa9NcD7QDrh/14VA2xy2aeweK909l1NwruZ8430pwHkaAQzEqR476h7rbaCuz76Tcji3Se72/ssXB/s+csslAv/BuSo5gTO+5Fn3J6f/k544CfcoTvXKre7ySTn9DX227e6e0zR3+2+AvwaI67TX7i4P9NpHuOs64gw0Xefu/5C7/2FAdAE/Pxb7n4dC/BwKeK58tqnpvhdfD9fno7gHMsWEiGzGedOfEWBdL5zRuT1VtchmkS3LRORd4AJVzanNA7cb5xJV7VRkgRmTDyLyLM6V8FmquiMcx7DqLA+4DZQjAixvjtNwOifQdqo6GxgN/FtEWoQ1SJPd/nI5RTjtuzGFRURuwBmE2S9cCQSsi69XqgMPulcd7+E0VqbgNFxux+1aGoiq/l1EduK0T3QpgljLLHUaVhPyLGhMMeO2OT0OdFWn63L4jmXVWUXP7cV1O85NY+rh9P3/GecK5HHNxwhZEYlR1aIYqGRy4Pb/v9hv8UhVHVH00RjzWQ8rVwAAAEBJREFUO7fXYXn1m6IoLMeyJGKMMSZU1iZijDEmZJZEjDHGhMySiDHGmJBZEjHGGBMySyLGGGNCZknEGGNMyP4fiMCcgcINkKMAAAAASUVORK5CYII=\n",
      "text/plain": [
       "<Figure size 432x288 with 1 Axes>"
      ]
     },
     "metadata": {
      "needs_background": "light"
     },
     "output_type": "display_data"
    }
   ],
   "source": [
    "# plot last author reputation index\n",
    "\n",
    "sns.set_style({'font.family':'serif','font.serif':['Times New Roman']})\n",
    "\n",
    "g = sns.distplot(np.log(citations_per_paper), color='#3274a1', hist_kws={'alpha':1}, kde_kws={'color':'black'})\n",
    "plt.xlabel('log(citations/publications + 1)', fontsize=20)\n",
    "plt.ylabel('Density', fontsize=20)\n",
    "\n",
    "#plt.savefig('citations_per_publication_last.svg')\n",
    "print(np.mean(np.log(citations_per_paper)), np.std(np.log(citations_per_paper)))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "X = pd.DataFrame()\n",
    "X['mean reviewer score'] = scores\n",
    "X['reputation index'] = np.log(citations_per_paper)\n",
    "X['top ten school?'] = top_10_indicator\n",
    "X['constant'] = [1] * len(scores)\n",
    "y = np.array(y)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(2997, 4)\n",
      "(2997,)\n"
     ]
    }
   ],
   "source": [
    "print(X.shape)\n",
    "print(y.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {
    "scrolled": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Optimization terminated successfully.\n",
      "         Current function value: 0.219219\n",
      "         Iterations 9\n",
      "                           Logit Regression Results                           \n",
      "==============================================================================\n",
      "Dep. Variable:                      y   No. Observations:                 2997\n",
      "Model:                          Logit   Df Residuals:                     2993\n",
      "Method:                           MLE   Df Model:                            3\n",
      "Date:                Fri, 02 Oct 2020   Pseudo R-squ.:                  0.6384\n",
      "Time:                        02:13:57   Log-Likelihood:                -657.00\n",
      "converged:                       True   LL-Null:                       -1816.9\n",
      "Covariance Type:            nonrobust   LLR p-value:                     0.000\n",
      "=======================================================================================\n",
      "                          coef    std err          z      P>|z|      [0.025      0.975]\n",
      "---------------------------------------------------------------------------------------\n",
      "mean reviewer score     2.4354      0.098     24.807      0.000       2.243       2.628\n",
      "reputation index        0.1302      0.057      2.270      0.023       0.018       0.243\n",
      "top ten school?         0.2969      0.165      1.802      0.072      -0.026       0.620\n",
      "constant              -13.6620      0.562    -24.313      0.000     -14.763     -12.561\n",
      "=======================================================================================\n"
     ]
    }
   ],
   "source": [
    "# fit logistic regression model\n",
    "logreg = sm.Logit(y, X)\n",
    "result = logreg.fit()\n",
    "print(result.summary())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Accuracy of logistic regression classifier on test set: 0.90\n"
     ]
    }
   ],
   "source": [
    "# compute test accuracy\n",
    "X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=0)\n",
    "logreg = LogisticRegression(solver='newton-cg', fit_intercept = True, penalty='none')\n",
    "result = logreg.fit(X_train, y_train)\n",
    "\n",
    "y_pred = result.predict(X_test)\n",
    "\n",
    "print('Accuracy of logistic regression classifier on test set: {:.2f}'.format(logreg.score(X_test, y_test)))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [],
   "source": [
    "scores = []\n",
    "citations_per_paper = []\n",
    "cmu_indicator = []\n",
    "mit_indicator = []\n",
    "cornell_indicator = []\n",
    "\n",
    "y = []\n",
    "\n",
    "for ratings, rankings, cits, pubs, decision, year, in zip(data['ratings'], data['csranking'], data['authors_citations'], data['authors_publications'], data['decisions'], data['year']):\n",
    "    if year == 2020 and pd.notnull(rankings):\n",
    "        # get decision\n",
    "        binary_decision = decision_to_binary.get(decision)\n",
    "        \n",
    "        # get distinct ranks\n",
    "        ranks = rankings.split(';')\n",
    "        ranks = [int(x) for x in ranks]\n",
    "        ranks_set = set(ranks)\n",
    "        ranks_set.discard(-1)\n",
    "        \n",
    "        # get mean reviewer score\n",
    "        rates = ratings.split(';')\n",
    "        rates = [int(x) for x in rates]\n",
    "        rating_avg = np.average(rates)\n",
    "\n",
    "        # get last author citations and publications\n",
    "        cits_last = int(cits.split(';')[-1])\n",
    "        pubs_last = int(pubs.split(';')[-1])\n",
    "\n",
    "        # discard papers with no last author data\n",
    "        if cits_last == -1:\n",
    "            continue\n",
    "        if pubs_last == -1:\n",
    "            continue\n",
    "\n",
    "        # for each distinct rank\n",
    "        for rank in ranks_set:\n",
    "            scores.append(rating_avg)\n",
    "            citations_per_paper.append(cits_last/pubs_last + 1)\n",
    "            y.append(binary_decision)\n",
    "            \n",
    "            # compute indicators for each school\n",
    "            if rank == 1:\n",
    "                cmu_indicator.append(1)\n",
    "                mit_indicator.append(0)\n",
    "                cornell_indicator.append(0)\n",
    "            elif rank == 2:\n",
    "                cmu_indicator.append(0)\n",
    "                mit_indicator.append(1)\n",
    "                cornell_indicator.append(0)\n",
    "            elif rank == 7:\n",
    "                cmu_indicator.append(0)\n",
    "                mit_indicator.append(0)\n",
    "                cornell_indicator.append(1)\n",
    "            else:\n",
    "                cmu_indicator.append(0)\n",
    "                mit_indicator.append(0)\n",
    "                cornell_indicator.append(0)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [],
   "source": [
    "X = pd.DataFrame()\n",
    "X['mean reviewer score'] = scores\n",
    "X['reputation index'] = np.log(citations_per_paper)\n",
    "X['CMU'] = cmu_indicator\n",
    "X['MIT'] = mit_indicator\n",
    "X['Cornell'] = cornell_indicator\n",
    "X['constant'] = [1] * len(scores)\n",
    "y = np.array(y)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(2997, 6)\n",
      "(2997,)\n"
     ]
    }
   ],
   "source": [
    "print(X.shape)\n",
    "print(y.shape)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Optimization terminated successfully.\n",
      "         Current function value: 0.217961\n",
      "         Iterations 9\n",
      "                           Logit Regression Results                           \n",
      "==============================================================================\n",
      "Dep. Variable:                      y   No. Observations:                 2997\n",
      "Model:                          Logit   Df Residuals:                     2991\n",
      "Method:                           MLE   Df Model:                            5\n",
      "Date:                Fri, 02 Oct 2020   Pseudo R-squ.:                  0.6405\n",
      "Time:                        02:13:57   Log-Likelihood:                -653.23\n",
      "converged:                       True   LL-Null:                       -1816.9\n",
      "Covariance Type:            nonrobust   LLR p-value:                     0.000\n",
      "=======================================================================================\n",
      "                          coef    std err          z      P>|z|      [0.025      0.975]\n",
      "---------------------------------------------------------------------------------------\n",
      "mean reviewer score     2.4511      0.099     24.718      0.000       2.257       2.645\n",
      "reputation index        0.1306      0.057      2.285      0.022       0.019       0.243\n",
      "CMU                     0.6730      0.368      1.829      0.067      -0.048       1.394\n",
      "MIT                     0.6783      0.358      1.895      0.058      -0.023       1.380\n",
      "Cornell                 1.3482      0.611      2.207      0.027       0.151       2.546\n",
      "constant              -13.7425      0.567    -24.238      0.000     -14.854     -12.631\n",
      "=======================================================================================\n"
     ]
    }
   ],
   "source": [
    "# fit logistic regression model\n",
    "logreg = sm.Logit(y, X)\n",
    "result = logreg.fit()\n",
    "print(result.summary())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Accuracy of logistic regression classifier on test set: 0.90\n"
     ]
    }
   ],
   "source": [
    "# compute test accuracy\n",
    "\n",
    "X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=0)\n",
    "logreg = LogisticRegression(solver='newton-cg', fit_intercept = True, penalty='none')\n",
    "result = logreg.fit(X_train, y_train)\n",
    "\n",
    "y_pred = result.predict(X_test)\n",
    "\n",
    "print('Accuracy of logistic regression classifier on test set: {:.2f}'.format(logreg.score(X_test, y_test)))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
