{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "CPG0Mzf6NaLq"
   },
   "source": [
    "## The next Block of code, load the data and calculats $\\Pr\\{A\\}$"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "8WOtuD5vQX8l",
    "outputId": "1847f9fb-b18c-4400-baf0-bdbeff786e29"
   },
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import pandas as pd\n",
    "\n",
    "df = pd.read_csv('totals.csv')\n",
    "Num_black = float(df['Black'][0])\n",
    "Num_white = df['Non- Hispanic white'][0]\n",
    "print('The number of black people:{} \\nThe number of white people:{}'.format(Num_black,Num_white))\n",
    "pA0 = float(Num_white/(Num_black+Num_white) )# Calculating \\Pr\\{A=0\\}\n",
    "pA1 = (1-pA0)# Calculating \\Pr\\{A=1\\}"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "FX0pFXcpNHq_"
   },
   "source": [
    "## Next block of code is generating figure 1."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 287
    },
    "id": "iNvW2Dr5QX8x",
    "outputId": "edcc53c9-24b1-40fb-eab8-47c610a404c3"
   },
   "outputs": [],
   "source": [
    "font = {'family' : 'normal',\n",
    "        'size'   : 11}\n",
    "import matplotlib\n",
    "matplotlib.rc('font', **font)\n",
    "\n",
    "\n",
    "df_cdf = pd.read_csv('transrisk_cdf_by_race_ssa.csv')\n",
    "Score = np.array(df_cdf['Score'])\n",
    "cdf_white = np.array(df_cdf['Non- Hispanic white'])/100\n",
    "cdf_black = np.array(df_cdf['Black'])/100\n",
    "pdf_white = cdf_white[1:] - cdf_white[:-1]\n",
    "pdf_black = cdf_black[1:] - cdf_black[:-1]\n",
    "\n",
    "\n",
    "df_per = pd.read_csv('transrisk_performance_by_race_ssa.csv') \n",
    "Score = np.array(df_cdf['Score'])\n",
    "per_white = 1-np.array(df_per['Non- Hispanic white'])/100#white is group 0\n",
    "per_black = 1-np.array(df_per['Black'])/100#black is group 1\n",
    "cdf_R = pA1 * cdf_black+ cdf_white * pA0\n",
    "pRgivenYA0 = pdf_white * per_white[1:] / np.sum(pdf_white * per_white[1:])  \n",
    "pRgivenYA1 = pdf_black * per_black[1:] / np.sum(pdf_black * per_black[1:]) \n",
    "CDFRgivenYA0 = [np.sum(pRgivenYA0[:i+1]) for i in range(len(pRgivenYA0))]\n",
    "CDFRgivenYA1 = [np.sum(pRgivenYA1[:i+1]) for i in range(len(pRgivenYA1))]\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "plt.figure(figsize=(5,4))\n",
    "\n",
    "plt.plot(np.linspace(0,100,len(CDFRgivenYA0)),CDFRgivenYA0, label=r'$F_{R|Y=1,A=0}(\\rho)$',linewidth=4)\n",
    "plt.plot(np.linspace(0,100,len(CDFRgivenYA0)),CDFRgivenYA1,'r' ,label=r'$F_{R|Y=1,A=1}(\\rho)$',linewidth=4)\n",
    "plt.legend(loc=0)\n",
    "plt.xlabel(r'Score $ (\\rho) $')\n",
    "plt.grid()\n",
    "plt.savefig('CDF.eps', format='eps',bbox_inches='tight')\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "B4abIBouNtPe"
   },
   "source": [
    "#Next, we calculate optimal thresholds for the ESR fairness notions\n",
    "#for generating the results of the Table 2 Please uncomment the comment part in the if clause\n",
    "condition np.abs(numerator0-numerator1)<=0.001*(1-noSelect)  implies 0.001-ESR fairness notion\n",
    "\n",
    " condition np.abs(numerator0-numerator1)<=0.01*(1-noSelect)  implies 0.01-ESR fairness notion\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "8cMKk7CSQX8y",
    "outputId": "c0633760-6aa2-40ea-d48e-8007e018288f"
   },
   "outputs": [],
   "source": [
    "\n",
    "obj = 0\n",
    "n0 = 100\n",
    "for i in range(0,len(Score)-1):\n",
    "    for j in range(0,len(Score)-1): \n",
    "        gamma = cdf_white[i]*pA0 + cdf_black[j]*pA1\n",
    "        noSelect = cdf_white[i] * pA0 + cdf_black[j] * pA1  \n",
    "        noSelectn0 = (noSelect**n0)\n",
    "        numerator0 = pA0 *float(np.sum(pdf_white[i:] * per_white[i:-1]))\n",
    "        numerator1 = pA1 *float(np.sum(pdf_black[j:] * per_black[j:-1]))\n",
    "        obj_temp = float(numerator0+numerator1)/float(1-gamma)\n",
    "        EqualOp0 = np.sum((pdf_white[i:]*per_white[i:-1]))/np.sum(pdf_white * per_white[:-1])\n",
    "        EqualOp1 = np.sum((pdf_black[j:]*per_black[j:-1])/np.sum(pdf_black * per_black[:-1]))\n",
    "        if np.abs(numerator0-numerator1)<=0.001*(1-noSelect) and obj_temp > obj:#  and noSelectn0 <=0.5:\n",
    "            Eq0 = EqualOp0\n",
    "            Eq1 = EqualOp1\n",
    "            obj = obj_temp\n",
    "            SR0 = float(numerator0)/float(1-noSelect)\n",
    "            SR1 = numerator1/(1-noSelect)\n",
    "            tau_0 = float(Score[i])\n",
    "            tau_1 = float(Score[j])\n",
    "print('Threshold0: {}, Threshold1: {}, Accuracy: {}'.format(tau_0,tau_1,obj))\n",
    "print('Pr(E_0,tildeY=1): {}, Pr(E_1,tildeY=1): {}'.format(SR0,SR1))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "WVUsILhIOOIe"
   },
   "source": [
    "# Next, we calculate optimal thresholds for the equal opportunity fairness notion\n",
    "# for generating the results of the Table 2 Please uncomment the comment in the if clause\n",
    " \n",
    " condition np.abs(EqualOp0-EqualOp1)<0.001 implies 0.001-EQ fairness notion\n",
    "\n",
    "  condition np.abs(EqualOp0-EqualOp1)<0.01 implies 0.01-EQ fairness notion"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "FrztrIrFQX8z",
    "outputId": "0ad35f67-8898-42ad-eb50-00a6aee4194e"
   },
   "outputs": [],
   "source": [
    "\n",
    "obj = 0\n",
    "for i in range(0,len(Score)-1):\n",
    "    for j in range(0,len(Score)-1): \n",
    "        gamma = cdf_white[i]*pA0 + cdf_black[j]*pA1\n",
    "        noSelect = cdf_white[i] * pA0 + cdf_black[j] * pA1  \n",
    "        noSelectn0 = (noSelect**n0)\n",
    "        numerator0 = pA0 *np.sum(pdf_white[i:] * per_white[i:-1])\n",
    "        numerator1 = pA1 *np.sum(pdf_black[j:] * per_black[j:-1])\n",
    "        obj_temp = float(numerator0+numerator1)/float(1-gamma)\n",
    "        EqualOp0 = np.sum((pdf_white[i:]*per_white[i:-1]))/np.sum(pdf_white * per_white[:-1])\n",
    "        EqualOp1 = np.sum((pdf_black[j:]*per_black[j:-1])/np.sum(pdf_black * per_black[:-1]))\n",
    "        if np.abs(EqualOp0-EqualOp1)<0.001 and obj_temp > obj and noSelectn0 <=0.5:\n",
    "            Eq0 = EqualOp0\n",
    "            Eq1 = EqualOp1\n",
    "            obj = obj_temp\n",
    "            gamma_m = gamma\n",
    "            SR0 = numerator0/(1-gamma)\n",
    "            SR1 = numerator1/(1-gamma)\n",
    "            tau_0 = Score[i]\n",
    "            tau_1 = Score[j]\n",
    "print('Threshold0: {}, Threshold1: {}, Accuracy: {}'.format(tau_0,tau_1,obj))\n",
    "print('Pr(E_0,tildeY=1): {}, Pr(E_1,tildeY=1): {}'.format(SR0,SR1))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "2RLgpkt3O9B3"
   },
   "source": [
    "#The next two blocks, generate the figures in section A.6\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "xN96QmgmQX8z"
   },
   "outputs": [],
   "source": [
    "prs = [0.1,0.2,0.3,0.4,0.5,0.6,0.7,0.8,0.9,1]\n",
    "n0 = 50\n",
    "obj_eq = []\n",
    "Eq0 = []\n",
    "Eq1 = []\n",
    "SR0_eq = []\n",
    "SR1_eq = []\n",
    "obj_ESR = []\n",
    "SR0_ESR = []\n",
    "SR1_ESR = []\n",
    "for p in prs:\n",
    "  obj_eq.append(0)\n",
    "  Eq0.append(0)\n",
    "  Eq1.append(0)\n",
    "  SR0_eq.append(0)\n",
    "  SR1_eq.append(0)\n",
    "  for i in range(0,len(Score)-1):\n",
    "    for j in range(0,len(Score)-1): \n",
    "        gamma = cdf_white[i]*pA0 + cdf_black[j]*pA1\n",
    "        noSelect = cdf_white[i] * pA0 + cdf_black[j] * pA1  \n",
    "        noSelectn0 = (noSelect**n0)\n",
    "        numerator0 = pA0 *np.sum(pdf_white[i:] * per_white[i:-1])\n",
    "        numerator1 = pA1 *np.sum(pdf_black[j:] * per_black[j:-1])\n",
    "        obj_temp = float(numerator0+numerator1)/float(1-gamma)\n",
    "        EqualOp0 = np.sum((pdf_white[i:]*per_white[i:-1]))/np.sum(pdf_white * per_white[:-1])\n",
    "        EqualOp1 = np.sum((pdf_black[j:]*per_black[j:-1])/np.sum(pdf_black * per_black[:-1]))\n",
    "        if np.abs(EqualOp0-EqualOp1)<0.01 and obj_temp > obj_eq[-1] and noSelectn0 <=p:\n",
    "            Eq0[-1] = (EqualOp0)\n",
    "            Eq1[-1] = (EqualOp1)\n",
    "            obj_eq[-1] = (obj_temp)\n",
    "            gamma_m = gamma\n",
    "            SR0_eq[-1] = (numerator0/(1-gamma))\n",
    "            SR1_eq[-1] = (numerator1/(1-gamma))\n",
    "  obj_ESR.append(0)\n",
    "  SR0_ESR.append(0)\n",
    "  SR1_ESR.append(0)\n",
    "  for i in range(0,len(Score)-1):\n",
    "    for j in range(0,len(Score)-1): \n",
    "        gamma = cdf_white[i]*pA0 + cdf_black[j]*pA1\n",
    "        noSelect = cdf_white[i] * pA0 + cdf_black[j] * pA1  \n",
    "        noSelectn0 = (noSelect**n0)\n",
    "        numerator0 = pA0 *float(np.sum(pdf_white[i:] * per_white[i:-1]))\n",
    "        numerator1 = pA1 *float(np.sum(pdf_black[j:] * per_black[j:-1]))\n",
    "        obj_temp = float(numerator0+numerator1)/float(1-gamma)\n",
    "        EqualOp0 = np.sum((pdf_white[i:]*per_white[i:-1]))/np.sum(pdf_white * per_white[:-1])\n",
    "        EqualOp1 = np.sum((pdf_black[j:]*per_black[j:-1])/np.sum(pdf_black * per_black[:-1]))\n",
    "        if np.abs(numerator0-numerator1)<=0.01*(1-noSelect) and obj_temp > obj_ESR[-1]  and noSelectn0 <=p:\n",
    "            obj_ESR[-1] = obj_temp\n",
    "            SR0_ESR[-1] = float(numerator0)/float(1-noSelect)\n",
    "            SR1_ESR[-1] = numerator1/(1-noSelect)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 587
    },
    "id": "Ttef3WFJgJFb",
    "outputId": "adc37335-826c-4da5-a43d-bb6798004255"
   },
   "outputs": [],
   "source": [
    "font = {'family' : 'normal',\n",
    "        'size'   : 11}\n",
    "import matplotlib\n",
    "matplotlib.rc('font', **font)\n",
    "plt.figure(figsize=(5,4))\n",
    "plt.plot(prs,obj_eq,'c--',label=r'$\\Pr\\{\\tilde{Y}=1\\}$ EO',linewidth=4)\n",
    "plt.plot(prs,obj_ESR,'m:' ,label=r'$\\Pr\\{\\tilde{Y}=1\\}$ ESR',linewidth=4)\n",
    "plt.legend(loc='lower right')\n",
    "plt.xlabel(r'$\\psi$')\n",
    "plt.grid()\n",
    "plt.savefig('time21.eps', format='eps',bbox_inches='tight')\n",
    "\n",
    "plt.figure(figsize=(5,4))\n",
    "plt.plot(prs,SR0_ESR,'r',label=r'$\\Pr\\{\\tilde{Y}=1,E_0\\}$ ESR',linewidth=4)\n",
    "plt.plot(prs,SR1_ESR,'b:' ,label=r'$\\Pr\\{\\tilde{Y}=1,E_1\\}$ ESR',linewidth=4)\n",
    "plt.plot(prs,SR0_eq,'c',label=r'$\\Pr\\{\\tilde{Y}=1,E_0\\}$ EO',linewidth=4)\n",
    "plt.plot(prs,SR1_eq,'m' ,label=r'$\\Pr\\{\\tilde{Y}=1,E_1\\}$ EO',linewidth=4)\n",
    "plt.legend(loc='lower right',ncol=2,bbox_to_anchor=(1.02, 0.15) )\n",
    "plt.xlabel(r'$\\psi$')\n",
    "plt.grid()\n",
    "plt.savefig('time2.eps', format='eps',bbox_inches='tight')\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "colab": {
   "name": "Table1Table2.ipynb",
   "provenance": [],
   "toc_visible": true
  },
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.2"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 1
}
