{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "import random\n",
    "import matplotlib\n",
    "matplotlib.rcParams['pdf.fonttype'] = 42\n",
    "matplotlib.rcParams['ps.fonttype'] = 42\n",
    "import matplotlib.pyplot as plt\n",
    "import sys\n",
    "import time\n",
    "import warnings\n",
    "warnings.filterwarnings(\"ignore\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### load FICO dataset"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "DATA_DIR = ''\n",
    "file_name = ['transrisk_performance_by_race_ssa.csv','transrisk_cdf_by_race_ssa.csv','totals.csv']\n",
    "df_repay = pd.read_csv(DATA_DIR + file_name[0])\n",
    "df_cdf = pd.read_csv(DATA_DIR + file_name[1])\n",
    "df_dm_ratio = pd.read_csv(DATA_DIR + file_name[2])\n",
    "\n",
    "df_repay = df_repay.rename(columns={\"Non- Hispanic white\": \"Caucasian\", \"Black\": \"African-American\", \"Hispanic\":\"Hispanic\", \"Asian\":\"Asian\"})\n",
    "df_cdf = df_cdf.rename(columns={\"Non- Hispanic white\": \"Caucasian\", \"Black\": \"African-American\", \"Hispanic\":\"Hispanic\", \"Asian\":\"Asian\"})\n",
    "df_dm_ratio = df_dm_ratio.rename(columns={\"Non- Hispanic white\": \"Caucasian\", \"Black\": \"African-American\", \"Hispanic\":\"Hispanic\", \"Asian\":\"Asian\"})\n",
    "\n",
    "df_cdf.iloc[:,1:] = df_cdf.iloc[:,1:]/100.0\n",
    "df_repay.iloc[:,1:] = (100-df_repay.iloc[:,1:])/100.0\n",
    "k1_list=np.linspace(1,2,5)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### obtain PDF from CDF"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "nrow, ncol = df_cdf.shape\n",
    "df_pdf = df_cdf.copy()\n",
    "for i in range(nrow-1):\n",
    "    indx = i + 1\n",
    "    df_pdf.iloc[i+1,1:] = df_cdf.iloc[i+1,1:]- df_cdf.iloc[i,1:]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "fig = plt.figure(figsize=(7,3))  \n",
    "plt.subplot(1,2,1)\n",
    "plt.plot(df_pdf[\"Score\"]/100,df_pdf['Caucasian'],label='Caucasian')\n",
    "plt.plot(df_pdf[\"Score\"]/100,df_pdf['African-American'],label='African-American')\n",
    "plt.plot(df_pdf[\"Score\"]/100,df_pdf['Hispanic'],label='Hispanic')\n",
    "plt.plot(df_pdf[\"Score\"]/100,df_pdf['Asian'],label='Asian')\n",
    "plt.xlabel('Score')\n",
    "plt.title(\"PDF of scores\")\n",
    "plt.legend()\n",
    "plt.subplot(1,2,2)\n",
    "plt.plot(df_cdf[\"Score\"]/100,df_cdf['Caucasian'],label='Caucasian')\n",
    "plt.plot(df_cdf[\"Score\"]/100,df_cdf['African-American'],label='African-American')\n",
    "plt.plot(df_cdf[\"Score\"]/100,df_cdf['Hispanic'],label='Hispanic')\n",
    "plt.plot(df_cdf[\"Score\"]/100,df_cdf['Asian'],label='Asian')\n",
    "plt.xlabel('Score')\n",
    "plt.title(\"CDF of scores\")\n",
    "plt.tight_layout()\n",
    "fig.savefig('pdf_cdf.pdf')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### repayment probability $P_{Y|X,S}(1|x,s)$"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "scrolled": false
   },
   "outputs": [],
   "source": [
    "import matplotlib\n",
    "matplotlib.rcParams.update({'font.size': 10.7})\n",
    "\n",
    "fig = plt.figure(figsize=(3.5,3))  \n",
    "plt.plot(df_repay[\"Score\"]/100,df_repay.iloc[:,1],label='Caucasian')\n",
    "plt.plot(df_repay[\"Score\"]/100,df_repay.iloc[:,2],label='African-American')\n",
    "plt.plot(df_repay[\"Score\"]/100,df_repay.iloc[:,3],label='Hispanic')\n",
    "plt.plot(df_repay[\"Score\"]/100,df_repay.iloc[:,4],label='Asian')\n",
    "plt.title(r\"$P_{Y|X,S}(1|x,s)$\")\n",
    "plt.xlabel('Score')\n",
    "plt.legend()\n",
    "plt.tight_layout()\n",
    "fig.savefig('repay_prob.pdf')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Create a simulator"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**Step 1.** Generate simulated data from the joint distributions given above, $P(X=x,Y=y \\mid S= s) = P(Y=y \\mid X=x, S= s)P(X=x\\mid S=s)$."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "np.random.seed(777)\n",
    "# Step 1\n",
    "NUM_SAMPLES = 100000\n",
    "elements = df_pdf[\"Score\"]\n",
    "probabilities_c = df_pdf[\"Caucasian\"]\n",
    "probabilities_aa = df_pdf[\"African-American\"]\n",
    "probabilities_h = df_pdf[\"Hispanic\"]\n",
    "probabilities_a = df_pdf[\"Asian\"]\n",
    "\n",
    "scores_c = np.random.choice(elements, NUM_SAMPLES, p=probabilities_c)\n",
    "scores_aa = np.random.choice(elements, NUM_SAMPLES, p=probabilities_aa)\n",
    "scores_h = np.random.choice(elements, NUM_SAMPLES, p=probabilities_h)\n",
    "scores_a = np.random.choice(elements, NUM_SAMPLES, p=probabilities_a)\n",
    "prob_repay_c = [df_repay.loc[df_repay[\"Score\"]==x][\"Caucasian\"].values[0] for x in scores_c]\n",
    "prob_repay_aa = [df_repay.loc[df_repay[\"Score\"]==x][\"African-American\"].values[0] for x in scores_aa]\n",
    "prob_repay_h = [df_repay.loc[df_repay[\"Score\"]==x][\"Hispanic\"].values[0] for x in scores_h]\n",
    "prob_repay_a = [df_repay.loc[df_repay[\"Score\"]==x][\"Asian\"].values[0] for x in scores_a]\n",
    "\n",
    "repay_c = np.random.binomial(1, prob_repay_c, NUM_SAMPLES)\n",
    "repay_aa = np.random.binomial(1, prob_repay_aa, NUM_SAMPLES)\n",
    "repay_h = np.random.binomial(1, prob_repay_h, NUM_SAMPLES)\n",
    "repay_a = np.random.binomial(1, prob_repay_a, NUM_SAMPLES)\n",
    "\n",
    "scores_c = scores_c/100.0\n",
    "scores_aa = scores_aa/100.0\n",
    "scores_h = scores_h/100.0\n",
    "scores_a = scores_a/100.0"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**Step 2.** Fit beta distributions to the generated data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from scipy.stats import beta\n",
    "import scipy.stats as ss\n",
    "# Step 2\n",
    "a_c1,b_c1,loc_c1,scale_c1 = beta.fit(scores_c[repay_c==1])\n",
    "a_c0,b_c0,loc_c0,scale_c0 = beta.fit(scores_c[repay_c==0])\n",
    "a_aa0,b_aa0,loc_aa0,scale_aa0 = beta.fit(scores_aa[repay_aa==0])\n",
    "a_aa1,b_aa1,loc_aa1,scale_aa1 = beta.fit(scores_aa[repay_aa==1])\n",
    "\n",
    "a_h0,b_h0,loc_h0,scale_h0 = beta.fit(scores_h[repay_h==0])\n",
    "a_h1,b_h1,loc_h1,scale_h1 = beta.fit(scores_h[repay_h==1])\n",
    "a_a0,b_a0,loc_a0,scale_a0 = beta.fit(scores_a[repay_a==0])\n",
    "a_a1,b_a1,loc_a1,scale_a1 = beta.fit(scores_a[repay_a==1])\n",
    "\n",
    "\n",
    "def plot_beta(x_range, a, b, mu=0, sigma=1, cdf=False, **kwargs):\n",
    "    '''\n",
    "    Plots the f distribution function for a given x range, a and b\n",
    "    If mu and sigma are not provided, standard beta is plotted\n",
    "    If cdf=True cumulative distribution is plotted\n",
    "    Passes any keyword arguments to matplotlib plot function\n",
    "    '''\n",
    "    x = x_range\n",
    "    if cdf:\n",
    "        y = ss.beta.cdf(x, a, b, mu, sigma)\n",
    "    else:\n",
    "        y = ss.beta.pdf(x, a, b, mu, sigma)\n",
    "    plt.plot(x, y, **kwargs)\n",
    "\n",
    "x = np.linspace(0, 1, 5000)\n",
    "fig = plt.figure(figsize=(12, 2.5))\n",
    "plt.subplot(1,4,1)\n",
    "plt.ylim(0.1, 11.6)\n",
    "plt.xlim(0, 1)\n",
    "plot_beta(x, a_c1,b_c1, 0, 1, color='green', lw=2, ls='-')\n",
    "plot_beta(x, a_c0,b_c0, 0, 1, color='red', lw=2, ls='-')\n",
    "plot_beta(x,(a_c0+a_c1)/2,(b_c0+b_c1)/2, 0, 1, color='blue', label = 'Fail to improve', lw=2, ls='-')\n",
    "plt.hist(scores_c[repay_c==1], density=True, color = 'green', bins=100, label='repay',alpha=0.5)\n",
    "plt.hist(scores_c[repay_c==0], density=True, bins=100, color = 'red', label='default',alpha=0.5)\n",
    "plt.title(\"Caucasian\")\n",
    "plt.xlabel('Score')\n",
    "plt.legend()\n",
    "plt.subplot(1,4,2)\n",
    "plt.ylim(0.1, 11.6)\n",
    "plt.xlim(0, 1)\n",
    "plot_beta(x, a_aa1,b_aa1, 0, 1, color='green', lw=2, ls='-')\n",
    "plot_beta(x,a_aa0,b_aa0, 0, 1, color='red', lw=2, ls='-')\n",
    "plot_beta(x,(a_aa0+a_aa1)/2,(b_aa0+b_aa1)/2, 0, 1, color='blue', label = 'Fail to improve', lw=2, ls='-')\n",
    "plt.hist(scores_aa[repay_aa==1], density=True, color = 'green', bins=100, label='repay',alpha=0.5)\n",
    "plt.hist(scores_aa[repay_aa==0], density=True, color = 'red', bins=100, label='default',alpha=0.5)\n",
    "plt.title(\"African-American\")\n",
    "plt.xlabel('Score')\n",
    "plt.legend()\n",
    "plt.subplot(1,4,3)\n",
    "plt.ylim(0.1, 11.6)\n",
    "plt.xlim(0, 1)\n",
    "plot_beta(x, a_h1,b_h1, 0, 1, color='green', lw=2, ls='-')\n",
    "plot_beta(x,a_h0,b_h0, 0, 1, color='red', lw=2, ls='-')\n",
    "plot_beta(x,(a_h0+a_h1)/2,(b_h0+b_h1)/2, 0, 1, color='blue', label = 'Fail to improve', lw=2, ls='-')\n",
    "plt.hist(scores_h[repay_h==1], density=True, bins=100, color = 'green', label='repay',alpha=0.5)\n",
    "plt.hist(scores_h[repay_h==0], density=True, bins=100, color = 'red', label='default',alpha=0.5)\n",
    "plt.title(\"Hispanic\")\n",
    "plt.xlabel('Score')\n",
    "plt.legend()\n",
    "plt.subplot(1,4,4)\n",
    "plt.ylim(0.1, 11.6)\n",
    "plt.xlim(0, 1)\n",
    "plot_beta(x, a_a1,b_a1, 0, 1, color='green', lw=2, ls='-')\n",
    "plot_beta(x,a_a0,b_a0, 0, 1, color='red', lw=2, ls='-')\n",
    "plot_beta(x,(a_a0+a_a1)/2,(b_a0+b_a1)/2, 0, 1, color='blue', label = 'Fail to improve', lw=2, ls='-')\n",
    "plt.hist(scores_a[repay_a==1], density=True, bins=100, color = 'green', label='repay',alpha=0.5)\n",
    "plt.hist(scores_a[repay_a==0], density=True, bins=100, color = 'red', label='default',alpha=0.5)\n",
    "plt.title(\"Asian\")\n",
    "plt.xlabel('Score')\n",
    "plt.legend()\n",
    "plt.tight_layout()\n",
    "fig.savefig('score_pdf.pdf')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**Assume $$P^I(\\theta) \\sim Beta(\\frac{a_0+a_1}{2}, \\frac{b_0+b_1}{2}, \\mu, \\sigma)$$**\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "from matplotlib.ticker import LogLocator\n",
    "import warnings\n",
    "warnings.filterwarnings(\"ignore\")\n",
    "\n",
    "def plot_monotone_1(x_range, a0, b0, a1, b1, mu=0, sigma=1, **kwargs):\n",
    "    '''\n",
    "    Plots the f distribution function for a given x range, a and b\n",
    "    If mu and sigma are not provided, standard beta is plotted\n",
    "    If cdf=True cumulative distribution is plotted\n",
    "    Passes any keyword arguments to matplotlib plot function\n",
    "    '''\n",
    "    x = x_range\n",
    "    y0 = ss.beta.pdf(x, a0, b0, mu, sigma)\n",
    "    y1 = ss.beta.pdf(x, a1, b1, mu, sigma)\n",
    "    ratio_10 = y1/y0\n",
    "    plt.plot(x, ratio_10, **kwargs)\n",
    "    plt.yscale('log')\n",
    "\n",
    "def plot_monotone_2(x_range, a0, b0, a1, b1, mu=0, sigma=1, **kwargs):\n",
    "    '''\n",
    "    Plots the f distribution function for a given x range, a and b\n",
    "    If mu and sigma are not provided, standard beta is plotted\n",
    "    If cdf=True cumulative distribution is plotted\n",
    "    Passes any keyword arguments to matplotlib plot function\n",
    "    '''\n",
    "    x = x_range\n",
    "    yi = ss.beta.pdf(x, (a0+a1)/2, (b0+b1)/2, mu, sigma)\n",
    "    y1 = ss.beta.pdf(x, a1, b1, mu, sigma)\n",
    "    ratio_1i = y1/yi\n",
    "    plt.plot(x, ratio_1i, **kwargs)\n",
    "    plt.yscale('log')   \n",
    "    \n",
    "def plot_monotone_3(x_range, a0, b0, a1, b1, mu=0, sigma=1, **kwargs):\n",
    "    '''\n",
    "    Plots the f distribution function for a given x range, a and b\n",
    "    If mu and sigma are not provided, standard beta is plotted\n",
    "    If cdf=True cumulative distribution is plotted\n",
    "    Passes any keyword arguments to matplotlib plot function\n",
    "    '''\n",
    "    x = x_range\n",
    "    yi = ss.beta.pdf(x, (a0+a1)/2, (b0+b1)/2, mu, sigma)\n",
    "    y0 = ss.beta.pdf(x, a0, b0, mu, sigma)\n",
    "    ratio_i0 = yi/y0\n",
    "    plt.plot(x, ratio_i0, **kwargs)\n",
    "    plt.yscale('log')  "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "fig = plt.figure(figsize=(3.5, 3))   \n",
    "ax = fig.add_subplot(111)\n",
    "plt.xlim(0, 1)\n",
    "plt.ylim(0.00001, 10**14)\n",
    "plot_monotone_1(x,a_c0,b_c0,a_c1,b_c1, 0, 1, lw=1.5, ls='-',label='Caucasian')\n",
    "plot_monotone_1(x,a_aa0,b_aa0,a_aa1,b_aa1, 0, 1, lw=1.5, ls='-',label='African-American')\n",
    "plot_monotone_1(x,a_h0,b_h0,a_h1,b_h1, 0, 1,  lw=1.5, ls='-',label='Hispanic')\n",
    "plot_monotone_1(x,a_a0,b_a0,a_a1,b_a1, 0, 1, lw=1.5, ls='-',label='Asian')\n",
    "\n",
    "ax.yaxis.set_major_locator(LogLocator(base=10**13))\n",
    "\n",
    "plt.xlabel('Score')\n",
    "plt.title(r'$\\frac{P_{X|Y,S}(x|1,s)}{P_{X|Y,S}(x|0,s)}$')\n",
    "plt.legend()\n",
    "plt.tight_layout()\n",
    "fig.savefig('p10.pdf')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "fig = plt.figure(figsize=(3.5, 3))   \n",
    "ax = fig.add_subplot(111)\n",
    "plt.xlim(0, 1)\n",
    "plt.ylim(0.00001, 10**14)\n",
    "plot_monotone_2(x,a_c0,b_c0,a_c1,b_c1, 0, 1, lw=1.5, ls='-',label='Caucasian')\n",
    "plot_monotone_2(x,a_aa0,b_aa0,a_aa1,b_aa1, 0, 1, lw=1.5, ls='-',label='African-American')\n",
    "plot_monotone_2(x,a_h0,b_h0,a_h1,b_h1, 0, 1,  lw=1.5, ls='-',label='Hispanic')\n",
    "plot_monotone_2(x,a_a0,b_a0,a_a1,b_a1, 0, 1, lw=1.5, ls='-',label='Asian')\n",
    "\n",
    "ax.yaxis.set_major_locator(LogLocator(base=10**13))\n",
    "\n",
    "plt.xlabel('Score')\n",
    "plt.title(r'$\\frac{P_{X|Y,S}(x|1,s)}{P^I(x)}$')\n",
    "plt.legend()\n",
    "plt.tight_layout()\n",
    "fig.savefig('p1i.pdf')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "fig = plt.figure(figsize=(3.5, 3))   \n",
    "ax = fig.add_subplot(111)\n",
    "plt.xlim(0, 1)\n",
    "plt.ylim(0.00001, 10**14)\n",
    "plot_monotone_3(x,a_c0,b_c0,a_c1,b_c1, 0, 1, lw=1.5, ls='-',label='Caucasian')\n",
    "plot_monotone_3(x,a_aa0,b_aa0,a_aa1,b_aa1, 0, 1, lw=1.5, ls='-',label='African-American')\n",
    "plot_monotone_3(x,a_h0,b_h0,a_h1,b_h1, 0, 1,  lw=1.5, ls='-',label='Hispanic')\n",
    "plot_monotone_3(x,a_a0,b_a0,a_a1,b_a1, 0, 1, lw=1.5, ls='-',label='Asian')\n",
    "\n",
    "ax.yaxis.set_major_locator(LogLocator(base=10**13))\n",
    "\n",
    "plt.xlabel('Score')\n",
    "plt.title(r'$\\frac{P^I(x)}{P_{X|Y,S}(x|0,s)}$')\n",
    "plt.legend()\n",
    "plt.tight_layout()\n",
    "fig.savefig('pi0.pdf')\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### demographic parameters\n",
    "\n",
    "The proportion of each demographic group"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# relative sizes\n",
    "total = df_dm_ratio.iloc[0]['Caucasian']+df_dm_ratio.iloc[0]['African-American']+df_dm_ratio.iloc[0]['Hispanic']+df_dm_ratio.iloc[0]['Asian']\n",
    "P_c = df_dm_ratio.iloc[0]['Caucasian']/total\n",
    "P_aa = df_dm_ratio.iloc[0]['African-American']/total\n",
    "P_h = df_dm_ratio.iloc[0]['Hispanic']/total\n",
    "P_a = df_dm_ratio.iloc[0]['Asian']/total\n",
    "print(P_c,P_aa,P_h,P_a)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "$\\alpha_s$"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "# repayment rates\n",
    "alpha_aa, alpha_c,alpha_h, alpha_asian = np.sum(repay_aa)/NUM_SAMPLES, np.sum(repay_c)/NUM_SAMPLES,np.sum(repay_h)/NUM_SAMPLES, np.sum(repay_a)/NUM_SAMPLES\n",
    "print(alpha_aa, alpha_c,alpha_h, alpha_asian)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Verification of results\n",
    "\n",
    "We do experiments on:\n",
    "\n",
    "1. Caucasian vs African American\n",
    "\n",
    "2. Asian vs Hispanic\n",
    "\n",
    "### 1. (Non)-strategic optimal threshold and utility"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "from scipy.stats import norm\n",
    "eps = 0.5\n",
    "u = 1\n",
    "q = 0.3\n",
    "mu_c = 0\n",
    "std_c = 0.25"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "# scaled utility function & non-strategic optimal threshold \n",
    "def opt_non_strategic(u,alpha,a0,b0,a1,b1):\n",
    "    theta = np.linspace(0,1,10000)\n",
    "    U = (1 - beta.cdf(theta,a1,b1))*alpha*u - (1-beta.cdf(theta,a0,b0))*(1-alpha)*u  \n",
    "    return U, theta[int(np.argmax(U))]\n",
    "    \n",
    "# one group: measure for calculating unfairness\n",
    "def fair_measure(threshold,a0,b0,a1,b1,alpha,fair_type):\n",
    "    if fair_type == \"eqopt\":\n",
    "        return beta.cdf(threshold, a1, b1, 0, 1)\n",
    "    if fair_type == \"dp\":\n",
    "        return beta.cdf(threshold, a1, b1, 0, 1)*alpha + beta.cdf(threshold, a0, b0, 0, 1)*(1-alpha)\n",
    "\n",
    "# Get manipulation Prob\n",
    "def get_manip_prob(theta, q, eps, ai, bi, a1, b1):\n",
    "    \"\"\"\n",
    "    function to get manip prob under q and eps\n",
    "    \"\"\"\n",
    "    value = (1-q)*(beta.cdf(theta, ai, bi, 0, 1) - beta.cdf(theta, a1, b1, 0, 1)) - eps*(1 - beta.cdf(theta, a1, b1, 0, 1))\n",
    "    return norm.cdf(value, mu_c, std_c)   \n",
    "\n",
    "    \n",
    "# Get Phi, which is strategic - non-strategic\n",
    "def get_Phi(u, alpha, theta, q, eps, a0, b0, ai, bi, a1, b1, k1 = 1, k2 = 1, k3 = 1):\n",
    "    \"\"\"\n",
    "    Get Phi, which is strategic - non-strategic\n",
    "    k1, k2, k3 measure our preferences for 3 kinds of behaviors\n",
    "    larger k1 means we prefer improvement\n",
    "    larger k2 means we do not prefer failure of improvement\n",
    "    larger k3 means we do not prefer manipulation\n",
    "    k1=k2=k3=1 is the naive difference\n",
    "    \"\"\"\n",
    "    # manipulation probability\n",
    "    pm = get_manip_prob(theta, q, eps, ai, bi, a1, b1)\n",
    "    # Reverse Benefit\n",
    "    b_1 = k1*(1-pm)*q*(2 - beta.cdf(theta, a0, b0, 0, 1) - beta.cdf(theta, a1, b1, 0, 1))\n",
    "   \n",
    "    # Loss of Failure of Improvement \n",
    "    l_1 = k2*(1-pm)*(1-q)*(beta.cdf(theta, a0, b0, 0, 1) - beta.cdf(theta, ai, bi, 0, 1))\n",
    "    # Loss of manipulation\n",
    "    \n",
    "    l_2 = k3*pm*((1-eps)*(1 - beta.cdf(theta, a1, b1, 0, 1))-(1-beta.cdf(theta, a0, b0, 0, 1)))\n",
    "    \n",
    "    return u*(1-alpha)*(b_1-l_1-l_2)\n",
    "    \n",
    "def get_strat_utility(u, alpha, theta, q, eps, a0, b0, ai, bi, a1, b1, k1 = 1, k2 = 1, k3 = 1):\n",
    "    theta_grid, k1_grid = np.meshgrid(theta, k1, indexing='ij')\n",
    "    def comp(tta, k_1):\n",
    "        phi = get_Phi(u, alpha, tta, q, eps, a0, b0, ai, bi, a1, b1, k_1, k2, k3)\n",
    "        U = (1 - beta.cdf(tta,a1,b1))*alpha*u - (1 - beta.cdf(tta,a0,b0))*(1-alpha)*u + phi\n",
    "        return U\n",
    "    vectorized_compute_U = np.vectorize(comp)\n",
    "    U_values = vectorized_compute_U(theta_grid, k1_grid)\n",
    "    max_U_indices = np.argmax(U_values, axis=0)\n",
    "    theta_max_U = theta_grid[max_U_indices, np.arange(len(k1_list))]\n",
    "    max_U_values = U_values[max_U_indices, np.arange(len(k1_list))]\n",
    "    \n",
    "    return max_U_values, theta_max_U\n",
    "\n",
    "\n",
    "def get_strat_optimal(u, alpha, q, eps, a0, b0, ai, bi, a1, b1, k1=1, k2=1, k3=1):\n",
    "    theta = np.linspace(0,1,1000)\n",
    "    return get_strat_utility(u = u, alpha = alpha, theta = theta, q = q, eps = eps, a0 = a0, b0 = b0, ai = ai, bi = bi, a1 = a1, b1 = b1, k1 = k1, k2 = k2, k3 = k3)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(a_c0,b_c0,a_c1,b_c1)\n",
    "print(a_aa0,b_aa0,a_aa1,b_aa1)\n",
    "print(a_h0,b_h0,a_h1,b_h1)\n",
    "print(a_a0,b_a0,a_a1,b_a1)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**(1)**. Threshold for Caucasian and African American"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**Caucasian**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "metadata": {},
   "outputs": [],
   "source": [
    "def vary_eps(u, alpha, a0, b0, ai, bi, a1, b1, k1 = 1, k2 = 1, k3 = 1, q_list = [0,0.3,0.6,1], eps_list = np.linspace(0,1,100), ):\n",
    "    opt_no = opt_non_strategic(u,alpha,a0,b0,a1,b1)[1]\n",
    "    for i in range(len(q_list)):\n",
    "        q = q_list[i]\n",
    "        x = np.zeros(100)\n",
    "        ul = np.zeros(100)\n",
    "        m = np.zeros(100)\n",
    "        j = 0\n",
    "        for eps in eps_list:\n",
    "            u1, x1 = get_strat_optimal(u, alpha, q, eps, a0, b0, ai, bi, a1, b1, k1, k2, k3)\n",
    "            u1 = u1[int(np.argmax(u1))]\n",
    "            x[j] = x1\n",
    "            ul[j] = u1\n",
    "            m[j] = get_manip_prob(x1, q, eps, ai, bi, a1, b1)\n",
    "            j += 1\n",
    "        df = pd.DataFrame({'eps': np.linspace(0,1,100), 'theta_max': x, 'max utility': ul, 'manipulation prob': m})\n",
    "        axes[int(i/2)][int(i%2)].tick_params(axis='both', which='major', labelsize=12)\n",
    "        axes[int(i/2)][int(i%2)].plot(df['eps'], df['theta_max'],'r-', alpha=0.6, label='strategic optimal')\n",
    "        axes[int(i/2)][int(i%2)].plot(np.linspace(0,1,100), [opt_no]*100, 'b-', label = 'non-strategic optimal')\n",
    "        axes[int(i/2)][int(i%2)].set_xlabel(r'$\\epsilon$',fontsize = 12)\n",
    "        axes[int(i/2)][int(i%2)].set_ylabel(r'$\\theta$',fontsize=12)\n",
    "        axes[int(i/2)][int(i%2)].legend(fontsize = 11)\n",
    "        axes[int(i/2)][int(i%2)].set_title('q = %.2f'%q, fontsize=11)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "scrolled": false
   },
   "outputs": [],
   "source": [
    "fig, axes = plt.subplots(2,2)\n",
    "fig.set_size_inches(8, 6)\n",
    "vary_eps(u, alpha_c, a_c0, b_c0, (a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1)\n",
    "plt.tight_layout()\n",
    "fig.savefig('Caucasian.pdf')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**African American**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "fig, axes = plt.subplots(2,2)\n",
    "fig.set_size_inches(8, 6)\n",
    "vary_eps(u, alpha_aa, a_aa0, b_aa0, (a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1)\n",
    "plt.tight_layout()\n",
    "fig.savefig('AA.pdf')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**(2) Effects of varying k_1, k_2** \n",
    "\n",
    "Plot the manipulation probability"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {},
   "outputs": [],
   "source": [
    "uhat_c = opt_non_strategic(u,alpha_c,a_c0,b_c0,a_c1,b_c1)[1]\n",
    "uhat_aa = opt_non_strategic(u,alpha_aa,a_aa0,b_aa0,a_aa1,b_aa1)[1]\n",
    "theta_c_list, _ = get_strat_optimal(u, alpha_c, q, eps, a_c0, b_c0, (a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1, k1_list)\n",
    "strat_func = np.vectorize(get_strat_optimal, excluded=['u', 'alpha', 'q', 'eps', 'a0', 'b0', 'ai', 'bi', 'a1', 'b1', 'k2', 'k3'])\n",
    "theta_aa_list, _ = get_strat_optimal(u, alpha_aa, q, eps, a_aa0, b_aa0, (a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1, k1_list)\n",
    "u_c = theta_c_list[0]\n",
    "u_aa = theta_aa_list[0]\n",
    "q = 0.3\n",
    "eps = 0.5"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "scrolled": false
   },
   "outputs": [],
   "source": [
    "# plot manipulation probability\n",
    "x = np.linspace(0,1,100)\n",
    "plt.figure(figsize = (4,3))\n",
    "plt.xticks(fontsize = 14)\n",
    "plt.yticks(fontsize = 14)\n",
    "prob1 = get_manip_prob(x,q,eps,(a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1)\n",
    "prob2 = get_manip_prob(x,q, eps, (a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1)\n",
    "plt.plot(x,prob1,label = r'$P_M$ (Caucasian)')\n",
    "plt.plot(x,prob2,label = r'$P_M$ (African American)')\n",
    "prob_a = get_manip_prob(u_c, q, eps, (a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1)\n",
    "prob_b = get_manip_prob(u_aa,q, eps, (a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1)\n",
    "plt.plot(u_c, prob_a,  marker=\"o\", markersize=10, color = 'orange',label = r'$P_M(\\theta_c^*)$')\n",
    "plt.plot(u_aa, prob_b, marker=\"o\", markersize=10, color = 'green',label = r'$P_M(\\theta_{aa}^*)$')\n",
    "plt.xlabel(r'$\\theta$',fontsize = 14)\n",
    "plt.ylabel(r'$P_M(\\theta^*)$',fontsize = 14)\n",
    "plt.legend()\n",
    "plt.tight_layout()\n",
    "plt.savefig('manipcurve_c_aa.pdf')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [],
   "source": [
    "def non_strat_utility(u,alpha,theta,a0,b0,a1,b1):\n",
    "    U = (1 - beta.cdf(theta,a1,b1))*alpha*u - (1-beta.cdf(theta,a0,b0))*(1-alpha)*u  \n",
    "    return U\n",
    "\n",
    "k1_list = np.linspace(1,2,5)\n",
    "_, theta_c_list = get_strat_optimal(u, alpha_c, q, eps, a_c0, b_c0, (a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1, k1_list)\n",
    "phi_func = np.vectorize(get_Phi, excluded = ['u', 'alpha', 'q', 'eps', 'a0', 'b0', 'ai', 'bi', 'a1', 'b1', 'k1','k2','k3'])\n",
    "nonstrat_func = np.vectorize(non_strat_utility, excluded = ['u','alpha','a0','b0','a1','b1'])\n",
    "utility_c_list = phi_func(u, alpha_c, theta_c_list, q, eps, a_c0, b_c0, (a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1) + nonstrat_func(u, alpha_c, theta_c_list, a_c0, b_c0,a_c1, b_c1)\n",
    "utility_c_non = [get_Phi(u, alpha_c, uhat_c, q, eps, a_c0, b_c0, (a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1) + non_strat_utility(u, alpha_c, uhat_c, a_c0, b_c0,a_c1, b_c1)]*5\n",
    "manip_list_c = get_manip_prob(theta_c_list,q,eps,(a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1)\n",
    "cdf_c = np.array([fair_measure(theta, a_c0, b_c0, a_c1, b_c1, alpha_c, 'dp') for theta in theta_c_list])\n",
    "manip_hat_c = get_manip_prob(uhat_c,q,eps,(a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1)\n",
    "cdf_c_hat = fair_measure(uhat_c, a_c0, b_c0, a_c1, b_c1, alpha_c, 'dp')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "theta_c_list"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 116,
   "metadata": {},
   "outputs": [],
   "source": [
    "k1_list = np.linspace(1,2,5)\n",
    "strat_func = np.vectorize(get_strat_optimal, excluded=['u', 'alpha', 'q', 'eps', 'a0', 'b0', 'ai', 'bi', 'a1', 'b1', 'k2', 'k3'])\n",
    "_, theta_aa_list = get_strat_optimal(u, alpha_aa, q, eps, a_aa0, b_aa0, (a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1, k1_list)\n",
    "phi_func = np.vectorize(get_Phi, excluded = ['u', 'alpha', 'q', 'eps', 'a0', 'b0', 'ai', 'bi', 'a1', 'b1', 'k1','k2','k3'])\n",
    "nonstrat_func = np.vectorize(non_strat_utility, excluded = ['u','alpha','a0','b0','a1','b1'])\n",
    "utility_aa_list = phi_func(u, alpha_aa, theta_aa_list, q, eps, a_aa0, b_aa0, (a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1) + nonstrat_func(u, alpha_aa, theta_aa_list, a_aa0, b_aa0,a_aa1, b_aa1)\n",
    "utility_aa_non = [get_Phi(u, alpha_aa, uhat_aa, q, eps, a_aa0, b_aa0, (a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1) + non_strat_utility(u, alpha_aa, uhat_aa, a_aa0, b_aa0,a_aa1, b_aa1)]*5\n",
    "manip_list_aa = get_manip_prob(theta_aa_list,q,eps,(a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1)\n",
    "cdf_aa = np.array([fair_measure(theta, a_aa0, b_aa0, a_aa1, b_aa1, alpha_aa, 'dp') for theta in theta_aa_list])\n",
    "manip_hat_aa = get_manip_prob(uhat_aa,q,eps,(a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1)\n",
    "cdf_aa_hat = fair_measure(uhat_aa, a_aa0, b_aa0, a_aa1, b_aa1, alpha_aa, 'dp')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# can output every metric\n",
    "# example for unfairness\n",
    "cdf_aa - cdf_c"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# plot optimal threshold, (non)-strategic utility, and manipulation probability\n",
    "x = k1_list\n",
    "fig, axes = plt.subplots(2,1)\n",
    "fig.set_size_inches(4, 7)\n",
    "axes[0].tick_params(axis='both', which='major', labelsize=14)\n",
    "axes[1].tick_params(axis='both', which='major', labelsize=14)\n",
    "axes[0].plot(x,manip_list_c, marker = 'o',label = r'$P_M(\\theta^*(k_1))$',linestyle = 'dotted',color = 'blue')\n",
    "axes[0].plot(x,utility_c_list,marker = 'o',label = r'strategic utility',linestyle = 'solid',color = 'blue')\n",
    "axes[0].plot(x,cdf_c, marker = 'o',label = r'$F_{X|S}(\\theta|s)$',linestyle = 'dotted',color = 'green')\n",
    "axes[0].plot(x, utility_c_non, marker = 'o', label = r'non-strategic utility',linestyle = 'solid',color = 'red')\n",
    "axes[0].plot(x, [manip_hat_c]*5,marker = 'o',label = r'$P_M(\\widehat{\\theta}^*)$',linestyle = 'dotted',color = 'red')\n",
    "# axes[0].plot(x, [cdf_c_hat]*5,label = r'$F_{X|Y,S}(\\widehat{theta}^*|1,s)$')\n",
    "axes[0].set_xlabel(r'$k_1$ normalized by $u(1-\\alpha)$', fontsize = 12)\n",
    "axes[0].set_ylabel(r'value', fontsize = 12)\n",
    "axes[0].legend(fontsize = 10)\n",
    "axes[0].set_title('Caucasian',fontsize = 12)\n",
    "\n",
    "axes[1].plot(x,manip_list_aa, marker = 'o',label = r'$P_M(\\theta^*(k_1))$',linestyle = 'dotted',color = 'blue')\n",
    "axes[1].plot(x,utility_aa_list,marker = 'o',label = r'strategic utility',linestyle = 'solid',color = 'blue')\n",
    "axes[1].plot(x,cdf_aa, marker = 'o',label = r'$F_{X|S}(\\theta|s)$',linestyle = 'dotted',color = 'green')\n",
    "axes[1].plot(x, utility_aa_non ,marker = 'o',label = r'non-strategic utility',linestyle = 'solid',color = 'red')\n",
    "axes[1].plot(x, [manip_hat_aa]*5,marker = 'o',label = r'$P_M(\\widehat{\\theta}^*)$',linestyle = 'dotted',color = 'red')\n",
    "# axes[1].plot(x, [cdf_aa_hat]*5,label = r'$F_{X|Y,S}(\\widehat{\\theta}^*|1,s)$')\n",
    "axes[1].set_xlabel(r'$k_1$ normalized by $u(1-\\alpha)$', fontsize = 12)\n",
    "axes[1].set_ylabel(r'value', fontsize = 12)\n",
    "axes[1].legend(fontsize = 10)\n",
    "axes[1].set_title('African American',fontsize = 12)\n",
    "plt.tight_layout()\n",
    "fig.savefig('fairness_caa_dp.pdf')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**(2) Asian and Hispanic**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [],
   "source": [
    "# scaled utility function & non-strategic optimal threshold \n",
    "def opt_non_strategic(u,alpha,a0,b0,a1,b1):\n",
    "    theta = np.linspace(0,1,10000)\n",
    "    U = (1 - beta.cdf(theta,a1,b1))*alpha*u - (1-beta.cdf(theta,a0,b0))*(1-alpha)*u  \n",
    "    return U, theta[int(np.argmax(U))]\n",
    "    \n",
    "# one group: measure for calculating unfairness\n",
    "def fair_measure(threshold,a0,b0,a1,b1,alpha,fair_type):\n",
    "    if fair_type == \"eqopt\":\n",
    "        return beta.cdf(threshold, a1, b1, 0, 1)\n",
    "    if fair_type == \"dp\":\n",
    "        return beta.cdf(threshold, a1, b1, 0, 1)*alpha + beta.cdf(threshold, a0, b0, 0, 1)*(1-alpha)\n",
    "\n",
    "# Get manipulation Prob\n",
    "def get_manip_prob(theta, q, eps, ai, bi, a1, b1):\n",
    "    \"\"\"\n",
    "    function to get manip prob under q and eps\n",
    "    \"\"\"\n",
    "    value = (1-q)*(beta.cdf(theta, ai, bi, 0, 1) - beta.cdf(theta, a1, b1, 0, 1)) - eps*(1 - beta.cdf(theta, a1, b1, 0, 1))\n",
    "    return norm.cdf(value, mu_c, std_c)   \n",
    "\n",
    "    \n",
    "# Get Phi, which is strategic - non-strategic\n",
    "def get_Phi(u, alpha, theta, q, eps, a0, b0, ai, bi, a1, b1, k1 = 1, k2 = 1, k3 = 1):\n",
    "    \"\"\"\n",
    "    Get Phi, which is strategic - non-strategic\n",
    "    k1, k2, k3 measure our preferences for 3 kinds of behaviors\n",
    "    larger k1 means we prefer improvement\n",
    "    larger k2 means we do not prefer failure of improvement\n",
    "    larger k3 means we do not prefer manipulation\n",
    "    k1=k2=k3=1 is the naive difference\n",
    "    \"\"\"\n",
    "    # manipulation probability\n",
    "    pm = get_manip_prob(theta, q, eps, ai, bi, a1, b1)\n",
    "    # Reverse Benefit\n",
    "    b_1 = k1*(1-pm)*q*(2 - beta.cdf(theta, a0, b0, 0, 1) - beta.cdf(theta, a1, b1, 0, 1))\n",
    "   \n",
    "    # Loss of Failure of Improvement \n",
    "    l_1 = k2*(1-pm)*(1-q)*(beta.cdf(theta, a0, b0, 0, 1) - beta.cdf(theta, ai, bi, 0, 1))\n",
    "    # Loss of manipulation\n",
    "    \n",
    "    l_2 = k3*pm*((1-eps)*(1 - beta.cdf(theta, a1, b1, 0, 1))-(1-beta.cdf(theta, a0, b0, 0, 1)))\n",
    "    \n",
    "    return u*(1-alpha)*(b_1-l_1-l_2)\n",
    "    \n",
    "def get_strat_utility(u, alpha, theta, q, eps, a0, b0, ai, bi, a1, b1, k1 = 1, k2 = 1, k3 = 1):\n",
    "    phi = get_Phi(u, alpha, theta, q, eps, a0, b0, ai, bi, a1, b1, k1, k2, k3)\n",
    "    U = (1 - beta.cdf(theta,a1,b1))*alpha*u - (1 - beta.cdf(theta,a0,b0))*(1-alpha)*u + phi\n",
    "    return U\n",
    "\n",
    "def get_strat_optimal(u, alpha, q, eps, a0, b0, ai, bi, a1, b1, k1=1, k2=1, k3=1):\n",
    "    theta = np.linspace(0,1,10000)\n",
    "    U = get_strat_utility(u = u, alpha = alpha, theta = theta, q = q, eps = eps, a0 = a0, b0 = b0, ai = ai, bi = bi, a1 = a1, b1 = b1, k1 = k1, k2 = k2, k3 = k3)\n",
    "    return U, theta[int(np.argmax(U))]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "fig, axes = plt.subplots(2,2)\n",
    "fig.set_size_inches(8, 6)\n",
    "vary_eps(u, alpha_asian, a_a0, b_a0, (a_a0+a_a1)/2, (b_a0+b_a1)/2, a_a1, b_a1)\n",
    "plt.tight_layout()\n",
    "fig.savefig('Asian.pdf')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "fig, axes = plt.subplots(2,2)\n",
    "fig.set_size_inches(8, 6)\n",
    "vary_eps(u, alpha_h, a_h0, b_h0, (a_h0+a_h1)/2, (b_h0+b_h1)/2, a_h1, b_h1)\n",
    "plt.tight_layout()\n",
    "fig.savefig('Hispanic.pdf')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_strat_utility(u, alpha, theta, q, eps, a0, b0, ai, bi, a1, b1, k1 = 1, k2 = 1, k3 = 1):\n",
    "    theta_grid, k1_grid = np.meshgrid(theta, k1, indexing='ij')\n",
    "    def comp(tta, k_1):\n",
    "        phi = get_Phi(u, alpha, tta, q, eps, a0, b0, ai, bi, a1, b1, k_1, k2, k3)\n",
    "        U = (1 - beta.cdf(tta,a1,b1))*alpha*u - (1 - beta.cdf(tta,a0,b0))*(1-alpha)*u + phi\n",
    "        return U\n",
    "    vectorized_compute_U = np.vectorize(comp)\n",
    "    U_values = vectorized_compute_U(theta_grid, k1_grid)\n",
    "    max_U_indices = np.argmax(U_values, axis=0)\n",
    "    theta_max_U = theta_grid[max_U_indices, np.arange(len(k1_list))]\n",
    "    max_U_values = U_values[max_U_indices, np.arange(len(k1_list))]\n",
    "    \n",
    "    return max_U_values, theta_max_U\n",
    "\n",
    "\n",
    "def get_strat_optimal(u, alpha, q, eps, a0, b0, ai, bi, a1, b1, k1=1, k2=1, k3=1):\n",
    "    theta = np.linspace(0,1,1000)\n",
    "    return get_strat_utility(u = u, alpha = alpha, theta = theta, q = q, eps = eps, a0 = a0, b0 = b0, ai = ai, bi = bi, a1 = a1, b1 = b1, k1 = k1, k2 = k2, k3 = k3)\n",
    "\n",
    "uhat_a = opt_non_strategic(u,alpha_asian,a_a0,b_a0,a_a1,b_a1)[1]\n",
    "uhat_h = opt_non_strategic(u,alpha_h,a_h0,b_h0,a_h1,b_h1)[1]\n",
    "theta_a_list, _ = get_strat_optimal(u, alpha_asian, q, eps, a_a0, b_a0, (a_a0+a_a1)/2, (b_a0+b_a1)/2, a_a1, b_a1, k1_list)\n",
    "strat_func = np.vectorize(get_strat_optimal, excluded=['u', 'alpha', 'q', 'eps', 'a0', 'b0', 'ai', 'bi', 'a1', 'b1', 'k2', 'k3'])\n",
    "theta_h_list, _ = get_strat_optimal(u, alpha_h, q, eps, a_h0, b_h0, (a_h0+a_h1)/2, (b_h0+b_h1)/2, a_h1, b_h1, k1_list)\n",
    "u_a = theta_a_list[0]\n",
    "u_h = theta_h_list[0]\n",
    "q = 0.3\n",
    "eps = 0.5"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# plot manipulation probability\n",
    "x = np.linspace(0,1,100)\n",
    "plt.figure(figsize = (4,3))\n",
    "plt.xticks(fontsize = 14)\n",
    "plt.yticks(fontsize = 14)\n",
    "prob1 = get_manip_prob(x,q,eps,(a_a0+a_a1)/2, (b_a0+b_a1)/2, a_a1, b_a1)\n",
    "prob2 = get_manip_prob(x,q, eps, (a_h0+a_h1)/2, (b_h0+b_h1)/2, a_h1, b_h1)\n",
    "plt.plot(x,prob1,label = r'$P_M$ curve for Asian')\n",
    "plt.plot(x,prob2,label = r'$P_M$ curve for Hispanic')\n",
    "prob_a = get_manip_prob(u_a, q, eps, (a_a0+a_a1)/2, (b_a0+b_a1)/2, a_a1, b_a1)\n",
    "prob_b = get_manip_prob(u_h,q, eps, (a_h0+a_h1)/2, (b_h0+b_h1)/2, a_h1, b_h1)\n",
    "plt.plot(u_a, prob_a,  marker=\"o\", markersize=10, label = r'$P_M(\\theta_a^*)$')\n",
    "plt.plot(u_h, prob_b, marker=\"o\", markersize=10, label = r'$P_M(\\theta_h^*)$')\n",
    "plt.xlabel(r'$\\theta$',fontsize = 14)\n",
    "plt.ylabel(r'$P_M(\\theta^*)$',fontsize = 14)\n",
    "plt.legend()\n",
    "plt.tight_layout()\n",
    "plt.savefig('manipcurve_a_h.pdf')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "k1_list = np.linspace(1,2,5)\n",
    "_, theta_a_list = get_strat_optimal(u, alpha_asian, q, eps, a_a0, b_a0, (a_a0+a_a1)/2, (b_a0+b_a1)/2, a_a1, b_a1, k1_list)\n",
    "phi_func = np.vectorize(get_Phi, excluded = ['u', 'alpha', 'q', 'eps', 'a0', 'b0', 'ai', 'bi', 'a1', 'b1', 'k1','k2','k3'])\n",
    "nonstrat_func = np.vectorize(non_strat_utility, excluded = ['u','alpha','a0','b0','a1','b1'])\n",
    "utility_a_list = phi_func(u, alpha_asian, theta_a_list, q, eps, a_a0, b_a0, (a_a0+a_a1)/2, (b_a0+b_a1)/2, a_a1, b_a1) + nonstrat_func(u, alpha_asian, theta_a_list, a_a0, b_a0,a_a1, b_a1)\n",
    "utility_a_non = [get_Phi(u, alpha_asian, uhat_a, q, eps, a_a0, b_a0, (a_a0+a_a1)/2, (b_a0+b_a1)/2, a_a1, b_a1) + non_strat_utility(u, alpha_asian, uhat_a, a_a0, b_a0,a_a1, b_a1)]*5\n",
    "manip_list_a = get_manip_prob(theta_a_list,q,eps,(a_a0+a_a1)/2, (b_a0+b_a1)/2, a_a1, b_a1)\n",
    "cdf_a = np.array([fair_measure(theta, a_a0, b_a0, a_a1, b_a1, alpha_asian, 'dp') for theta in theta_a_list])\n",
    "manip_hat_a = get_manip_prob(uhat_a,q,eps,(a_a0+a_a1)/2, (b_a0+b_a1)/2, a_a1, b_a1)\n",
    "cdf_a_hat = fair_measure(uhat_a, a_a0, b_a0, a_a1, b_a1, alpha_asian, 'dp')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "metadata": {},
   "outputs": [],
   "source": [
    "k1_list = np.linspace(1,2,5)\n",
    "_, theta_h_list = get_strat_optimal(u, alpha_h, q, eps, a_h0, b_h0, (a_h0+a_h1)/2, (b_h0+b_h1)/2, a_h1, b_h1, k1_list)\n",
    "phi_func = np.vectorize(get_Phi, excluded = ['u', 'alpha', 'q', 'eps', 'a0', 'b0', 'ai', 'bi', 'a1', 'b1', 'k1','k2','k3'])\n",
    "nonstrat_func = np.vectorize(non_strat_utility, excluded = ['u','alpha','a0','b0','a1','b1'])\n",
    "utility_h_list = phi_func(u, alpha_h, theta_h_list, q, eps, a_h0, b_h0, (a_h0+a_h1)/2, (b_h0+b_h1)/2, a_h1, b_h1) + nonstrat_func(u, alpha_h, theta_h_list, a_h0, b_h0,a_h1, b_h1)\n",
    "utility_h_non = [get_Phi(u, alpha_h, uhat_h, q, eps, a_h0, b_h0, (a_h0+a_h1)/2, (b_h0+b_h1)/2, a_h1, b_h1) + non_strat_utility(u, alpha_h, uhat_h, a_h0, b_h0,a_h1, b_h1)]*5\n",
    "manip_list_h = get_manip_prob(theta_h_list,q,eps,(a_h0+a_h1)/2, (b_h0+b_h1)/2, a_h1, b_h1)\n",
    "cdf_h = np.array([fair_measure(theta, a_h0, b_h0, a_h1, b_h1, alpha_h, 'dp') for theta in theta_h_list])\n",
    "manip_hat_h = get_manip_prob(uhat_h,q,eps,(a_h0+a_h1)/2, (b_h0+b_h1)/2, a_h1, b_h1)\n",
    "cdf_h_hat = fair_measure(uhat_h, a_h0, b_h0, a_h1, b_h1, alpha_h, 'dp')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# plot optimal threshold, (non)-strategic utility, and manipulation probability\n",
    "x = k1_list\n",
    "fig, axes = plt.subplots(2,1)\n",
    "fig.set_size_inches(4, 7)\n",
    "axes[0].tick_params(axis='both', which='major')\n",
    "axes[1].tick_params(axis='both', which='major')\n",
    "axes[0].plot(x,manip_list_a, marker = 'o',label = r'$P_M(\\theta^*(k_1))$',linestyle = 'dotted',color = 'blue')\n",
    "axes[0].plot(x,utility_a_list,marker = 'o',label = r'strategic utility',linestyle = 'solid',color = 'blue')\n",
    "axes[0].plot(x,cdf_a, marker = 'o',label = r'$F_{X|Y,S}(\\theta|1,s)$',linestyle = 'dotted',color = 'green')\n",
    "axes[0].plot(x, utility_a_non, marker = 'o',label = r'non-strategic utility',linestyle = 'solid',color = 'red')\n",
    "axes[0].plot(x, [manip_hat_a]*5,marker = 'o',label = r'$P_M(\\widehat{\\theta}^*)$',linestyle = 'dotted',color = 'red')\n",
    "axes[0].set_xlabel(r'$k_1$ normalized by $u(1-\\alpha)$',fontsize = 12)\n",
    "axes[0].set_ylabel(r'value',fontsize = 12)\n",
    "axes[0].legend()\n",
    "axes[0].set_title('Asian')\n",
    "\n",
    "axes[1].plot(x,manip_list_h, marker = 'o',label = r'$P_M(\\theta^*(k_1))$',linestyle = 'dotted',color = 'blue')\n",
    "axes[1].plot(x,utility_h_list,marker = 'o',label = r'strategic utility',linestyle = 'solid',color = 'blue')\n",
    "axes[1].plot(x,cdf_h, marker = 'o',label = r'$F_{X|Y,S}(\\theta|1,s)$',linestyle = 'dotted',color = 'green')\n",
    "axes[1].plot(x, utility_h_non, marker= 'o', label = r'non-strategic utility',linestyle = 'solid',color = 'red')\n",
    "axes[1].plot(x, [manip_hat_h]*5,marker = 'o',label = r'$P_M(\\widehat{\\theta}^*)$',linestyle = 'dotted',color = 'red')\n",
    "axes[1].set_xlabel(r'$k_1$ normalized by $u(1-\\alpha)$',fontsize = 12)\n",
    "axes[1].set_ylabel(r'value',fontsize = 12)\n",
    "axes[1].legend()\n",
    "axes[1].set_title('Hispanic')\n",
    "\n",
    "plt.tight_layout()\n",
    "\n",
    "fig.savefig('fairness_ah_dp.pdf')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### EQOPT"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "k1_list = np.linspace(1,2,5)\n",
    "_, theta_a_list = get_strat_optimal(u, alpha_asian, q, eps, a_a0, b_a0, (a_a0+a_a1)/2, (b_a0+b_a1)/2, a_a1, b_a1, k1_list)\n",
    "phi_func = np.vectorize(get_Phi, excluded = ['u', 'alpha', 'q', 'eps', 'a0', 'b0', 'ai', 'bi', 'a1', 'b1', 'k1','k2','k3'])\n",
    "nonstrat_func = np.vectorize(non_strat_utility, excluded = ['u','alpha','a0','b0','a1','b1'])\n",
    "utility_a_list = phi_func(u, alpha_asian, theta_a_list, q, eps, a_a0, b_a0, (a_a0+a_a1)/2, (b_a0+b_a1)/2, a_a1, b_a1) + nonstrat_func(u, alpha_asian, theta_a_list, a_a0, b_a0,a_a1, b_a1)\n",
    "utility_a_non = [get_Phi(u, alpha_asian, uhat_a, q, eps, a_a0, b_a0, (a_a0+a_a1)/2, (b_a0+b_a1)/2, a_a1, b_a1) + non_strat_utility(u, alpha_asian, uhat_a, a_a0, b_a0,a_a1, b_a1)]*5\n",
    "manip_list_a = get_manip_prob(theta_a_list,q,eps,(a_a0+a_a1)/2, (b_a0+b_a1)/2, a_a1, b_a1)\n",
    "cdf_a = np.array([fair_measure(theta, a_a0, b_a0, a_a1, b_a1, alpha_asian, 'eqopt') for theta in theta_a_list])\n",
    "manip_hat_a = get_manip_prob(uhat_a,q,eps,(a_a0+a_a1)/2, (b_a0+b_a1)/2, a_a1, b_a1)\n",
    "cdf_a_hat = fair_measure(uhat_a, a_a0, b_a0, a_a1, b_a1, alpha_asian, 'eqopt')\n",
    "\n",
    "k1_list = np.linspace(1,2,5)\n",
    "_, theta_h_list = get_strat_optimal(u, alpha_h, q, eps, a_h0, b_h0, (a_h0+a_h1)/2, (b_h0+b_h1)/2, a_h1, b_h1, k1_list)\n",
    "phi_func = np.vectorize(get_Phi, excluded = ['u', 'alpha', 'q', 'eps', 'a0', 'b0', 'ai', 'bi', 'a1', 'b1', 'k1','k2','k3'])\n",
    "nonstrat_func = np.vectorize(non_strat_utility, excluded = ['u','alpha','a0','b0','a1','b1'])\n",
    "utility_h_list = phi_func(u, alpha_h, theta_h_list, q, eps, a_h0, b_h0, (a_h0+a_h1)/2, (b_h0+b_h1)/2, a_h1, b_h1) + nonstrat_func(u, alpha_h, theta_h_list, a_h0, b_h0,a_h1, b_h1)\n",
    "utility_h_non = [get_Phi(u, alpha_h, uhat_h, q, eps, a_h0, b_h0, (a_h0+a_h1)/2, (b_h0+b_h1)/2, a_h1, b_h1) + non_strat_utility(u, alpha_h, uhat_h, a_h0, b_h0,a_h1, b_h1)]*5\n",
    "manip_list_h = get_manip_prob(theta_h_list,q,eps,(a_h0+a_h1)/2, (b_h0+b_h1)/2, a_h1, b_h1)\n",
    "cdf_h = np.array([fair_measure(theta, a_h0, b_h0, a_h1, b_h1, alpha_h, 'eqopt') for theta in theta_h_list])\n",
    "manip_hat_h = get_manip_prob(uhat_h,q,eps,(a_h0+a_h1)/2, (b_h0+b_h1)/2, a_h1, b_h1)\n",
    "cdf_h_hat = fair_measure(uhat_h, a_h0, b_h0, a_h1, b_h1, alpha_h, 'eqopt')\n",
    "\n",
    "# plot optimal threshold, (non)-strategic utility, and manipulation probability\n",
    "x = k1_list\n",
    "fig, axes = plt.subplots(1,2)\n",
    "fig.set_size_inches(7, 3)\n",
    "axes[0].tick_params(axis='both', which='major', labelsize=14)\n",
    "axes[1].tick_params(axis='both', which='major', labelsize=14)\n",
    "axes[0].plot(x,manip_list_a, marker = 'o',label = r'$P_M(\\theta^*(k_1))$',linestyle = 'dotted',color = 'blue')\n",
    "axes[0].plot(x,utility_a_list,marker = 'o',label = r'strategic utility',linestyle = 'solid',color = 'blue')\n",
    "axes[0].plot(x,cdf_a, marker = 'o',label = r'$F_{X|Y,S}(\\theta|1,s)$',linestyle = 'dotted',color = 'green')\n",
    "axes[0].plot(x, utility_a_non, marker = 'o',label = r'non-strategic utility',linestyle = 'solid',color = 'red')\n",
    "axes[0].plot(x, [manip_hat_a]*5,marker = 'o',label = r'$P_M(\\widehat{\\theta}^*)$',linestyle = 'dotted',color = 'red')\n",
    "axes[0].set_xlabel(r'$k_1$ normalized by $u(1-\\alpha)$',fontsize=12)\n",
    "axes[0].set_ylabel(r'value',fontsize = 12)\n",
    "axes[0].set_title('Asian')\n",
    "\n",
    "axes[1].plot(x,manip_list_h, marker = 'o',label = r'$P_M(\\theta^*(k_1))$',linestyle = 'dotted',color = 'blue')\n",
    "axes[1].plot(x,utility_h_list,marker = 'o',label = r'strategic utility',linestyle = 'solid',color = 'blue')\n",
    "axes[1].plot(x,cdf_h, marker = 'o',label = r'$F_{X|Y,S}(\\theta|1,s)$',linestyle = 'dotted',color = 'green')\n",
    "axes[1].plot(x, utility_h_non, marker= 'o', label = r'non-strategic utility',linestyle = 'solid',color = 'red')\n",
    "axes[1].plot(x, [manip_hat_h]*5,marker = 'o',label = r'$P_M(\\widehat{\\theta}^*)$',linestyle = 'dotted',color = 'red')\n",
    "axes[1].set_xlabel(r'$k_1$ normalized by $u(1-\\alpha)$',fontsize=12)\n",
    "axes[1].set_ylabel(r'value',fontsize = 12)\n",
    "axes[1].legend(fontsize=8)\n",
    "axes[1].set_title('Hispanic')\n",
    "\n",
    "plt.tight_layout()\n",
    "\n",
    "fig.savefig('fairness_ah.pdf')\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "k1_list = np.linspace(1,2,5)\n",
    "_, theta_c_list = get_strat_optimal(u, alpha_c, q, eps, a_c0, b_c0, (a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1, k1_list)\n",
    "phi_func = np.vectorize(get_Phi, excluded = ['u', 'alpha', 'q', 'eps', 'a0', 'b0', 'ai', 'bi', 'a1', 'b1', 'k1','k2','k3'])\n",
    "nonstrat_func = np.vectorize(non_strat_utility, excluded = ['u','alpha','a0','b0','a1','b1'])\n",
    "utility_c_list = phi_func(u, alpha_c, theta_c_list, q, eps, a_c0, b_c0, (a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1) + nonstrat_func(u, alpha_c, theta_c_list, a_c0, b_c0,a_c1, b_c1)\n",
    "utility_c_non = [get_Phi(u, alpha_c, uhat_c, q, eps, a_c0, b_c0, (a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1) + non_strat_utility(u, alpha_c, uhat_c, a_c0, b_c0,a_c1, b_c1)]*5\n",
    "manip_list_c = get_manip_prob(theta_c_list,q,eps,(a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1)\n",
    "cdf_c = np.array([fair_measure(theta, a_c0, b_c0, a_c1, b_c1, alpha_c, 'eqopt') for theta in theta_c_list])\n",
    "manip_hat_c = get_manip_prob(uhat_c,q,eps,(a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1)\n",
    "cdf_c_hat = fair_measure(uhat_c, a_c0, b_c0, a_c1, b_c1, alpha_c, 'eqopt')\n",
    "\n",
    "\n",
    "k1_list = np.linspace(1,2,5)\n",
    "strat_func = np.vectorize(get_strat_optimal, excluded=['u', 'alpha', 'q', 'eps', 'a0', 'b0', 'ai', 'bi', 'a1', 'b1', 'k2', 'k3'])\n",
    "_, theta_aa_list = get_strat_optimal(u, alpha_aa, q, eps, a_aa0, b_aa0, (a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1, k1_list)\n",
    "phi_func = np.vectorize(get_Phi, excluded = ['u', 'alpha', 'q', 'eps', 'a0', 'b0', 'ai', 'bi', 'a1', 'b1', 'k1','k2','k3'])\n",
    "nonstrat_func = np.vectorize(non_strat_utility, excluded = ['u','alpha','a0','b0','a1','b1'])\n",
    "utility_aa_list = phi_func(u, alpha_aa, theta_aa_list, q, eps, a_aa0, b_aa0, (a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1) + nonstrat_func(u, alpha_aa, theta_aa_list, a_aa0, b_aa0,a_aa1, b_aa1)\n",
    "utility_aa_non = [get_Phi(u, alpha_aa, uhat_aa, q, eps, a_aa0, b_aa0, (a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1) + non_strat_utility(u, alpha_aa, uhat_aa, a_aa0, b_aa0,a_aa1, b_aa1)]*5\n",
    "manip_list_aa = get_manip_prob(theta_aa_list,q,eps,(a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1)\n",
    "cdf_aa = np.array([fair_measure(theta, a_aa0, b_aa0, a_aa1, b_aa1, alpha_aa, 'eqopt') for theta in theta_aa_list])\n",
    "manip_hat_aa = get_manip_prob(uhat_aa,q,eps,(a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1)\n",
    "cdf_aa_hat = fair_measure(uhat_aa, a_aa0, b_aa0, a_aa1, b_aa1, alpha_aa, 'eqopt')\n",
    "\n",
    "\n",
    "# plot optimal threshold, (non)-strategic utility, and manipulation probability\n",
    "x = k1_list\n",
    "fig, axes = plt.subplots(1,2)\n",
    "fig.set_size_inches(7, 3)\n",
    "axes[0].tick_params(axis='both', which='major', labelsize=14)\n",
    "axes[1].tick_params(axis='both', which='major', labelsize=14)\n",
    "axes[0].plot(x,manip_list_c, marker = 'o',label = r'$P_M(\\theta^*(k_1))$',linestyle = 'dotted',color = 'blue')\n",
    "axes[0].plot(x,utility_c_list,marker = 'o',label = r'strategic utility',linestyle = 'solid',color = 'blue')\n",
    "axes[0].plot(x,cdf_c, marker = 'o',label = r'$F_{X|Y,S}(\\theta|1,s)$',linestyle = 'dotted',color = 'green')\n",
    "axes[0].plot(x, utility_c_non, marker = 'o', label = r'non-strategic utility',linestyle = 'solid',color = 'red')\n",
    "axes[0].plot(x, [manip_hat_c]*5,marker = 'o',label = r'$P_M(\\widehat{\\theta}^*)$',linestyle = 'dotted',color = 'red')\n",
    "# axes[0].plot(x, [cdf_c_hat]*5,label = r'$F_{X|Y,S}(\\widehat{theta}^*|1,s)$')\n",
    "axes[0].set_xlabel(r'$k_1$ normalized by $u(1-\\alpha)$', fontsize = 12)\n",
    "axes[0].set_ylabel(r'value', fontsize = 12)\n",
    "axes[0].set_title('Caucasian',fontsize = 12)\n",
    "\n",
    "axes[1].plot(x,manip_list_aa, marker = 'o',label = r'$P_M(\\theta^*(k_1))$',linestyle = 'dotted',color = 'blue')\n",
    "axes[1].plot(x,utility_aa_list,marker = 'o',label = r'strategic utility',linestyle = 'solid',color = 'blue')\n",
    "axes[1].plot(x,cdf_aa, marker = 'o',label = r'$F_{X|Y,S}(\\theta|1,s)$',linestyle = 'dotted',color = 'green')\n",
    "axes[1].plot(x, utility_aa_non ,marker = 'o',label = r'non-strategic utility',linestyle = 'solid',color = 'red')\n",
    "axes[1].plot(x, [manip_hat_aa]*5,marker = 'o',label = r'$P_M(\\widehat{\\theta}^*)$',linestyle = 'dotted',color = 'red')\n",
    "# axes[1].plot(x, [cdf_aa_hat]*5,label = r'$F_{X|Y,S}(\\widehat{\\theta}^*|1,s)$')\n",
    "axes[1].set_xlabel(r'$k_1$ normalized by $u(1-\\alpha)$', fontsize = 12)\n",
    "axes[1].set_ylabel(r'value', fontsize = 12)\n",
    "axes[1].legend(fontsize = 9)\n",
    "axes[1].set_title('African American',fontsize = 12)\n",
    "plt.tight_layout()\n",
    "fig.savefig('fairness_caa.pdf')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Noisy"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "metadata": {},
   "outputs": [],
   "source": [
    "# vars not changed\n",
    "def non_strat_utility(u,alpha,theta,a0,b0,a1,b1):\n",
    "    U = (1 - beta.cdf(theta,a1,b1))*alpha*u - (1-beta.cdf(theta,a0,b0))*(1-alpha)*u  \n",
    "    return U\n",
    "\n",
    "sd = [0.05, 0.1]\n",
    "def gen_delta(std, n = 10):\n",
    "    return np.random.normal(0,std,n)\n",
    "uhat_c = opt_non_strategic(u,alpha_c,a_c0,b_c0,a_c1,b_c1)[1]\n",
    "uhat_aa = opt_non_strategic(u,alpha_aa,a_aa0,b_aa0,a_aa1,b_aa1)[1]\n",
    "k1_list = np.linspace(1,2,5)\n",
    "phi_func = np.vectorize(get_Phi, excluded = ['u', 'alpha', 'q', 'eps', 'a0', 'b0', 'ai', 'bi', 'a1', 'b1', 'k1','k2','k3'])\n",
    "nonstrat_func = np.vectorize(non_strat_utility, excluded = ['u','alpha','a0','b0','a1','b1'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "for i in range(len(sd)):\n",
    "    print(i)\n",
    "    deltas = gen_delta(sd[i])\n",
    "    \n",
    "    theta_c_list = np.zeros([10,5])\n",
    "    utility_c_list = np.zeros([10,5])\n",
    "    utility_c_non = np.zeros([10,5])\n",
    "    manip_list_c = np.zeros([10,5])\n",
    "    manip_hat_c = np.zeros(10)\n",
    "    cdf_c = np.zeros([10,5])\n",
    "    cdf_c_hat = np.zeros([10,5])\n",
    "\n",
    "    theta_aa_list = np.zeros([10,5])\n",
    "    utility_aa_list = np.zeros([10,5])\n",
    "    utility_aa_non = np.zeros([10,5])\n",
    "    manip_list_aa = np.zeros([10,5])\n",
    "    manip_hat_aa = np.zeros(10)\n",
    "    cdf_aa = np.zeros([10,5])\n",
    "    cdf_aa_hat = np.zeros([10,5])\n",
    "    \n",
    "    for j in range(len(deltas)):\n",
    "        print(j)\n",
    "        _, theta_c_list[j] = get_strat_optimal(u, alpha_c, q+deltas[j], eps, a_c0, b_c0, (a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1, k1_list)\n",
    "        utility_c_list[j] = phi_func(u, alpha_c, theta_c_list[j], q, eps, a_c0, b_c0, (a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1) + nonstrat_func(u, alpha_c, theta_c_list[j], a_c0, b_c0,a_c1, b_c1)\n",
    "        utility_c_non[j] = [get_Phi(u, alpha_c, uhat_c, q, eps, a_c0, b_c0, (a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1) + non_strat_utility(u, alpha_c, uhat_c, a_c0, b_c0,a_c1, b_c1)]*5\n",
    "        manip_list_c[j] = get_manip_prob(theta_c_list[j],q,eps,(a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1)\n",
    "        cdf_c[j] = np.array([fair_measure(theta, a_c0, b_c0, a_c1, b_c1, alpha_c, 'eqopt') for theta in theta_c_list[j]])\n",
    "        manip_hat_c[j] = get_manip_prob(uhat_c,q,eps,(a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1)\n",
    "        cdf_c_hat[j] = fair_measure(uhat_c, a_c0, b_c0, a_c1, b_c1, alpha_c, 'eqopt')\n",
    "        \n",
    "        _, theta_aa_list[j] = get_strat_optimal(u, alpha_aa, q+deltas[j], eps, a_aa0, b_aa0, (a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1, k1_list)\n",
    "        utility_aa_list[j] = phi_func(u, alpha_aa, theta_aa_list[j], q, eps, a_aa0, b_aa0, (a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1) + nonstrat_func(u, alpha_aa, theta_aa_list[j], a_aa0, b_aa0,a_aa1, b_aa1)\n",
    "        utility_aa_non[j] = [get_Phi(u, alpha_aa, uhat_aa, q, eps, a_aa0, b_aa0, (a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1) + non_strat_utility(u, alpha_aa, uhat_aa, a_aa0, b_aa0,a_aa1, b_aa1)]*5\n",
    "        manip_list_aa[j] = get_manip_prob(theta_aa_list[j],q,eps,(a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1)\n",
    "        cdf_aa[j] = np.array([fair_measure(theta, a_aa0, b_aa0, a_aa1, b_aa1, alpha_aa, 'eqopt') for theta in theta_aa_list[j]])\n",
    "        manip_hat_aa[j] = get_manip_prob(uhat_aa,q,eps,(a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1)\n",
    "        cdf_aa_hat[j] = fair_measure(uhat_aa, a_aa0, b_aa0, a_aa1, b_aa1, alpha_aa, 'eqopt')\n",
    "        \n",
    "    error_c_list = theta_c_list.std(axis = 0)  \n",
    "    theta_c_list = theta_c_list.mean(axis = 0)\n",
    "    error_c_non = np.zeros(5)\n",
    "    utility_c_non = utility_c_non.mean(axis=0)\n",
    "    error_manip_c = manip_list_c.std(axis=0)\n",
    "    manip_list_c = manip_list_c.mean(axis=0)\n",
    "    error_hat_c = np.zeros(5)\n",
    "    manip_hat_c = manip_hat_c.mean()\n",
    "    error_cdf_c_hat = np.zeros(5)\n",
    "    cdf_c_hat = cdf_c_hat.mean(axis=0)\n",
    "    error_cdf_c = cdf_c.std(axis=0)\n",
    "    cdf_c = cdf_c.mean(axis=0)\n",
    "    error_utility_c = utility_c_list.std(axis=0)\n",
    "    utility_c_list = utility_c_list.mean(axis=0)\n",
    "    \n",
    "    error_aa_list = theta_aa_list.std(axis = 0)\n",
    "    theta_aa_list = theta_aa_list.mean(axis = 0)\n",
    "    error_aa_non = np.zeros(5)\n",
    "    utility_aa_non = utility_aa_non.mean(axis=0)\n",
    "    error_manip_aa = manip_list_aa.std(axis=0)\n",
    "    manip_list_aa = manip_list_aa.mean(axis=0)\n",
    "    error_hat_aa = np.zeros(5)\n",
    "    manip_hat_aa = manip_hat_aa.mean()\n",
    "    error_cdf_aa_hat = np.zeros(5)\n",
    "    cdf_aa_hat = cdf_aa_hat.mean(axis=0)\n",
    "    error_cdf_aa = cdf_aa.std(axis=0)\n",
    "    cdf_aa = cdf_aa.mean(axis=0)\n",
    "    error_utility_aa = utility_aa_list.std(axis=0)\n",
    "    utility_aa_list = utility_aa_list.mean(axis=0)\n",
    "    \n",
    "    print(f'average strategic utility for caucasian when sd = {sd[i]} and k1 = 1.25 is {utility_c_list[1]}')\n",
    "    print(f'average Pm for caucasian when sd = {sd[i]} and k1 = 1 is {manip_list_c[0]}')\n",
    "    print(f'average Pm for caucasian when sd = {sd[i]} and k1 = 1.25 is {manip_list_c[1]}')\n",
    "    print(f'average cdf for caucasian when sd = {sd[i]} and k1 = 1 is {cdf_c[0]}')\n",
    "    print(f'average cdf for caucasian when sd = {sd[i]} and k1 = 1.25 is {cdf_c[1]}')\n",
    "    \n",
    "    print(f'average strategic utility for aa when sd = {sd[i]} and k1 = 1.25 is {utility_aa_list[1]}')\n",
    "    print(f'average Pm for aa when sd = {sd[i]} and k1 = 1 is {manip_list_aa[0]}')\n",
    "    print(f'average Pm for aa when sd = {sd[i]} and k1 = 1.25 is {manip_list_aa[1]}')\n",
    "    print(f'average cdf for aa when sd = {sd[i]} and k1 = 1 is {cdf_aa[0]}')\n",
    "    print(f'average cdf for aa when sd = {sd[i]} and k1 = 1.25 is {cdf_aa[1]}')\n",
    "    \n",
    "    # plot optimal threshold, (non)-strategic utility, and manipulation probability\n",
    "    x = k1_list\n",
    "    fig, axes = plt.subplots(1,2)\n",
    "    fig.set_size_inches(7, 3)\n",
    "    fig.tight_layout(pad=2.0)\n",
    "    axes[0].tick_params(axis='both', which='major', labelsize=14)\n",
    "    axes[1].tick_params(axis='both', which='major', labelsize=14)\n",
    "    axes[0].errorbar(x,manip_list_c,error_manip_c, marker = '.',label = r'$P_M(\\theta^*(k_1))$',linestyle = 'dotted',color = 'blue')\n",
    "    axes[0].errorbar(x,utility_c_list,error_utility_c,marker = '.',label = r'strategic utility',linestyle = 'solid',color = 'blue')\n",
    "    axes[0].errorbar(x,cdf_c,error_cdf_c, marker = '.',label = r'$F_{X|Y,S}(\\theta|1,s)$',linestyle = 'dotted',color = 'green')\n",
    "    axes[0].errorbar(x, utility_c_non,error_c_non, marker = '.', label = r'non-strategic utility',linestyle = 'solid',color = 'red')\n",
    "    axes[0].errorbar(x, [manip_hat_c]*5, error_hat_c, marker = '.',label = r'$P_M(\\widehat{\\theta}^*)$',linestyle = 'dotted',color = 'red')\n",
    "    # axes[0].plot(x, [cdf_c_hat]*5,label = r'$F_{X|Y,S}(\\widehat{theta}^*|1,s)$')\n",
    "    axes[0].set_xlabel(r'$k_1$ normalized by $u(1-\\alpha)$', fontsize = 12)\n",
    "    axes[0].set_ylabel(r'value', fontsize = 12)\n",
    "    # axes[0].legend(fontsize = 7, bbox_to_anchor=(0.6, 0.47))\n",
    "    axes[0].set_title('Caucasian',fontsize = 12)\n",
    "\n",
    "    axes[1].errorbar(x,manip_list_aa,error_manip_aa, marker = '.',label = r'$P_M(\\theta^*(k_1))$',linestyle = 'dotted',color = 'blue')\n",
    "    axes[1].errorbar(x,utility_aa_list,error_utility_aa,marker = '.',label = r'strategic utility',linestyle = 'solid',color = 'blue')\n",
    "    axes[1].errorbar(x,cdf_aa, error_cdf_aa,marker = '.',label = r'$F_{X|Y,S}(\\theta|1,s)$',linestyle = 'dotted',color = 'green')\n",
    "    axes[1].errorbar(x, utility_aa_non , error_aa_non, marker = '.',label = r'non-strategic utility',linestyle = 'solid',color = 'red')\n",
    "    axes[1].errorbar(x, [manip_hat_aa]*5,error_hat_aa, marker = '.',label = r'$P_M(\\widehat{\\theta}^*)$',linestyle = 'dotted',color = 'red')\n",
    "    # axes[1].plot(x, [cdf_aa_hat]*5,label = r'$F_{X|Y,S}(\\widehat{\\theta}^*|1,s)$')\n",
    "    axes[1].set_xlabel(r'$k_1$ normalized by $u(1-\\alpha)$', fontsize = 12)\n",
    "    axes[1].set_ylabel(r'value', fontsize = 12)\n",
    "    axes[1].legend(fontsize = 8,bbox_to_anchor=(0.3, 0.42))\n",
    "    axes[1].set_title('African American',fontsize = 12)\n",
    "    \n",
    "    fig.savefig(f'fairness_caa_q_noise_{i}.pdf')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "for i in range(len(sd)):\n",
    "    print(i)\n",
    "    deltas = gen_delta(sd[i])\n",
    "    \n",
    "    theta_c_list = np.zeros([10,5])\n",
    "    utility_c_list = np.zeros([10,5])\n",
    "    utility_c_non = np.zeros([10,5])\n",
    "    manip_list_c = np.zeros([10,5])\n",
    "    manip_hat_c = np.zeros(10)\n",
    "    cdf_c = np.zeros([10,5])\n",
    "    cdf_c_hat = np.zeros([10,5])\n",
    "\n",
    "    theta_aa_list = np.zeros([10,5])\n",
    "    utility_aa_list = np.zeros([10,5])\n",
    "    utility_aa_non = np.zeros([10,5])\n",
    "    manip_list_aa = np.zeros([10,5])\n",
    "    manip_hat_aa = np.zeros(10)\n",
    "    cdf_aa = np.zeros([10,5])\n",
    "    cdf_aa_hat = np.zeros([10,5])\n",
    "    \n",
    "    for j in range(len(deltas)):\n",
    "        print(j)\n",
    "        _, theta_c_list[j] = get_strat_optimal(u, alpha_c, q, eps+deltas[j], a_c0, b_c0, (a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1, k1_list)\n",
    "        utility_c_list[j] = phi_func(u, alpha_c, theta_c_list[j], q, eps, a_c0, b_c0, (a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1) + nonstrat_func(u, alpha_c, theta_c_list[j], a_c0, b_c0,a_c1, b_c1)\n",
    "        utility_c_non[j] = [get_Phi(u, alpha_c, uhat_c, q, eps, a_c0, b_c0, (a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1) + non_strat_utility(u, alpha_c, uhat_c, a_c0, b_c0,a_c1, b_c1)]*5\n",
    "        manip_list_c[j] = get_manip_prob(theta_c_list[j],q,eps,(a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1)\n",
    "        cdf_c[j] = np.array([fair_measure(theta, a_c0, b_c0, a_c1, b_c1, alpha_c, 'eqopt') for theta in theta_c_list[j]])\n",
    "        manip_hat_c[j] = get_manip_prob(uhat_c,q,eps,(a_c0+a_c1)/2, (b_c0+b_c1)/2, a_c1, b_c1)\n",
    "        cdf_c_hat[j] = fair_measure(uhat_c, a_c0, b_c0, a_c1, b_c1, alpha_c, 'eqopt')\n",
    "        \n",
    "        _, theta_aa_list[j] = get_strat_optimal(u, alpha_aa, q, eps+deltas[j], a_aa0, b_aa0, (a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1, k1_list)\n",
    "        utility_aa_list[j] = phi_func(u, alpha_aa, theta_aa_list[j], q, eps, a_aa0, b_aa0, (a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1) + nonstrat_func(u, alpha_aa, theta_aa_list[j], a_aa0, b_aa0,a_aa1, b_aa1)\n",
    "        utility_aa_non[j] = [get_Phi(u, alpha_aa, uhat_aa, q, eps, a_aa0, b_aa0, (a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1) + non_strat_utility(u, alpha_aa, uhat_aa, a_aa0, b_aa0,a_aa1, b_aa1)]*5\n",
    "        manip_list_aa[j] = get_manip_prob(theta_aa_list[j],q,eps,(a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1)\n",
    "        cdf_aa[j] = np.array([fair_measure(theta, a_aa0, b_aa0, a_aa1, b_aa1, alpha_aa, 'eqopt') for theta in theta_aa_list[j]])\n",
    "        manip_hat_aa[j] = get_manip_prob(uhat_aa,q,eps,(a_aa0+a_aa1)/2, (b_aa0+b_aa1)/2, a_aa1, b_aa1)\n",
    "        cdf_aa_hat[j] = fair_measure(uhat_aa, a_aa0, b_aa0, a_aa1, b_aa1, alpha_aa, 'eqopt')\n",
    "        \n",
    "    error_c_list = theta_c_list.std(axis = 0)  \n",
    "    theta_c_list = theta_c_list.mean(axis = 0)\n",
    "    error_c_non = np.zeros(5)\n",
    "    utility_c_non = utility_c_non.mean(axis=0)\n",
    "    error_manip_c = manip_list_c.std(axis=0)\n",
    "    manip_list_c = manip_list_c.mean(axis=0)\n",
    "    error_hat_c = np.zeros(5)\n",
    "    manip_hat_c = manip_hat_c.mean()\n",
    "    error_cdf_c_hat = np.zeros(5)\n",
    "    cdf_c_hat = cdf_c_hat.mean(axis=0)\n",
    "    error_cdf_c = cdf_c.std(axis=0)\n",
    "    cdf_c = cdf_c.mean(axis=0)\n",
    "    error_utility_c = utility_c_list.std(axis=0)\n",
    "    utility_c_list = utility_c_list.mean(axis=0)\n",
    "    \n",
    "    error_aa_list = theta_aa_list.std(axis = 0)\n",
    "    theta_aa_list = theta_aa_list.mean(axis = 0)\n",
    "    error_aa_non = np.zeros(5)\n",
    "    utility_aa_non = utility_aa_non.mean(axis=0)\n",
    "    error_manip_aa = manip_list_aa.std(axis=0)\n",
    "    manip_list_aa = manip_list_aa.mean(axis=0)\n",
    "    error_hat_aa = np.zeros(5)\n",
    "    manip_hat_aa = manip_hat_aa.mean()\n",
    "    error_cdf_aa_hat = np.zeros(5)\n",
    "    cdf_aa_hat = cdf_aa_hat.mean(axis=0)\n",
    "    error_cdf_aa = cdf_aa.std(axis=0)\n",
    "    cdf_aa = cdf_aa.mean(axis=0)\n",
    "    error_utility_aa = utility_aa_list.std(axis=0)\n",
    "    utility_aa_list = utility_aa_list.mean(axis=0)\n",
    "    \n",
    "    print(f'average strategic utility for caucasian when sd = {sd[i]} and k1 = 1.25 is {utility_c_list[1]}')\n",
    "    print(f'average Pm for caucasian when sd = {sd[i]} and k1 = 1 is {manip_list_c[0]}')\n",
    "    print(f'average Pm for caucasian when sd = {sd[i]} and k1 = 1.25 is {manip_list_c[1]}')\n",
    "    print(f'average cdf for caucasian when sd = {sd[i]} and k1 = 1 is {cdf_c[0]}')\n",
    "    print(f'average cdf for caucasian when sd = {sd[i]} and k1 = 1.25 is {cdf_c[1]}')\n",
    "    \n",
    "    print(f'average strategic utility for aa when sd = {sd[i]} and k1 = 1.25 is {utility_aa_list[1]}')\n",
    "    print(f'average Pm for aa when sd = {sd[i]} and k1 = 1 is {manip_list_aa[0]}')\n",
    "    print(f'average Pm for aa when sd = {sd[i]} and k1 = 1.25 is {manip_list_aa[1]}')\n",
    "    print(f'average cdf for aa when sd = {sd[i]} and k1 = 1 is {cdf_aa[0]}')\n",
    "    print(f'average cdf for aa when sd = {sd[i]} and k1 = 1.25 is {cdf_aa[1]}')\n",
    "    \n",
    "    # plot optimal threshold, (non)-strategic utility, and manipulation probability\n",
    "    x = k1_list\n",
    "    fig, axes = plt.subplots(1,2)\n",
    "    fig.set_size_inches(7, 3)\n",
    "    fig.tight_layout(pad=2.0)\n",
    "    axes[0].tick_params(axis='both', which='major', labelsize=14)\n",
    "    axes[1].tick_params(axis='both', which='major', labelsize=14)\n",
    "    axes[0].errorbar(x,manip_list_c,error_manip_c, marker = '.',label = r'$P_M(\\theta^*(k_1))$',linestyle = 'dotted',color = 'blue')\n",
    "    axes[0].errorbar(x,utility_c_list,error_utility_c,marker = '.',label = r'strategic utility',linestyle = 'solid',color = 'blue')\n",
    "    axes[0].errorbar(x,cdf_c,error_cdf_c, marker = '.',label = r'$F_{X|Y,S}(\\theta|1,s)$',linestyle = 'dotted',color = 'green')\n",
    "    axes[0].errorbar(x, utility_c_non,error_c_non, marker = '.', label = r'non-strategic utility',linestyle = 'solid',color = 'red')\n",
    "    axes[0].errorbar(x, [manip_hat_c]*5, error_hat_c, marker = '.',label = r'$P_M(\\widehat{\\theta}^*)$',linestyle = 'dotted',color = 'red')\n",
    "    # axes[0].plot(x, [cdf_c_hat]*5,label = r'$F_{X|Y,S}(\\widehat{theta}^*|1,s)$')\n",
    "    axes[0].set_xlabel(r'$k_1$ normalized by $u(1-\\alpha)$', fontsize = 12)\n",
    "    axes[0].set_ylabel(r'value', fontsize = 12)\n",
    "    # axes[0].legend(fontsize = 7, bbox_to_anchor=(0.6, 0.47))\n",
    "    axes[0].set_title('Caucasian',fontsize = 12)\n",
    "\n",
    "    axes[1].errorbar(x,manip_list_aa,error_manip_aa, marker = '.',label = r'$P_M(\\theta^*(k_1))$',linestyle = 'dotted',color = 'blue')\n",
    "    axes[1].errorbar(x,utility_aa_list,error_utility_aa,marker = '.',label = r'strategic utility',linestyle = 'solid',color = 'blue')\n",
    "    axes[1].errorbar(x,cdf_aa, error_cdf_aa,marker = '.',label = r'$F_{X|Y,S}(\\theta|1,s)$',linestyle = 'dotted',color = 'green')\n",
    "    axes[1].errorbar(x, utility_aa_non , error_aa_non, marker = '.',label = r'non-strategic utility',linestyle = 'solid',color = 'red')\n",
    "    axes[1].errorbar(x, [manip_hat_aa]*5,error_hat_aa, marker = '.',label = r'$P_M(\\widehat{\\theta}^*)$',linestyle = 'dotted',color = 'red')\n",
    "    # axes[1].plot(x, [cdf_aa_hat]*5,label = r'$F_{X|Y,S}(\\widehat{\\theta}^*|1,s)$')\n",
    "    axes[1].set_xlabel(r'$k_1$ normalized by $u(1-\\alpha)$', fontsize = 12)\n",
    "    axes[1].set_ylabel(r'value', fontsize = 12)\n",
    "    axes[1].legend(fontsize = 8,bbox_to_anchor=(0.3, 0.42))\n",
    "    axes[1].set_title('African American',fontsize = 12)\n",
    "    \n",
    "    fig.savefig(f'fairness_caa_eps_noise_{i}.pdf')"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "base",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.2"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
