{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "# load the correct data from an ensemble-model folder:\n",
    "dataset = \"utkface\"\n",
    "path = f\"./votes/{dataset}/\"\n",
    "raw_votes = np.load(path + f\"model(1)-raw-votes-(mode-random)-dataset-{dataset}.npy\").astype(float)\n",
    "raw_votes = raw_votes[-300:]\n",
    "targets = np.load(path + f\"model(1)-targets-(mode-random)-dataset-{dataset}.npy\").astype(float)\n",
    "targets = targets[-300:]\n",
    "sensitives = np.load(path + f\"model(1)-sensitives-(mode-random)-dataset-{dataset}.npy\").astype(float)\n",
    "sensitives = sensitives[-300:]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(300,)"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "sensitives.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "calibration_data = pd.DataFrame(\n",
    "    np.c_[raw_votes.argmax(axis=1), targets, sensitives], columns=[\"prediction\", \"truth\", \"sensitive\"]) # note the prediction is not noised yet\n",
    "calibration_data = calibration_data.astype({\"prediction\": int, \"truth\": int, \"sensitive\": int})"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Loss Disparity"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(array([[[0.85526316, 0.71052632, 0.75      , 0.86666667, 1.        ],\n",
       "         [0.16666667, 0.05555556, 0.20689655, 0.08333333, 0.27272727]],\n",
       " \n",
       "        [[0.14473684, 0.28947368, 0.25      , 0.13333333, 0.        ],\n",
       "         [0.83333333, 0.94444444, 0.79310345, 0.91666667, 0.72727273]]]),\n",
       " array([[[0.78723404, 0.84848485, 0.82666667, 0.80714286, 0.81097561],\n",
       "         [0.14634146, 0.16964286, 0.13861386, 0.16981132, 0.14285714]],\n",
       " \n",
       "        [[0.21276596, 0.15151515, 0.17333333, 0.19285714, 0.18902439],\n",
       "         [0.85365854, 0.83035714, 0.86138614, 0.83018868, 0.85714286]]]))"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "def probability_of_k_given_kprime_and_z(calibration_data):\n",
    "    \"\"\"Producing two sets of probabilitis for Z=z and Z =! z, each |Y| x |Y'| x |Z| matrix of probabilities, where Y is ground truth label and Y' is the predicated label and Z is sensitive attribute.\"\"\"\n",
    "\n",
    "    num_classes = max(calibration_data[\"truth\"]) + 1\n",
    "    num_sensitives = max(calibration_data[\"sensitive\"]) + 1\n",
    "\n",
    "    probabilities_for_z = np.zeros((num_classes, num_classes, num_sensitives))\n",
    "    probabilities_but_z = np.zeros((num_classes, num_classes, num_sensitives))\n",
    "\n",
    "    for z in range(num_sensitives):\n",
    "        for k in range(num_classes):\n",
    "            for k_ in range(num_classes):\n",
    "                numerator_for_z = calibration_data.query(f'truth == {k} and prediction == {k_} and sensitive == {z}')\n",
    "                denominator_for_z = calibration_data.query(f'prediction == {k_} and sensitive == {z}')\n",
    "                probabilities_for_z[k, k_, z] = len(numerator_for_z) / len(denominator_for_z)\n",
    "\n",
    "                numerator_but_z = calibration_data.query(f'truth == {k} and prediction == {k_} and sensitive != {z}')\n",
    "                denominator_but_z = calibration_data.query(f'prediction == {k_} and sensitive != {z}')\n",
    "                probabilities_but_z[k, k_, z] = len(numerator_but_z) / len(denominator_but_z)\n",
    "\n",
    "    # sum of probabilities (over 'Y') should some to 1\n",
    "    assert np.allclose(probabilities_for_z.sum(axis=0), 1)\n",
    "    assert np.allclose(probabilities_for_z.sum(axis=0), 1)\n",
    "\n",
    "    return probabilities_for_z, probabilities_but_z\n",
    "\n",
    "probability_of_k_given_kprime_and_z(calibration_data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([0.53, 0.47])"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "def probability_of_k(calibration_data):\n",
    "    \"\"\"Producing a |Y| vector of probabilities, where Y is ground truth label.\"\"\"\n",
    "    num_classes = max(calibration_data[\"truth\"]) + 1\n",
    "    \n",
    "    probabilities = np.zeros(num_classes)\n",
    "    for k in range(num_classes):\n",
    "        numerator = calibration_data.query(f'truth == {k}')\n",
    "        denominator = calibration_data\n",
    "        probabilities[k] = len(numerator) / len(denominator)\n",
    "    \n",
    "    # sum of probabilities (over 'Y') should some to 1\n",
    "    assert np.allclose(probabilities.sum(axis=0), 1)\n",
    "    return probabilities\n",
    "probability_of_k(calibration_data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "prob_Y_given_Yhat_and_Z_equal_to_z, prob_Y_given_Yhat_and_Z_not_equal_to_z = probability_of_k_given_kprime_and_z(calibration_data)\n",
    "\n",
    "Y = probability_of_k(calibration_data)\n",
    "indicator = np.ones((Y.shape[0], Y.shape[0])) - np.eye(Y.shape[0])\n",
    "\n",
    "for_z = prob_Y_given_Yhat_and_Z_equal_to_z.transpose((0, 2, 1)) @ indicator @ Y\n",
    "but_z = prob_Y_given_Yhat_and_Z_not_equal_to_z.transpose((0, 2, 1)) @ indicator @ Y\n",
    "\n",
    "np.savez(\"../data/calibration/utkface_ErrorParity_calibration_constants\", for_z=for_z, but_z=but_z)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Equality of Odds"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(array([[[0.78431373, 0.60714286, 0.82142857, 0.84615385, 1.        ],\n",
       "         [0.10958904, 0.03571429, 0.28571429, 0.07142857, 0.33333333]],\n",
       " \n",
       "        [[0.21568627, 0.39285714, 0.17857143, 0.15384615, 0.        ],\n",
       "         [0.89041096, 0.96428571, 0.71428571, 0.92857143, 0.66666667]]]),\n",
       " array([[[0.77777778, 0.82300885, 0.7699115 , 0.76521739, 0.76691729],\n",
       "         [0.13953488, 0.14503817, 0.10144928, 0.13740458, 0.11333333]],\n",
       " \n",
       "        [[0.22222222, 0.17699115, 0.2300885 , 0.23478261, 0.23308271],\n",
       "         [0.86046512, 0.85496183, 0.89855072, 0.86259542, 0.88666667]]]))"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "def probability_of_not_kprime_given_not_k_and_z(calibration_data):\n",
    "    \"\"\"Producing two sets of probabilitis for Z=z and Z =! z, each a |Y'| x |Y| x |Z| matrix of probabilities, where Y' is the predicated label and Y is ground truth label and Z is sensitive attribute.\"\"\"\n",
    "    num_classes = max(calibration_data[\"truth\"]) + 1\n",
    "    num_sensitives = max(calibration_data[\"sensitive\"]) + 1\n",
    "\n",
    "    probabilities_for_z = np.zeros((num_classes, num_classes, num_sensitives))\n",
    "    probabilities_but_z = np.zeros((num_classes, num_classes, num_sensitives))\n",
    "\n",
    "    for z in range(num_sensitives):\n",
    "        for k in range(num_classes):\n",
    "            for k_ in range(num_classes):\n",
    "                numerator_for_z = calibration_data.query(f'prediction != {k_} and truth != {k} and sensitive == {z}')\n",
    "                denominator_for_z = calibration_data.query(f'truth != {k} and sensitive == {z}')\n",
    "                probabilities_for_z[k_, k, z] = len(numerator_for_z) / len(denominator_for_z)\n",
    "\n",
    "                numerator_but_z = calibration_data.query(f'prediction != {k_} and truth != {k} and sensitive != {z}')\n",
    "                denominator_but_z = calibration_data.query(f'truth != {k} and sensitive != {z}')\n",
    "                probabilities_but_z[k_, k, z] = len(numerator_but_z) / len(denominator_but_z)\n",
    "                \n",
    "    return probabilities_for_z, probabilities_but_z\n",
    "\n",
    "probability_of_not_kprime_given_not_k_and_z(calibration_data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "prob_Yhat_given_Y_and_Z_equal_to_z, prob_Yhat_given_Y_and_Z_not_equal_to_z = probability_of_not_kprime_given_not_k_and_z(calibration_data)\n",
    "\n",
    "np.savez(\"../data/calibration/utkface_EqualityOfOdds_calibration_constants\", for_z=prob_Yhat_given_Y_and_Z_equal_to_z, but_z=prob_Yhat_given_Y_and_Z_not_equal_to_z)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def generate_calibration_constants(dataset, fairness_metric, raw_votes, targets, sensitives):\n",
    "    calibration_data = pd.DataFrame(\n",
    "        np.c_[raw_votes.argmax(axis=1), targets, sensitives], columns=[\"prediction\", \"truth\", \"sensitive\"]) # note the prediction is not noised yet\n",
    "    calibration_data = calibration_data.astype({\"prediction\": int, \"truth\": int, \"sensitive\": int}).assign(dataset=dataset)\n",
    "    \n",
    "\n",
    "    if fairness_metric == 'ErrorParity':\n",
    "        prob_Y_given_Yhat_and_Z_equal_to_z, prob_Y_given_Yhat_and_Z_not_equal_to_z = probability_of_k_given_kprime_and_z(calibration_data)\n",
    "\n",
    "        Y = probability_of_k(calibration_data)\n",
    "        indicator = np.ones((Y.shape[0], Y.shape[0])) - np.eye(Y.shape[0])\n",
    "\n",
    "        for_z = prob_Y_given_Yhat_and_Z_equal_to_z.transpose((0, 2, 1)) @ indicator @ Y\n",
    "        but_z = prob_Y_given_Yhat_and_Z_not_equal_to_z.transpose((0, 2, 1)) @ indicator @ Y\n",
    "\n",
    "        return for_z, but_z\n",
    "\n",
    "    elif fairness_metric == 'EqualityOfOdds':\n",
    "        prob_Yhat_given_Y_and_Z_equal_to_z, prob_Yhat_given_Y_and_Z_not_equal_to_z = probability_of_not_kprime_given_not_k_and_z(calibration_data)\n",
    "        \n",
    "        for_z=prob_Yhat_given_Y_and_Z_equal_to_z\n",
    "        but_z=prob_Yhat_given_Y_and_Z_not_equal_to_z\n",
    "\n",
    "        return for_z, but_z"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "base",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.12"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
