{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# making sure that updates to imported files are immediately available without restarting the kernel\n",
    "%reload_ext autoreload\n",
    "%autoreload 2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import sys\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import seaborn as sns\n",
    "import matplotlib\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "font = {\"size\": 15}\n",
    "matplotlib.rc(\"font\", **font)\n",
    "\n",
    "sys.path.append(os.path.abspath(\"..\"))\n",
    "from utils import error_consistency, simulate_trials_from_copy_model, filter_df"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Significance testing\n",
    "\n",
    "First, let's see how an EC-estimate obtained from an insufficient number of trials is not significant, while one from sufficiently many trials is."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "trials1 = np.array([0, 1, 0, 0, 1, 1, 1, 1, 1, 1])\n",
    "trials2 = np.array([0, 0, 0, 1, 0, 1, 1, 1, 1, 1])\n",
    "\n",
    "ec, p_value = error_consistency(trials1, trials2)\n",
    "\n",
    "print(ec, p_value)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "trials1, trials2 = simulate_trials_from_copy_model(\n",
    "    kappa=0.1, acc1=0.7, acc2=0.75, n_trials=1000\n",
    ")\n",
    "\n",
    "ec, p_value = error_consistency(trials1, trials2)\n",
    "\n",
    "print(ec, p_value)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## MvH\n",
    "\n",
    "Testing the statistical significances of the MvH data, for clip and one human."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# load CLIP and subject-01 from Geirhos data\n",
    "all_df = pd.read_parquet(\n",
    "    \"../geirhos_analysis/data/geirhos_raw_data.parquet\", engine=\"pyarrow\"\n",
    ")\n",
    "\n",
    "df = all_df[all_df[\"subj\"].isin([\"subject-01\", \"clip\"])]\n",
    "\n",
    "df = filter_df(df)\n",
    "\n",
    "ecs = []\n",
    "pvals = []\n",
    "exps = []\n",
    "cons = []\n",
    "for exp, exp_df in df.groupby(\"experiment\", observed=True):\n",
    "    for con, con_df in exp_df.groupby(\"condition\", observed=True):\n",
    "\n",
    "        ecdf = pd.merge(\n",
    "            left=con_df[con_df[\"subj\"] == \"clip\"],\n",
    "            right=con_df[con_df[\"subj\"] == \"subject-01\"],\n",
    "            on=\"img_identifier\",\n",
    "        )\n",
    "\n",
    "        ec, pval = error_consistency(\n",
    "            ecdf[\"correct_x\"].values, ecdf[\"correct_y\"].values, n_bootstraps=50_000\n",
    "        )\n",
    "\n",
    "        ecs.append(ec)\n",
    "        pvals.append(pval)\n",
    "        exps.append(exp)\n",
    "        cons.append(con)\n",
    "\n",
    "res_df = pd.DataFrame(\n",
    "    {\"Experiment\": exps, \"Condition\": cons, \"EC\": ecs, \"p-value\": pvals}\n",
    ")\n",
    "\n",
    "display(res_df)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "fig, ax = plt.subplots(1, 1, figsize=(12, 6))\n",
    "plt.grid(axis=\"y\")\n",
    "sns.scatterplot(data=res_df, x=\"EC\", y=\"p-value\", hue=\"Experiment\", legend=True, ax=ax)\n",
    "sns.despine()\n",
    "ax.set_ylim(0, 0.35)\n",
    "ax.legend(loc=\"center left\", bbox_to_anchor=(1, 0.5))\n",
    "ax.axhline(0.05, color=\"red\", linestyle=\"dotted\")\n",
    "plt.tight_layout()\n",
    "plt.savefig(\"figures/pvalues.pdf\", bbox_inches=\"tight\")\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {},
 "nbformat": 4,
 "nbformat_minor": 2
}
