{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Notebook - to parse results and visualise results neatly into table"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def find_files(top_dir, monitor):\n",
    "    all_matches = {}\n",
    "    _, dirnames, filenames = os.walk(top_dir).__next__()\n",
    "    for dir_name in dirnames:\n",
    "        exp_dir_path = os.path.join(top_dir, dir_name)\n",
    "        matches = []\n",
    "        for rs, _, fs in os.walk(exp_dir_path):\n",
    "            for filename in fs:\n",
    "                if filename == monitor:\n",
    "                    matches.append(os.path.join(rs, filename))\n",
    "        all_matches[dir_name] = matches\n",
    "    return all_matches"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def read_lisps(fpaths):\n",
    "    df = pd.DataFrame()\n",
    "    for fpath in fpaths:\n",
    "        exp_name = os.path.dirname(fpath).split(\"/\")[-1]\n",
    "        with open(fpath, \"r\") as f:\n",
    "            data = f.read().splitlines()\n",
    "        data = data[5][3:-3].split(\") (\")\n",
    "        data = [i.split(\" \") for i in data]\n",
    "        data = [[float(j) for j in i] for i in data][0]\n",
    "        df[exp_name] = data\n",
    "\n",
    "    return df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "final_res = pd.DataFrame(columns=[\"communicative-success-mean\", \"communicative-success-std\", \"communicative-success-min\", \"communicative-success-max\", \n",
    "                                  \"lexicon-coherence-mean\", \"lexicon-coherence-std\",  \"lexicon-coherence-min\",  \"lexicon-coherence-max\",  \n",
    "                                  \"unique-form-usage-mean\", \"unique-form-usage-std\",  \"unique-form-usage-min\",  \"unique-form-usage-max\"])\n",
    "\n",
    "fpaths = find_files(\"paper/test-results/\", \"communicative-success.lisp\")\n",
    "for key, val in fpaths.items():\n",
    "    final_res.loc[key] = [None, None, None, None, \n",
    "                        None, None, None, None,\n",
    "                        None, None, None, None]\n",
    "for monitor in [\"communicative-success.lisp\", \"lexicon-coherence.lisp\", \"unique-form-usage.lisp\"]:\n",
    "    fpaths = find_files(\"paper/test-results/\", monitor)\n",
    "    for key, val in fpaths.items():\n",
    "        df = read_lisps(val)\n",
    "        mean = df.mean(axis=0).mean(axis=0)\n",
    "        min = df.mean(axis=0).quantile(0.05) # quantile min\n",
    "        max = df.mean(axis=0).quantile(0.95) # quantile max\n",
    "        # take the mean of df and then take the 2-std of that from dataframe df\n",
    "        std = df.mean(axis=0).std(axis=0) * 2\n",
    "        # set the communicative-success-mean to final_res\n",
    "        monitor_name = f\"{monitor.split('.')[0]}\"\n",
    "        final_res.loc[key, f\"{monitor_name}-mean\"] = mean\n",
    "        final_res.loc[key, f\"{monitor_name}-std\"] = std\n",
    "        final_res.loc[key, f\"{monitor_name}-min\"] = min\n",
    "        final_res.loc[key, f\"{monitor_name}-max\"] = max"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# turn the numbers into percentages with 2 decimal points in the communicative-success and lexicon-coherence columns\n",
    "perc = final_res.sort_index().copy()\n",
    "perc[\"communicative-success-mean\"] = perc[\"communicative-success-mean\"].apply(lambda x: round(x*100, 2))\n",
    "perc[\"lexicon-coherence-mean\"] = perc[\"lexicon-coherence-mean\"].apply(lambda x: round(x*100, 2))\n",
    "perc[\"unique-form-usage-mean\"] = perc[\"unique-form-usage-mean\"].apply(lambda x: round(x, 2))\n",
    "perc[\"communicative-success-std\"] = perc[\"communicative-success-std\"].apply(lambda x: round(x*100, 2))\n",
    "perc[\"lexicon-coherence-std\"] = perc[\"lexicon-coherence-std\"].apply(lambda x: round(x*100, 2))\n",
    "perc[\"unique-form-usage-std\"] = perc[\"unique-form-usage-std\"].apply(lambda x: round(x, 2))\n",
    "perc[\"communicative-success-min\"] = perc[\"communicative-success-min\"].apply(lambda x: round(x*100, 2))\n",
    "perc[\"lexicon-coherence-min\"] = perc[\"lexicon-coherence-min\"].apply(lambda x: round(x*100, 2))\n",
    "perc[\"unique-form-usage-min\"] = perc[\"unique-form-usage-min\"].apply(lambda x: round(x, 2))\n",
    "perc[\"communicative-success-max\"] = perc[\"communicative-success-max\"].apply(lambda x: round(x*100, 2))\n",
    "perc[\"lexicon-coherence-max\"] = perc[\"lexicon-coherence-max\"].apply(lambda x: round(x*100, 2))\n",
    "perc[\"unique-form-usage-max\"] = perc[\"unique-form-usage-max\"].apply(lambda x: round(x, 2))\n",
    "perc"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "plot-babel-fast",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.4"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
