{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e355b99d",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "from lib_project.notebook import setup_notebook\n",
    "setup_notebook(\"../../../\")\n",
    "               \n",
    "%load_ext autoreload\n",
    "%autoreload 2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "acbd71c6",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "\n",
    "from experiments.memorization_dynamics import results as res_util\n",
    "from experiments.memorization_dynamics import carlini_comp_results as cc_res_util"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "e1206ca3-0050-4a98-9e42-355d6aeaab2c",
   "metadata": {
    "tags": []
   },
   "source": [
    "# Memorization Dynamics: Comparing with the Carlini Memorization Metric\n",
    "\n",
    "From [this paper](https://arxiv.org/abs/2202.07646)\n",
    "\n",
    "We train models for 100 epochs on random strings with different alphabet sizes and 1024 tokens."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "3a35828d-0e51-4f7c-9f96-e2e20545394e",
   "metadata": {},
   "outputs": [],
   "source": [
    "FIGURE_FOLDER = f\"{res_util.FIGURE_FOLDER}/carlini_comparison\"\n",
    "\n",
    "def load_results(\n",
    "    models: list[tuple[str, str]],\n",
    "    seed_ids: list[int],\n",
    "    alphabet_size: int = 26,\n",
    ") -> dict:\n",
    "    return {\n",
    "        model[1]: res_util.load(\n",
    "            [f\"rand_a-lat-{alphabet_size}_t-1024\", model[0]],\n",
    "            seed_ids,\n",
    "        )\n",
    "        for model in models\n",
    "    }\n",
    "\n",
    "def show(results: dict):\n",
    "    return cc_res_util.show_models(\n",
    "        results,\n",
    "        title=\"Model\",\n",
    "    )\n",
    "\n",
    "def produce_paper_plots(\n",
    "    figures: dict,\n",
    "    show_legend: bool = True,\n",
    "):\n",
    "    cc_res_util.produce_accuracy_recall_paper_plots(\n",
    "        figures,\n",
    "        show_legend=show_legend,\n",
    "        figure_folder=FIGURE_FOLDER,\n",
    "    )"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6db1ebcf-894a-4f39-8214-dd817b620f09",
   "metadata": {},
   "outputs": [],
   "source": [
    "seed_ids = list(range(10))\n",
    "results = results = load_results(\n",
    "    [\n",
    "        (\"pythia-1b\", \"Pythia-1B\"),\n",
    "        (\"phi-2\", \"Phi-2.7B\"),\n",
    "        (\"Llama-2-7b-hf\", \"Llama2-13B\"),\n",
    "    ],\n",
    "    seed_ids,\n",
    ")   \n",
    "figures = show(results)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "3456ca51-a5a0-4728-95e7-89331cf2c5ee",
   "metadata": {},
   "outputs": [],
   "source": [
    "produce_paper_plots(\n",
    "    figures,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "fab40316-bb29-4f77-9721-408f7b6382fd",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e3341cec-0464-4638-a04a-ba103bad739c",
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "# Upload\n",
    "res_util.publish(\"dynamics_analysis/carlini_comparison\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "de626a7a-9492-4fe0-ad94-b525e91d1c84",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.6"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
