{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "08191f5b",
   "metadata": {},
   "outputs": [],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "import numpy as np\n",
    "import os\n",
    "import pandas as pd\n",
    "import pickle as pkl\n",
    "import polars as pl\n",
    "import policy\n",
    "import random\n",
    "import seaborn as sns\n",
    "from config import *\n",
    "from create_tensor import load_metadata\n",
    "from matplotlib import font_manager as fm\n",
    "from sklearn.metrics import average_precision_score, precision_recall_curve, confusion_matrix, ConfusionMatrixDisplay\n",
    "from tqdm.notebook import tqdm\n",
    "from utils import load_test_predictions, load_test_prompt_predictions, load_val_predictions, process_math_id"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "e470b872",
   "metadata": {},
   "outputs": [],
   "source": [
    "cm_dict = dict()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "7066292d",
   "metadata": {},
   "source": [
    "# GSM8K / DeepSeek-R1-Distill-Llama-8B"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "83840edf",
   "metadata": {},
   "outputs": [],
   "source": [
    "dataset = \"gsm8k\"\n",
    "model_id = \"deepseek-ai/DeepSeek-R1-Distill-Llama-8B\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "9bb1a126",
   "metadata": {},
   "outputs": [],
   "source": [
    "model_dir = os.path.join(DSET_TO_DIR[dataset], MODEL_IDS[model_id])\n",
    "history_list = list()\n",
    "layer_list = list()\n",
    "for layer in range(1, 33):\n",
    "    history_csv = os.path.join(model_dir, \"model\", f\"L{layer}_mlp\", 'history.csv')\n",
    "    if os.path.exists(history_csv):\n",
    "        history_df = pd.read_csv(history_csv)\n",
    "        history_list.append(history_df)\n",
    "        layer_list.append(layer)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "15c4a9a3",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAroAAACkCAYAAAB4vo3bAAAAOnRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjEwLjUsIGh0dHBzOi8vbWF0cGxvdGxpYi5vcmcvWftoOwAAAAlwSFlzAAAPYQAAD2EBqD+naQAAMZ9JREFUeJzt3XlcVPX+P/DXsAcIggqhpoa7JpoG4p4KKZqlgqmVXislul834iJ5TYVEK72o30w0FzS618Qt1FQ0TLuKCJhLuJSmJrjhgqzD6pzfH36ZnwMzA3POgcHh9Xw8etScOec97zOd98x7PnzOOQpBEAQQEREREZkYM2MnQERERERUG9joEhEREZFJYqNLRERERCaJjS4RERERmSQ2ukRERERkktjoEhEREZFJYqNLRERERCaJjS4RERERmSQ2ukRERERkktjoEhEREZFJYqMLQKVSQalUQqVSGTsVIiIiIpIJG10AxcXFuHTpEoqLi42dChERERHJhI0uEREREZkkNrpEREREZJLY6BIRERGRSbIwdgJEZBpWb9iIvPxCo7y2QyM7/M/UD+rkte7cuYPNmzfj5MmT2L17NwDg1q1bmDBhArZu3YoWLVporF9QUIAtW7YgNjYWx48fN/j1Tp8+jZCQEBw4cAA2Njay7IMxxKz+GoV5uXX+unYOjnj/f6bX+esSUf3ARpeIZJGXX4jUroON8tpeF44YtH5CQgK++OIL3LlzBx9++CE++OADODo6AgAePHiAzz//HMePH8fChQsxYsQIjW0bN26MRo0aIT8/X72sWbNmmD59Opo1a1bltVQqFSwtLXH//n0Rewa0a9cO06dPf6abXAAozMvF6JP76vx1471HGrzN5s2bERsbix49esDMzAx79+5Fjx498MILLyAjIwPXr19HWlpaLWRLRHJjo0tEDc7w4cNhbm6O6dOno3fv3uomFwCaNm2Kvn37ol+/flWaXAB47rnn8Pzzz2sss7Kywvjx47W+loODAzp16lTj3DIzM3H27FmMGjVKvb2/v3+Ntyfp7OzssGPHDjg7OwMA9u7di4CAAIwbNw4AsHLlSoNj5ufnIz4+HpMmTZIzVSKqBufoElGDNHToULRp0wZxcXFVnjt27Bhef/11nduamRn20VnT9XNycjBz5kyUlZUZFJ/kNXjwYHWTq827775rULzi4mIEBwcjJydHYmZEZCiO6BJRg2RmZobJkydj8eLFyMzMxAsvvAAAuHz5Mtzd3ZGcnIwDBw6gZcuW+PnnnzF37lx4enpWiVNYWIj//Oc/2Lp1K2JjY9GyZUsAwA8//IAzZ87AyckJ58+f19im4jlHR0ecOHECX375Jdq1a4c9e/YgMzMThw4dwu3btzFx4kTExsZix44dSEpKAvBkKsSGDRtQWFiIR48e4fbt25g/fz5at26NY8eOYdOmTejZsycAYOvWrWjevDliYmJgb29fm2+nSWnatKne5x0cHLBp0yYUFxfjyJEj8PT0xD/+8Q8oFAps3boVBQUFuHXrFuLj43HmzBkkJCTg6tWrKCoqQnl5OQIDA2FnZ1dHe0PUsHFEl4garLFjx6JRo0aIjY1VL4uLi8P48eMRFhaGgIAATJ8+Hd26dUNMTIzWGDY2NnjllVdw69Yt9bLk5GT85z//QUREBIKDg+Hl5aV+rqCgAP/85z/x0UcfISQkBE5OTti6dSsAYPLkyXBwcMBrr72G6dOnw8HBAR06dMCDBw/U269fvx4PHz5EcHAwPvvsM3Tt2hXvv/8+SkpK0LdvX9y7dw+pqal4/fXXcfDgQWRkZGD//v1yv3UN2ooVKzBw4EB89NFH+Prrr7F582bs2LEDBQUF+O677zB16lQsXLhQPZ1l9OjRaNmyJby9vREcHMwml6gOsdElogbrueeew4QJE7Bz507k5+ejoKAASqUSrq6u+Oqrr+Dh4YHLly/j5s2bKCgo0BrD3Ny8ykloq1evxtChQ6FQKAAA3bt3Vz9nb2+PDRs2wM3NDWfPnsWjR49QWKj9ahWWlpZo0qSJ+rFKpcKmTZvQu3dv9bJJkybh5s2bSExMhLm5ORo3bgxPT0+0adMGdnZ2ePHFF3Hv3j3R7xFpEgQBe/fuxbFjx7B582bs378fAwcORH5+PiwsLHDnzh384x//QGZmJj74oG6uBEJEurHRJaIG7d1330VpaSni4uKwc+dOjB07FgDg7OyMJUuWICMjAx4eHnpjVDS0FS5evKgxalf5eRsbG0RERKC4uBjt27eHIAg1ip2dnY1Hjx6hvLxcvaxp06aws7PD7du3tb6WhYWF3vhkmOzsbOTk5GDSpEmYMmUKpkyZgjVr1uD999+HjY0NNm3ahCtXrmD48OFYv349Hj9+bOyUiRo0NrpE1KA1a9YMo0aNwr///W/8+uuv8PT0RH5+Pt5++22899578PHxMfjkMwcHB1y5ckXrczdu3EBQUBBCQkLg7e1tUFxnZ2fY2trijz/+qPJchw4dDIpF4jRu3BgKhQL79mleKi01NRVFRUVwc3PDDz/8gIiICHz//ffqay0TkXEYtdFVKpWIiIjAihUrsHjxYpSWlmpdb+3atYiOjsbatWuxYsUKjdEJpVIJLy8vdOzYER07dsRPP/1UV+kTkYmYMmUK7ty5g379+gEAMjIykJubi+zsbGRnZ+P8+fMoLi7GX3/9BeDJn6+f/hyq+O+Kf48cORK7d+/GuXPn1PEAICsrC7///juKi4uRk5OD27dv488//9SIbWlpiZycHNy4cQPFxcUasStOoNu1axeUSiUA4Pfff0erVq3Qv39/AMDjx4+rjOByRFe8itHzin+bm5tj9OjRWLhwIWJiYpCWloZ//etfUCgUKCgowObNm2FmZoaAgAAMGjRI/d5bWVkhJycH2dnZGnOuiah2GfWqC+Hh4fD19YWvry/i4+MRFRWFuXPnaqxz5MgR3Lx5E5GRkQCAuXPn4sCBA+rrW+7cuRMRERHq62A+PXeNiKgmOnbsiBEjRuCNN94AAHTq1AlDhgxBYGAg/Pz8MGzYMHz55Ze4cOECnnvuOfz888+4d+8e9u7dCx8fH+zatQsAEB8fj6lTp2LmzJkoKChAYGAgunfvji5duqBdu3Y4ePAgxowZg65du2LcuHEYN24chg0bhtjYWNy5cwdt2rSBv78/1q5di9LSUowfP159Itn333+PCRMmYMaMGSgtLUVQUBB69uyJgoICrFu3Dubm5khJScGff/4JAPDz88OjR49w7do1lJWV4fXXX4e7u7tx3uBn1K1bt9Qjsvv370fbtm3h5eWFuXPnwszMDN988w3s7Owwc+ZMeHp64v79+4iJicGDBw/QoUMHNG/eHG+++SYA4I033kBkZCQUCgXmzZtnzN0ialAUgpF+6mdlZcHX1xdpaWmwtrZGdnY2Bg8ejKSkJI3L4GzYsAEXLlzAihUrAAARERHo1KkTxo8fj8ePHyMwMBDz5s2T9AGuVCpx6dIldO7cGba2tpL3jaghaii3ACZxeAtgIjIGo43opqamwsnJCdbW1gCezD2ztLREeno6+vTpo15vyJAhWLVqFRISEtCnTx88evRI/Qv5+PHjOH36NPz8/NC/f38sXbpU4wxlIqo7bDRJHzabRGQMRmt0s7KyNG67CTy57WJWVpbGMnd3d0RFRSEkJASenp5YtWqV+p7vgwYNwunTp3Hq1ClEREQgKCgIcXFxBp84UqHyvDsiIiIiqn8qX2FGF6M1ugqFQj2aW6GsrAyWlpZV1i0pKcGaNWsQERGBjz/+GKtWrYKFhYU6jqenJ2JjY+Hn54ezZ8+q7wpkKKVSCZVKJWpbIiIiIqobjRo1qtF6Rmt0XVxckJ+fr7FMqVTCxcVFY1lKSgrOnz+PsLAwxMbGYvz48di0aROmTZumsZ6zszOGDx+Ou3fvis7J1taWc3SJiIiITITRGl0vLy8sWLAApaWlsLKyUk9ZqHxh9oMHD6qvD+nq6orZs2fjwIEDVRpd4MmF0Tt16iQ6J4VCUeOhcCIiIiKq30RNZs3Ly5P8wq6urhgwYADS0tIAAElJSZg4cSKsra2xceNGXLt2DQDQuXNnXLx4UWPbbt26AQASExNx9epVAMC1a9dgb2/Py+cQEREREQCRjW5oaChu3Lgh+cXDw8Oxf/9+REdH448//kBwcDAAYN++fbh8+TIAwN/fH02aNMG6deuwfft2ZGRkIDAwEACQnp6OcePG4cMPP8TRo0cxa9YsyTkRERERkWkQdR3dZcuWwdzcHHfv3sVrr72GoUOHPtN/8ud1dImIiIhMj6QbRpSVleHQoUP4+eef0b59ewQEBKBp06Zy5lcn2OgSUU3l5eXBwcHB2GkQEVENSDoZzdLSEpaWlrh27RqOHj2K69evw8bGBhMmTEDnzp3lypGIqN6IiorCvHnzYGVlZexUiIioGqIa3ZiYGDg7O2Pjxo24d+8eJk2ahMmTJ8PBwQFKpRKRkZHo27cvXn/9dbnzJSIympKSEuzduxeDBw/Gq6++aux0iIioGqIa3Ypb7f7tb3/DO++8Azs7O/Vztra28PLywhdffMFGl4hMyrFjx1BYWIiEhAQ2ukREzwBRja6Pjw++/PJLjQb3afb29ujdu7ekxIiI6puDBw8CAA4fPqy+BjgREdVfok5Gq3wyxrP+gc+T0YiosqSkJGzevFnjtuCnT5+GUqkEAPTs2VPj88LT0xOBgYEwMxN11UYiIqoFoj6RL1y4AD8/P9y/fx8AcP78eaxYsQJFRUWyJkdEZCz9+vXDpEmTcOnSJRw/fhzHjx9XN7nAk6b3+PHjSE5ORo8ePTBt2jQ2uURE9YyoT+WVK1di0KBBcHR0BPBkZOOll17CZ599JmtyRETGNHDgQOzevRt9+/bV+rybmxtiY2MxY8YMmJub13F2RERUHVGNrre3Nz755BON6QpOTk5ITEyULTEiovqgWbNmWLdundZpTZGRkXjllVeMkBUREdWEqEa3tLRUY5pCQUEBVq1aBTc3N9kSIyKqL9LS0jSmLVT45ZdfjJANERHVlKhGd+zYsfD398fMmTMRFBSEV199FWfPnsXcuXPlzo+IyOgSEhIAAJ07d8auXbvg7+8PADh06BAk3FySiIhqmehbAGdnZyM+Ph6ZmZlwc3PDyJEj0aJFC7nzqxO86gIR6aJSqTBw4EAMHz4cc+bMUU/Z2r9/PxYsWID169fj5ZdfNnKWRESkjehGt7KMjAzcuXPnmbx+LhtdItLlypUruHXrltYbRNy8eRPp6enw8/Or+8SIiKhaom4YcfXqVcTFxaGgoED9Z7uSkhL8+uuvnLNGRCYjZvXXKMzLBQCkJydVed7OwRHv/8/0uk6LiIhqSFSjGxYWBicnJzx69Ajt27cHAGRmZmLy5MmyJkdEZKinm1NtDGlOC/NyMfrkPp3Px3uPNFpuRERUPVGNbt++ffHxxx/j3LlzKCkpgZeXF+7cuYOtW7fKnR8RkUHkbk7lVJ9zIyIyRaIa3ZycHGRlZaF79+5YtGgRunXrBpVKhR07diA4OLjGcZRKJZYtWwYHBwcolUqEhoZqvZXw2rVroVKpYGZmhqKiIsyePRsKhQLAk3vOJycno7S0FMOHD9d5YXciIlPC0WEiouqJanRffvllDBkyBBs2bMDIkSMxaNAglJSUoEuXLgbFCQ8Ph6+vL3x9fREfH4+oqKgqlyg7cuQIbt68icjISADA3LlzceDAAYwYMQJXr17FmjVrsH37dgiCAH9/f6xduxaurq5idouIakjOJosNmzh1Oa2C/w+I6FklqtF99dVXkZKSAnt7ewDAjh078Mcffxg0mpqVlYWEhAQsWrQIwJNbbS5cuBAzZsxQxwWenPhWWFiofmxjY4P8/HwAwLfffosBAwZAoVBAoVCgR48e2LJli0GjykRkODmbLP45v37Q9/+Bc5GJ6FklqtH19/dHUFAQ3nrrLQBAq1at0KpVK4NipKamwsnJCdbW1gAAZ2dnWFpaIj09HX369FGvN2TIEKxatQoJCQno06cPHj16hDfffBMAkJKSgqlTp6rXbd26NQ4dOiRmlwAAgiDw4u9EMpGzluSuS+ZWu7Fq8uPFkHibor9GYV6e1ufsHBzw3t/ZNBM1NBVTWKsjqtH18PDQOnp77tw5dO/evUYxsrKy4OjoqLHMzs4OWVlZGsvc3d0RFRWFkJAQeHp6YtWqVbCxsVHHaNy4scb29+7dM3Bv/j+lUgmVSiV6e6L6Km5TDJQF+Tqft7VvhPHvvV/jeNU1KYIgoKCgoM5jMbfayc2Y+wkABbm5GJOyX+tzP/QeYVAsuWuBiIyjUaNGNVpPVKPr7u6OOXPmaDS7KpUKP/30E/bu3VujGAqFQj2aW6GsrAyWlpZV1i0pKcGaNWsQERGBjz/+GKtWrYKFhQUUCoXGyWtlZWWwsBC1SwAAW1tb3jCCTFJRYYHORgF4MsL29JSh6lT3S1qhUNQ4npyxxMSL3hCDPB2NknlxiVFzq6tY1cUz5n7KnZvctUBE9ZuorvDcuXPIzc1FSkqKxvIHDx7UOIaLi4t6rm0FpVIJFxcXjWUpKSk4f/48wsLCEBsbi/Hjx2PTpk2YNm0aXFxcNH7JFxYWVtneEBVzfYnqg7qe5yj3sS9nvKdjrd6wEXn5hTrXNS8uNiheXkEhUrsO0bqe97E4g2LJobbet/oUS+54xsxNzpP4OLeZSH6iGt133nkHffv2VU8hqJCUVPXOQbp4eXlhwYIFKC0thZWVlXrKgoeHh8Z6Bw8eRIcOHQAArq6umD17Ng4cOIBp06bB29sb169fV6+bkZHxTN6CmEgbnqSlXV5+IVK7Dtb5fE2a09oiRxNOzxY5T+JjzRPJT1SjO2RI1dGP4uLiKvNr9XF1dcWAAQOQlpaGfv36ISkpCRMnToS1tTU2btyIwYMHw93dHZ07d0Z6errGtt26dQMATJw4EYsWLcL06dNRXl6O3377DTNnzhSzS0Sy4CWaGrb63IRTwyL36DBHm+lZJarRHTp0aJVl+fn5aNOmDcaOHVvjOOHh4YiKilJPhQgJCQEA7Nu3Dy1atIC7uzv8/f1x+/ZtrFu3Dk5OTrhz5w6CgoIAAJ06dcLYsWPx5ZdfoqysDHPnzkWzZs3E7BKRLOQc3aGGjaPDJIXco8McbaZnlahGt2vXrhg8WHPU4tixYxqXBasJZ2dnLF68uMryXbt2qf/bzMwMs2bN0hnD39/foNckorqnr2ljw6ad3KPDbJypvmhIo831ObeGQlSjGxYWhhYtWmgs8/LywsaNG2VJioiMS+6mSF/Txj/n1w05G2c2zSRFfR5tlrsxrc+5NRSiGt3KTS4AlJeXY9++fViwYIHkpIjIuDjXlPTh8UGmqj5P0ajPudVnok9Ge/ryKyqVCvfv39d6khpRfcZfyETGxxFiomdbff4uFdXodu7cGT4+PurHZmZmaNasmda7pRHVZ6b0C5nzYOlZxWkVRHVPzqsE1efvUlGNbmhoKNq0aSNzKkQ1w0t4acd5sEScVkFUUw3lKkGiGt2ioiJMnToVy5Ytg5OTE5KTk/H7779jypQpvLMY1bqGUpxEZHxyjhBztJmoZuQc0BLV6EZERKBZs2awtrYGAPTp0wdZWVlYunQpwsLCxIQkanD4pUdU/8k5QszRZqKakXNAS1Sj27NnT8yZM0djWZs2bfDFF1+w0aUq6vMkdWPilx4RSSHnvHz+8CZTJarRrTw9QRAEfPvtt3B0dJQlKTIt9XmSuqH4ZUBE9YWc8/Lr8gYl/JykuiSq0R08eDDGjh2L3r17o7S0FL/88gtu376NZcuWyZ0fUb3CUVgiourJ2YRzgIGkENXovvLKK1i2bBm2bNmCzMxM9O3bF/7+/ujevbvc+REREVEDVp9Hm9mE13+iGl0AaNu2LebPnw8AyMrKgqurq2xJkfHxEl5ERGSK6uuUDzbNtUNUo7tv3z58+umn2L9/P9zc3FBUVITw8HDMmDEDTZo0kTtHMgJewouIiKjucGpc7RDV6H733Xf4+OOP8fzzzwN4csUFHx8fLFiwAKtXr5Y1QSIp+AuZiIgaIl4D+glRjW7//v0xadIkjWXm5uY4efKkLEkRyYW/kImIqCHiNaCfENXoFhYWaszLzcjIwBdffIH27dsbFEepVGLZsmVwcHCAUqlEaGgorKysNNZJSUnB5MmTNZa99NJL2LlzpzrGq6++itzcJ/NJv/76a/j6+orZLSIiIiIyIaIa3cmTJ2Pq1KmwsrJCaWkprl27hsaNG2Pjxo0GxQkPD4evry98fX0RHx+PqKgozJ07V2OdkydPYuXKlXBzcwPwpPEtLy9XP79z505ERESor+Hbu3dvMbtkFHLeSMGUbsrwLP+JhIiIiOoPUY2um5sbdu7ciSNHjiAzMxNubm4YNGgQUlNT0alTpxrFyMrKQkJCAhYtWgQAGDhwIBYuXIgZM2bA3t5evd64cePQvHlz9eMdO3aoR3gfP36Mo0ePYt68eXB3dxezK0Yl540UTOmmDM/yn0iIiIhIv7oc0BJ9eTErKysMGzZM/TgpKQlLlizBkCFDarR9amoqnJycYG1tDQBwdnaGpaUl0tPT0adPH/V6Tze5KpUKV69eRYcOHQAAx48fx+nTp+Hn54f+/ftj6dKlvOqDEXAEloiIiGqqLge0RDe6AFBaWooff/wR3333HS5dulTl1sD6ZGVlVbllsJ2dHbKysnRuc+bMGfTo0UP9eNCgQTh9+jROnTqFiIgIBAUFIS4uDmZmZgbvC/DkVsaCIIjatrbImU9txcrLL0BqV90/cGpywGrmJi1POWPJHY+5GT+W3PFqL7eGsp/S4zE348eSO17DzK2h7Kf0eIIg1LjnFNXo3rt3D1u2bMG2bduQk5OD/v37Y9asWUhPT69xDIVCoR7NrVBWVgZLS0ud2yQmJlY50UyhUMDT0xOxsbHw8/PD2bNn0bNnT8N26P8olUqoVCpR24pRXeMpCAIKCgrqPFZ18SrHktpAyxmPuRk/FnOTJ7eGsp/MjbkxN9a8mFiNGjWq0foGNbrnzp1DbGwsDh48CBsbG4wZMwYlJSX47LPPAABeXl41juXi4oL8/HyNZUqlEi4uLnpfPzQ0VOtzzs7OGD58OO7evVvjHCqztbWFra2t6O0NVd2vEYVCoTFfua5iVRevcixDRvJrOx5zM34s5iZPbg1lP5kbc2NurHkpsapT40Z3xowZSExMxIsvvoh//vOfGD16NGxtbbF8+XL1OoY0iV5eXliwYAFKS0thZWWlnrLg4eGhdf3Lly+jXbt2eqclWFhY1PhkOG0UCoXeN98YVzaQenDpiiV1Xq1mXtJzlDMeczN+LLnjNczcGsp+So/H3IwfS+54DTO3hrKf0uMZ0hvVuNFduXIl9u/fj3379iE3NxclJSWSRj9dXV0xYMAApKWloV+/fkhKSsLEiRNhbW2NjRs3YvDgwRpXUkhMTISPj49GjIrGu23btrh27Rrs7e1r9eoLvLIBERER0bOjxo2uubk5Ro0ahVGjRuHXX3/FkiVLYG9vr3FN20ePHsHJyanGLx4eHo6oqCicO3cOubm5CAkJAQDs27cPLVq00GhaU1JSMHXqVI3t09PTMWfOHHh6eqJ3796YNWtWjV+biIiIiEybqJPRevXqhV69euHmzZv497//jZCQEIwZMwanT5/GzJkzaxzH2dkZixcvrrJ8165dVZZ9++23VZYFBwcjODjYsOSJiIiIqEEQdx2u/9OyZUt88skniIiIwMWLF7F582aZ0iIiIiIikkbSdXQr2NvbIzAwUO8VE0ga3pSBiIiIyDCyNLoVRo8eLWe4Z56czSlPHiMiIiIyjKyNLmlic0pERERkPJLm6BIRERER1VdsdImIiIjIJLHRJSIiIiKTxDm6leg7gYxXNiAiIiJ6drDRrUTfCWQ8eYyIiIjo2cGpC0RERERkktjoEhEREZFJYqNLRERERCaJjS4RERERmSQ2ukRERERkktjoEhEREZFJYqNLRERERCbJqNfRVSqVWLZsGRwcHKBUKhEaGgorKyuNdVJSUjB58mSNZS+99BJ27twJADh8+DCSk5NRWlqK4cOHo2/fvnWWPxERERHVX0ZtdMPDw+Hr6wtfX1/Ex8cjKioKc+fO1Vjn5MmTWLlyJdzc3AA8aXzLy8sBAFevXsWaNWuwfft2CIIAf39/rF27Fq6urnW+L0RERERUvxht6kJWVhYSEhIwcOBAAMDAgQOxdetWFBQUaKw3btw4+Pn5oUePHujRowcyMzPh6+sLAPj2228xYMAAKBQKmJmZoUePHtiyZUud7wsRERER1T9GG9FNTU2Fk5MTrK2tAQDOzs6wtLREeno6+vTpo16vefPm6v9WqVS4evUqOnToAODJ6O7UqVPVz7du3RqHDh0yOBeVSgUAKCoqQiN7WzxvrtK6XiNHR5Q931JnHLtGDigsLPz/6+uJZWg8OWNJjVeb+8ncaic3Yx67zE1cPB67zE1KPNbVs5cbj13DclMoFLCxsYGZmf4xW4UgCILeNWrJhg0bsGfPHuzZs0e9bNCgQQgODsbo0aO1bvPrr78iMTERYWFhAIAePXpg2bJl6hHe7du345tvvkFiYqJBuTx8+BB//fWXqP0gIiIiorrXuXNn2Nra6l3HaCO6CoVCPZpboaysDJaWljq3SUxMVDe1FTGePnmtrKwMFhaG75KjoyPatGkDa2vran8ZEBEREZHx2djYVLuO0RpdFxcX5OfnayxTKpVwcXHRuc25c+cQGhqqEePpOb2FhYV6t9fFwsICTZo0MXg7IiIiIqq/jDZ86eXlhaysLJSWlgJ4cnIaAHh4eGhd//Lly2jXrp3GiKu3tzeuX7+ufpyRkYHevXvXYtZERERE9KwwWqPr6uqKAQMGIC0tDQCQlJSEiRMnwtraGhs3bsS1a9c01k9MTISPj4/GsokTJyI5ORkAUF5ejt9++w1vvfVW3ewAEREREdVrRjsZDQCys7MRFRWFFi1aIDc3FyEhIbCyssLYsWMRGBiI4cOHq9f929/+hvXr11e5ocTOnTvx559/oqysDD4+PvD29q7r3SAiIiKiesiojS4RERERUW3hJQaIiIiIyCSx0SUiIiIik8RGl4iIiIhMEhtdIiIiIjJJbHSJiIiIyCSx0SUiIiIik8RGt4Z++eUXBAQE4ObNm5JjHTp0CEOGDEHv3r0RGRmJ8vJy0bFOnz6NESNG4JVXXkFkZKTk3ACgtLQUb7zxBlJSUiTHWrNmDTp27IiOHTvijTfekCG7J/scExODxMREZGdni4oxadIkdV4V/xw9elR0TlevXkVERAQ2b96M8PBwXLp0SXSs1NRUzJs3D//7v/+L8PBwFBcXGxxD2/GqVCoRERGBFStWYPHixeq7EoqNl52djaVLlyIiIkJybmJrQlssKTWhr84NrQtdscTWhL7cDK0JbbGk1IS2eGJrQlssMTWh65gSWwf6jlFDvx90xRJbB7q2E1ML1eVgaB3oi2doLVSXm6F1oCuemFrQFUtMHeiKJfa7QddxILYW9B1XhtaCrlhy9kkQqFoPHjwQDh8+LHTo0EHIzMyUFOvWrVtCaGiokJ6eLsTHxws9evQQNmzYICpWQUGBsGbNGiEnJ0c4cuSI0KVLFyEpKUlSfoIgCKtXrxZ69uwpnDx5UlKckpISYf78+UJSUpKQlJQkXL9+XXJu27ZtE5YvXy4pxs2bN4WFCxcKqampwpkzZ4QzZ84Io0aNEoqLi0XHHDNmjHD37l1BEJ78Px4+fLioONnZ2cKQIUOEoqIiQRAEYfPmzUJkZKRBMXQdr6GhocKhQ4cEQRCEH374QViyZImkeOfPnxeCgoKEsLAwSbmJrQltsaTURHV1bkhd6Ioltib05WZoTWiLJaUmdOUmpia0xRJTE/qOKTF1oC+eod8PumKJrQNd24mphZrkYEgd6ItnaC1Ul5uhdaArnpha0JeboXWgK5bY7wZ9x4GYWtAXz9Ba0BVLzj5JEASBjW4NPX78WJZGNy0tTSgrK1M/Xrp0qTBt2jRRsYqLiwWVSqV+PGbMGCE5OVlSfqdOnRJ27NghDB48WHKju23bNuGbb74RlEqlpDgVUlNThSlTpmjssxi3bt3SeHz37l1hxowZkmJ2795d+PPPPwVBEISHDx8K/fr1ExVn27ZtwtixY9WPMzIyhK5duwqFhYUGxal8vN69e1fo1q2b+sP64cOHgoeHh5Cfny8qXoWVK1ca1OhqiyWlJirHkloTuvZTTF1oiyWlJrTFE1sTlWNJrQltuYmticqxxNSErmNKbB1Ud4wa8v2gK5bYOtC1nZhaqC4HQ+tAXzxDa0FfLDF1oCuemFrQl5uhdaArltjvBl3HgdhaqO64MqQWdMWSs08SBEHg1IUaMjOT56165ZVXYGFhoX7s4uICNzc3UbGsra2hUCgAPPkThLu7O3r37i06t8LCQhw6dAj+/v6iYzxtz549WLFiBfr164fdu3dLjvf555/D3d0dn332GaZOnYozZ86IitO8eXONx4mJiRg6dKik3Pz8/PDpp5+ioKAAe/bswfz580XFKSwsRFZWlvrx888/j7KyMvz1118Gxal8vKampsLJyQnW1tYAAGdnZ1haWiI9PV1UvOqWGxJLSk1UjiW1JrTtj9i60BZLSk1oiye2JirHkloT2nITWxOVY4mpCV3HlNg6qO4YNaQOdMUSWwe6thNTC/pyEFMH+uIZWgv6YompA13xxNSCvtwMrQNdscR+N+g6DsTWQnXHlSG1oCuWnH0SwDm6Rpeeno6JEydKinHixAm8//77KC8vR1FRkeg469evR2BgoKRcnvbdd9/hxIkTmDx5MsLCwiTNgb1+/TouXryIgIAALFy4EN7e3vjggw/w8OFDyXkePXoUgwcPlhRj/vz5sLS0REBAAGxtbTFs2DBRcby9vfHw4UPs27cPAHDhwgUAgEqlkpRfVlYWHB0dNZbZ2dlpfHDWF/WpJgB564I1YTg5aqLimJKrDuQ4RquLJfY1Km8npRaejiVHHTwdT2otVMSSqw50vd9iauHpWFLroCKW1DqofBxIrQU5P2OriyW13tjoGtFff/2Fpk2bolOnTpLitG/fHuPGjUNycjKWLl0qKsYvv/yC7t27o0mTJpJyqczJyQmzZ8/GRx99hNjYWNFxrly5AkdHR3Tu3BnAk5MFBEFAYmKipPzy8vKgUCjg4OAgKU5xcTFGjhyJN998E59//jlOnjwpKk6nTp2wcuVKxMXFITIyEnv27IG5uTlatWolKT+FQqH+5V6hrKwMlpaWkuLKrT7VBFA7dcGaMIzUmnj6mJKjDuQ6RvXFEvsa2rYTWwtPx5KjDrTlJrYWno4lRx3oer/F1ELlWFLq4OlYUuug8nEgtRbk+oytLpYc9WZR/SpUG8rLyxEXF4ePP/5YcqxmzZrB398fZmZm2LBhg6gYmzZtwvnz59WPCwoKEBQUhI8++kiW0ax33nkHCQkJorcvLy/H48eP1Y+tra3RunVr5OTkSMrryJEjGDRokKQYABAaGoqoqCg0btwYgiAgODgYhw8fhq2trcGxhg0bpv7VP2vWLAwcOFBy0+Hi4oL8/HyNZUqlEi4uLpLiyqm+1QRQu3XBmqg5sTVR+ZiSWgdyHqO6Yol9DV3biamFyrGk1kF1+2RILVSOJbUO9OVmaC1oiyW2DrTFkvLdUPk46NWrl6RakOszVl8sueqNI7pGsnHjRkydOhVWVlayxezSpQtcXV1Fbbts2TLEx8er/3FxcUFkZCQmTJggS25mZmbo0qWL6O07duyI/Px8jUvGmJubo23btpLy+vnnn+Hj4yMpRnZ2Nv744w80btwYAPDRRx/Bzs4OV69elRT38uXL+O9//4uQkBBJcQDAy8sLWVlZ6svHVPx5ysPDQ3JsudS3mgBqty5YE4YztCYqH1NS60DOY1RXLLGvUd12htRC5VhS66C63AyphcqxpNaBvtwMrYXKsaTUgb68pHw3VBwHcn0nSP2M1RdLrnpjo1tDgiBo/FuK6OhodO3aFUVFRcjMzMSOHTtw48YNg+OUlJRo/Mr+73//i0mTJonKqVmzZmjZsqX6HwsLCzRt2lT0SGJ2djZ27dqFx48fQxAEbNy4EbNnzxYVCwDatm2LAQMGqH/15+XlobS0VNLIU0lJCXJzcyUXaePGjWFlZaUxt8nR0REvvvii6Jj5+fmYN28evvjiC7Rv397g7Ssfr66urhgwYADS0tIAAElJSZg4cWKVP13VNN7Tyw2tCW2xxNZE5VhSa6JyPCl1UTmW1JqoHE9KTej6/ym2JirHk1ITunIztCa0HVPFxcWi60DfMWro94OuWGLrQNt2ly9fFlUL2mIplUrRdaAtXnp6uqha0BbLwsJCdB3oe78NrQVtsXJzc0XVgb68DK0DXZ+JYr8TqvuMNaQW9MWSq08COHWhRgoLC9VnhcbHx+Odd96Bs7OzqFirV6/GV199pbHM3d0dAQEBBse6fv06AgMD0apVK7z88st46aWXJJ9AIpfCwkJER0fjm2++Qa9evfDee+/hhRdekBRz6dKlWLx4MUpKSnD79m0sX75c0hzTEydOoG/fvpJyAp6MRkRHR2P16tXo2rUrHjx4gLCwMNjb2xsc6/79+zhx4gQuXryIiIgIUSN+uo7X8PBwREVF4dy5c8jNza3xaICueOfPn0dKSgqys7ORlpYGT09PUbG+//57UTWhLda9e/dE14Scda4tlpSa0JWbmJrQt59iakJXPDE1oS3W48ePDa4JfZ+zYupAXzxDjxtdsbKyskTVga54K1asMLgW5Px+0hdv3bp1BteCvtzE1EF1+2pILeiLZWgd6Io1aNAg7N692+DvBn19gpha0BfP0FrQFUvu41AhyDFESURERERUz3DqAhERERGZJDa6RERERGSS2OgSERERkUlio0tEREREJomNLhERERGZJDa6RERERGSS2OgSERERkUlio0tE1ICMHj0aBw4cMHi7hw8fYvny5Rg9erT8SRER1RI2ukREMklPT8esWbPQsWNHhISE4OTJk8ZOqYrAwEC8/PLLBm+nUChQUlKCvLy8WsiKiKh2sNElIpJJt27d8NZbbwEA/v73v8Pb29vIGVU1YsQIPP/88wZv5+zsjHbt2tVCRkREtYeNLhGRjCwsLDT+bUrMzc2NnQIRkUHY6BIR1bFffvkFn3zyCb7++muMHTsWaWlpAIDt27ejS5cumDJlCu7fvw8AuHjxIvr164czZ84AAI4dO4Z169Zh5syZmDJlCjIzM/HgwQMsX74c/fv3R3JyMvr164fo6OgqrxsfH4/x48fjhx9+QFlZGeLi4vD6668jMTERoaGh6NWrF+bPn6+xzfr16xEZGYkvv/wSO3bs0Hju3r17iI6OxtKlSzF69Gj8+OOPAICdO3eiV69eGDp0KB48eIDt27dj1KhR+O2332R/L4mI9GGjS0RUx8LCwhAQEIDp06ejW7duiImJAQCMGzcO48aNw+PHj9GsWTMAgLW1NQICAvDyyy/j999/x6lTpxAYGIivvvoK1tbWCAsLg6OjI9q1a4f79+/j0aNH+Ne//oU+ffpUeV1fX1/8+eefEAQBFhYW8PHxwZUrV3DixAksWLAAMTEx2LZtG/766y8AwI4dO5Ceno5PP/0UYWFhGlMXVCoVlixZgg8++ABz5sxBUFAQwsLCcPXqVfj7+2PRokW4e/cu7t27hz/++APffPMNPDw8av/NJSJ6iun9bY2IqJ776quv4OHhgcuXL+PmzZsoLS1VP/fhhx/itddew2+//QYPDw9s374dkydPBgBs3boVKpUKmzdvBgC4ublBEASYm5vDxcUFAODn5weFQqH1de3s7ODg4ADgycllzs7OAIBhw4ahUaNG6Nq1KwDg/v37aNOmDVavXo3g4GD19t27d8fx48cBAOfPn8eNGzfw/fffAwCKiorg7e2Nu3fvom3bthgxYgQOHTqEoKAgzJ8/H82bN5fr7SMiqjE2ukREdczZ2RlLlixB//794eHhgVOnTqmfa968Od544w1ER0dj5cqVyMnJUTeJt27dwsiRI7Ve4quiudXV5FZeT9u6FfOKVSoVcnJycPv2bdjZ2Wld/+bNm3BwcMCUKVN0vta0adMQEBCAW7du6c2JiKi2cOoCEVEdSUtLQ35+Pt5++22899578PHxgZlZ1Y/hDz/8EMeOHcPSpUsxcuRI9XJXV1fs3r1bY91Tp05BEATZc7W1tYWFhQWuXLmi9XlXV1ecPn0amZmZ6mXFxcXqebjl5eWIi4vD8uXLsWLFCly/fl32HImIqsNGl4hIRo8fPwbwpNF72rVr13D69GlkZGQgNzcX2dnZyM7Oxvnz51FcXKyeFwsArVu3xvDhw3Hs2DH0799fvXzMmDFITk7G7NmzkZSUhB9//BHHjh3TGGmteH1dBEFQN8YqlUq9rPI6VlZW8PX1RWxsrDq3GzduIC8vD0qlEh4eHmjVqhWmTJmCPXv2IDk5GREREWjVqhUAYM2aNXj33Xfh5+cHHx8ffPLJJ1XeEyKi2sZGl4hIJr/99hu2bt0KAJgzZw5CQkIQEhKCadOmYcyYMejVqxc6deqEIUOGIDAwECtXrsSwYcOQkZGBCxcuaMR68803MWHCBI0mtlevXli+fDkuXbqEWbNm4fjx4/jwww/x4MED9RUPoqOjUVBQoDW/n376Cffu3cORI0dw+/ZtbNmyBQCQkJCAu3fvYvv27QCAAwcOIDs7GxEREfDy8sL48eMxc+ZMFBYW4sUXX0RCQgIsLS2xdu1avPjiiwgPD8eyZcvw9ttvo3HjxoiJicHevXthb28PAGjZsiXOnj2LsLAwZGVlyfumExHpoRBq429eREQkyaJFizBjxgw0btzY2KkQET2zeDIaEVE9kZmZicOHD8POzg42NjZscomIJOLUBSKieuL3339HdHQ0UlNTMWvWLGOnQ0T0zOPUBSIiIiIySRzRJSIiIiKTxEaXiIiIiEwSG10iIiIiMklsdImIiIjIJLHRJSIiIiKTxEaXiIiIiEwSG10iIiIiMklsdImIiIjIJLHRJSIiIiKT9P8ANz/16DCm69IAAAAASUVORK5CYII=",
      "text/plain": [
       "<Figure size 710x180 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Best layer: 14; corresponding epoch idx (0-based): 2\n"
     ]
    }
   ],
   "source": [
    "# --- aesthetics (light touch) ---\n",
    "sns.set_theme(style=\"whitegrid\", context=\"paper\", font_scale=1.1)\n",
    "fm.fontManager.addfont(\"font-times-new-roman/Times New Roman.ttf\")\n",
    "fm.fontManager.addfont(\"font-times-new-roman/Times New Roman - Bold.ttf\")\n",
    "fm.fontManager.addfont(\"font-times-new-roman/Times New Roman - Bold Italic.ttf\")\n",
    "fm.fontManager.addfont(\"font-times-new-roman/Times New Roman - Italic.ttf\")\n",
    "plt.rcParams.update({\n",
    "    \"axes.spines.top\": False, \"axes.spines.right\": False,\n",
    "    \"grid.alpha\": 0.25, \"legend.frameon\": False,\n",
    "    \"pdf.fonttype\": 42, \"ps.fonttype\": 42,\n",
    "    \"font.family\": \"Times New Roman\"\n",
    "})\n",
    "\n",
    "# ---- your original processing ----\n",
    "val_accuracies = []\n",
    "test_accuracies = []\n",
    "best_epoch_idx = []\n",
    "\n",
    "for i, history_df in enumerate(history_list):\n",
    "    max_val_epoch_idx = history_df['val_acc'].idxmax()\n",
    "    val_acc = history_df.loc[max_val_epoch_idx, 'val_acc']\n",
    "    test_acc = history_df.loc[max_val_epoch_idx, 'test_acc']\n",
    "    val_accuracies.append(float(val_acc))\n",
    "    test_accuracies.append(float(test_acc))\n",
    "    best_epoch_idx.append(int(max_val_epoch_idx))\n",
    "\n",
    "best_layer_idx = int(np.argmax(val_accuracies))\n",
    "best_layer = layer_list[best_layer_idx]\n",
    "\n",
    "# ---- seaborn barplot (two bars per layer) ----\n",
    "df = pd.DataFrame({\n",
    "    \"layer\": layer_list,\n",
    "    \"Validation\":   val_accuracies,\n",
    "    \"Test\":  test_accuracies\n",
    "})\n",
    "dfm = df.melt(id_vars=\"layer\", var_name=\"Split\", value_name=\"Accuracy\")\n",
    "\n",
    "fig, ax = plt.subplots(1, 1, figsize=(7.1, 1.8))  # slightly wider for 32 layers\n",
    "palette = {\"Validation\":\"#4DBBD5\", \"Test\":\"#E64B35\"}\n",
    "\n",
    "sns.barplot(\n",
    "    data=dfm, x=\"layer\", y=\"Accuracy\", hue=\"Split\",\n",
    "    order=layer_list, palette=palette, ax=ax, dodge=True,\n",
    "    edgecolor=\"gray\", linewidth=0.6, saturation=0.95\n",
    ")\n",
    "\n",
    "# --- axes to mirror your previous settings ---\n",
    "ax.set_xlabel('Layer index', fontsize=11)\n",
    "ax.set_ylabel('Accuracy', fontsize=11)\n",
    "ax.set_ylim(0.7, 0.85)\n",
    "ax.set_yticks([0.70, 0.75, 0.80, 0.85])\n",
    "ax.grid(axis=\"y\", alpha=0.25); ax.grid(False, axis=\"x\")\n",
    "ax.tick_params(axis='x', labelsize=10)\n",
    "ax.tick_params(axis='y', labelsize=10)\n",
    "\n",
    "# legend (keep it simple; move slightly up if you prefer)\n",
    "ax.legend(loc='upper center', bbox_to_anchor=(0.5, 1.10), ncol=2, fontsize=11, frameon=False)\n",
    "\n",
    "# --- star marker on best layer ---\n",
    "# add a little headroom so the star isn't clipped\n",
    "ymin, ymax = ax.get_ylim()\n",
    "ax.set_ylim(ymin, ymax * 1.04)\n",
    "ax.annotate(\"$^\\star$\", (best_layer_idx, ax.get_ylim()[1] * 0.85),\n",
    "            ha=\"center\", va=\"bottom\", fontsize=35)\n",
    "\n",
    "plt.tight_layout()\n",
    "plt.show()\n",
    "\n",
    "# save\n",
    "fig.savefig(\"figs/iclr/pred_acc_by_layer.pdf\", format=\"pdf\", bbox_inches=\"tight\", pad_inches=0)\n",
    "\n",
    "print(f\"Best layer: {best_layer}; corresponding epoch idx (0-based): {best_epoch_idx[best_layer_idx]}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "dc9900d0",
   "metadata": {},
   "outputs": [],
   "source": [
    "selected_layer = best_layer\n",
    "selected_epoch = best_epoch_idx[best_layer_idx]\n",
    "\n",
    "interval = 16\n",
    "warmup = 5\n",
    "patience_high = 5\n",
    "threshold_val_percentile = 80"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "2760e627",
   "metadata": {},
   "outputs": [],
   "source": [
    "val_preds = load_val_predictions(model_dir, f\"L{selected_layer}_mlp\", selected_epoch)\n",
    "test_preds = load_test_predictions(model_dir, f\"L{selected_layer}_mlp\", selected_epoch)\n",
    "\n",
    "metadata = load_metadata(dataset, model_id, for_training=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "bb279029",
   "metadata": {},
   "outputs": [],
   "source": [
    "metadata_test = metadata[metadata['train'] == 0][['unique_id', 'chain_id', 'tokens', 'correct', 'type']]\n",
    "metadata_test = metadata_test.merge(test_preds, on=['unique_id', 'chain_id', 'tokens'], how='left')\n",
    "metadata_test['pred'] = metadata_test['pred'].fillna(val_preds.pred.median())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "396d125d",
   "metadata": {},
   "outputs": [],
   "source": [
    "confusion_matrix_analysis = list()\n",
    "threshold = np.percentile(val_preds.pred.values, threshold_val_percentile)\n",
    "\n",
    "for _, chain_df in metadata_test.groupby(['unique_id', 'chain_id']):\n",
    "    chain_df_sorted = chain_df[chain_df.type == 'intermediate'].sort_values(by='tokens')\n",
    "    final_outcome = chain_df[chain_df.type == 'final'].iloc[0]['correct']\n",
    "    intermediate_outcome = chain_df_sorted.correct.values\n",
    "    token_steps = chain_df_sorted.tokens.values\n",
    "    token_final = chain_df[chain_df.type == 'final'].iloc[0]['tokens']\n",
    "    preds = chain_df_sorted.pred.values >= threshold\n",
    "\n",
    "    ours_outcome = None\n",
    "    ours_tokens = None\n",
    "    for idx in range(warmup, len(preds)):\n",
    "        consecutive_sum = np.sum(preds[idx+1-patience_high:idx+1])\n",
    "        if consecutive_sum >= patience_high:\n",
    "            if ours_outcome is None:\n",
    "                ours_outcome = intermediate_outcome[idx]\n",
    "                ours_tokens = token_steps[idx]\n",
    "    if ours_outcome is None:\n",
    "        ours_outcome = final_outcome\n",
    "        ours_tokens = token_final\n",
    "\n",
    "    confusion_matrix_analysis.append({\n",
    "        'unique_id': chain_df_sorted.iloc[0]['unique_id'],\n",
    "        'chain_id': chain_df_sorted.iloc[0]['chain_id'],\n",
    "        'accuracy_baseline': final_outcome,\n",
    "        'accuracy_ours': ours_outcome,\n",
    "        'tokens_baseline': token_final,\n",
    "        'tokens_ours': ours_tokens\n",
    "    })\n",
    "\n",
    "confusion_matrix_analysis = pd.DataFrame(confusion_matrix_analysis)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "15b9c825",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([[3364,   14],\n",
       "       [  15, 9797]])"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "cm = confusion_matrix(\n",
    "    confusion_matrix_analysis.accuracy_baseline.values,\n",
    "    confusion_matrix_analysis.accuracy_ours.values,\n",
    "    labels=[0, 1]\n",
    ")\n",
    "cm_dict[dataset] = confusion_matrix(\n",
    "    confusion_matrix_analysis.accuracy_baseline.values,\n",
    "    confusion_matrix_analysis.accuracy_ours.values,\n",
    "    labels=[0, 1],\n",
    "    normalize='pred'\n",
    ")\n",
    "cm"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "0e56371b",
   "metadata": {},
   "source": [
    "# MMLU / DeepSeeek-R1-Distill-Llama-8B"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "9769038d",
   "metadata": {},
   "outputs": [],
   "source": [
    "dataset = \"mmlu\"\n",
    "model_id = \"deepseek-ai/DeepSeek-R1-Distill-Llama-8B\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "0283489d",
   "metadata": {},
   "outputs": [],
   "source": [
    "selected_layer = 14\n",
    "model_dir = os.path.join(DSET_TO_DIR[dataset], MODEL_IDS[model_id])\n",
    "history = pd.read_csv(os.path.join(model_dir, \"model\", f\"L{selected_layer}_mlp\", \"history.csv\"))\n",
    "selected_epoch = history.epoch.values[np.argmax(history.val_acc.values)]\n",
    "\n",
    "interval = 80\n",
    "warmup = 0\n",
    "patience_high = 2\n",
    "threshold_val_percentile = 80"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "42c86556",
   "metadata": {},
   "outputs": [],
   "source": [
    "val_preds = load_val_predictions(model_dir, f\"L{selected_layer}_mlp\", selected_epoch)\n",
    "test_preds = load_test_predictions(model_dir, f\"L{selected_layer}_mlp\", selected_epoch)\n",
    "\n",
    "metadata = load_metadata(dataset, model_id, for_training=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "a636e95a",
   "metadata": {},
   "outputs": [],
   "source": [
    "metadata_test = metadata[metadata['train'] == 0][['unique_id', 'chain_id', 'tokens', 'correct', 'type']]\n",
    "metadata_test = metadata_test.merge(test_preds, on=['unique_id', 'chain_id', 'tokens'], how='left')\n",
    "metadata_test['pred'] = metadata_test['pred'].fillna(val_preds.pred.median())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "dae1e1d3",
   "metadata": {},
   "outputs": [],
   "source": [
    "confusion_matrix_analysis = list()\n",
    "threshold = np.percentile(val_preds.pred.values, threshold_val_percentile)\n",
    "\n",
    "for _, chain_df in metadata_test.groupby(['unique_id', 'chain_id']):\n",
    "    chain_df_sorted = chain_df[chain_df.type == 'intermediate'].sort_values(by='tokens')\n",
    "    final_outcome = chain_df[chain_df.type == 'final'].iloc[0]['correct']\n",
    "    intermediate_outcome = chain_df_sorted.correct.values\n",
    "    token_steps = chain_df_sorted.tokens.values\n",
    "    token_final = chain_df[chain_df.type == 'final'].iloc[0]['tokens']\n",
    "    preds = chain_df_sorted.pred.values >= threshold\n",
    "\n",
    "    ours_outcome = None\n",
    "    ours_tokens = None\n",
    "    for idx in range(warmup, len(preds)):\n",
    "        consecutive_sum = np.sum(preds[idx+1-patience_high:idx+1])\n",
    "        if consecutive_sum >= patience_high:\n",
    "            if ours_outcome is None:\n",
    "                ours_outcome = intermediate_outcome[idx]\n",
    "                ours_tokens = token_steps[idx]\n",
    "    if ours_outcome is None:\n",
    "        ours_outcome = final_outcome\n",
    "        ours_tokens = token_final\n",
    "\n",
    "    confusion_matrix_analysis.append({\n",
    "        'unique_id': chain_df_sorted.iloc[0]['unique_id'],\n",
    "        'chain_id': chain_df_sorted.iloc[0]['chain_id'],\n",
    "        'accuracy_baseline': final_outcome,\n",
    "        'accuracy_ours': ours_outcome,\n",
    "        'tokens_baseline': token_final,\n",
    "        'tokens_ours': ours_tokens\n",
    "    })\n",
    "\n",
    "confusion_matrix_analysis = pd.DataFrame(confusion_matrix_analysis)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "c49a55ab",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([[3036, 1011],\n",
       "       [ 798, 5155]])"
      ]
     },
     "execution_count": 16,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "cm = confusion_matrix(\n",
    "    confusion_matrix_analysis.accuracy_baseline.values,\n",
    "    confusion_matrix_analysis.accuracy_ours.values,\n",
    "    labels=[0, 1]\n",
    ")\n",
    "cm_dict[dataset] = confusion_matrix(\n",
    "    confusion_matrix_analysis.accuracy_baseline.values,\n",
    "    confusion_matrix_analysis.accuracy_ours.values,\n",
    "    labels=[0, 1],\n",
    "    normalize='pred'\n",
    ")\n",
    "cm"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "d4614710",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Ours tokens: 5974679; Baseline tokens: 9576245; num_branches: 10000\n"
     ]
    }
   ],
   "source": [
    "ours_tokens_all = confusion_matrix_analysis.tokens_ours.sum()\n",
    "baseline_tokens_all = confusion_matrix_analysis.tokens_baseline.sum()\n",
    "branches = confusion_matrix_analysis.shape[0]\n",
    "\n",
    "print(f\"Ours tokens: {ours_tokens_all}; Baseline tokens: {baseline_tokens_all}; num_branches: {branches}\")"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "59a8ea9b",
   "metadata": {},
   "source": [
    "# MATH / DeepSeek-R1-Distill-Llama-8B"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "238cc08f",
   "metadata": {},
   "outputs": [],
   "source": [
    "dataset = \"math\"\n",
    "model_id = \"deepseek-ai/DeepSeek-R1-Distill-Llama-8B\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "a63e5d40",
   "metadata": {},
   "outputs": [],
   "source": [
    "selected_layer = 14\n",
    "model_dir = os.path.join(DSET_TO_DIR[dataset], MODEL_IDS[model_id])\n",
    "history = pd.read_csv(os.path.join(model_dir, \"model\", f\"L{selected_layer}_mlp\", \"history.csv\"))\n",
    "selected_epoch = history.epoch.values[np.argmax(history.val_acc.values)]\n",
    "\n",
    "interval = 80\n",
    "warmup = 0\n",
    "patience_high = 2\n",
    "threshold_val_percentile = 80"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "85d03786",
   "metadata": {},
   "outputs": [],
   "source": [
    "val_preds = load_val_predictions(model_dir, f\"L{selected_layer}_mlp\", selected_epoch)\n",
    "test_preds = load_test_predictions(model_dir, f\"L{selected_layer}_mlp\", selected_epoch)\n",
    "\n",
    "metadata = load_metadata(dataset, model_id, for_training=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "715d27a5",
   "metadata": {},
   "outputs": [],
   "source": [
    "metadata_test = metadata[metadata['train'] == 0][['unique_id', 'chain_id', 'tokens', 'correct', 'type']]\n",
    "metadata_test = metadata_test.merge(test_preds, on=['unique_id', 'chain_id', 'tokens'], how='left')\n",
    "metadata_test['pred'] = metadata_test['pred'].fillna(val_preds.pred.median())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "2fb5f4bc",
   "metadata": {},
   "outputs": [],
   "source": [
    "confusion_matrix_analysis = list()\n",
    "threshold = np.percentile(val_preds.pred.values, threshold_val_percentile)\n",
    "\n",
    "for _, chain_df in metadata_test.groupby(['unique_id', 'chain_id']):\n",
    "    chain_df_sorted = chain_df[chain_df.type == 'intermediate'].sort_values(by='tokens')\n",
    "    final_outcome = chain_df[chain_df.type == 'final'].iloc[0]['correct']\n",
    "    intermediate_outcome = chain_df_sorted.correct.values\n",
    "    token_steps = chain_df_sorted.tokens.values\n",
    "    token_final = chain_df[chain_df.type == 'final'].iloc[0]['tokens']\n",
    "    preds = chain_df_sorted.pred.values >= threshold\n",
    "\n",
    "    ours_outcome = None\n",
    "    ours_tokens = None\n",
    "    for idx in range(warmup, len(preds)):\n",
    "        consecutive_sum = np.sum(preds[idx+1-patience_high:idx+1])\n",
    "        if consecutive_sum >= patience_high:\n",
    "            if ours_outcome is None:\n",
    "                ours_outcome = intermediate_outcome[idx]\n",
    "                ours_tokens = token_steps[idx]\n",
    "    if ours_outcome is None:\n",
    "        ours_outcome = final_outcome\n",
    "        ours_tokens = token_final\n",
    "\n",
    "    confusion_matrix_analysis.append({\n",
    "        'unique_id': chain_df_sorted.iloc[0]['unique_id'],\n",
    "        'chain_id': chain_df_sorted.iloc[0]['chain_id'],\n",
    "        'accuracy_baseline': final_outcome,\n",
    "        'accuracy_ours': ours_outcome,\n",
    "        'tokens_baseline': token_final,\n",
    "        'tokens_ours': ours_tokens\n",
    "    })\n",
    "\n",
    "confusion_matrix_analysis = pd.DataFrame(confusion_matrix_analysis)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "220c988b",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([[1446,  241],\n",
       "       [ 418, 2855]])"
      ]
     },
     "execution_count": 23,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "cm = confusion_matrix(\n",
    "    confusion_matrix_analysis.accuracy_baseline.values,\n",
    "    confusion_matrix_analysis.accuracy_ours.values,\n",
    "    labels=[0, 1]\n",
    ")\n",
    "cm_dict[dataset] = confusion_matrix(\n",
    "    confusion_matrix_analysis.accuracy_baseline.values,\n",
    "    confusion_matrix_analysis.accuracy_ours.values,\n",
    "    labels=[0, 1],\n",
    "    normalize='pred'\n",
    ")\n",
    "cm"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "id": "a4cf8274",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Ours tokens: 8151978; Baseline tokens: 12575380; num_branches: 4960\n"
     ]
    }
   ],
   "source": [
    "ours_tokens_all = confusion_matrix_analysis.tokens_ours.sum()\n",
    "baseline_tokens_all = confusion_matrix_analysis.tokens_baseline.sum()\n",
    "branches = confusion_matrix_analysis.shape[0]\n",
    "\n",
    "print(f\"Ours tokens: {ours_tokens_all}; Baseline tokens: {baseline_tokens_all}; num_branches: {branches}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "id": "63584dce",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "2"
      ]
     },
     "execution_count": 25,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "selected_epoch"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "27d9eea2",
   "metadata": {},
   "source": [
    "# Confusion matrix for early-termination vs. uninterrupted accuracies"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "id": "70db8620",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAZIAAAC8CAYAAABSUygIAAAAOnRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjEwLjUsIGh0dHBzOi8vbWF0cGxvdGxpYi5vcmcvWftoOwAAAAlwSFlzAAAPYQAAD2EBqD+naQAAVoxJREFUeJzt3XdUFNfbwPHv0hEUARERRVSKFWvsFXuMxhJbsMXeYzcxlp8lxa6JCfaSGDX2gib2qMSOBbsgIr1IX9qy7Lx/EEZXQHFB0bz3cw5H9869M8/u3dln5k5TSJIkIQiCIAg60ivqAARBEIQPm0gkgiAIQoGIRCIIgiAUiEgkgiAIQoGIRCIIgiAUiEgkgiAIQoGIRCIIgiAUiEgkgiAIQoGIRCIIgiAUiEgkgiAIQoGIRPIOqVQq1qxZw5QpU1i2bBnLli1jwYIFeHp6cujQIQDi4uL45ptvmDNnDmPHjsXNzQ1XV1eSk5NRKpX88ccf1KpVC3d3d9Rqda7LuXz5Mq6urgwYMIArV64AEBsby+zZs1m3bh3r169n2bJlcvuTJ0/SpUsXqlatypYtW4iJiSEtLY1ly5ZRpUoVvv76a+7du/duPqQPxMWLF+nduzeurq5cuHAh1zqZmZm0a9eOOnXqsH//fn7++WdcXV35/PPP85zvvn37cHV1ZcKECdy+fZvbt2/z5Zdf4urqypQpU7h06VKONr6+vkyYMAFXV1dmz57NgwcP5GlBQUGsXr2aRo0a4eXlRUZGRsHf/H/Um/bpgQMHUCqVWtO3b9/O2bNntcrGjBlDz549mTJlCl988QWurq6MGTOGSZMm0b59e8aMGYOfnx9z587F1dWVL7/8kps3bwIQEhIif288PDy4ePHiW3nvBSYJ70R8fLzUrVs3afny5ZJGo5HL1Wq19MMPP0jr16+XJEmSRo4cKR05ckSe/vjxY6lhw4aSUqmUywYNGiS5urpK+/fvz3VZ48ePl1xcXKRdu3bJZZMmTZL27dsnv165cqW0YcMG+fWKFSukpk2byq81Go00ffp0ycvLS/c3/R/3xx9/SG5ubtLAgQNznX7kyBHJzc1N6tu3r1zWrl07ycXFRbp69WqO+hqNRurZs6fk4uIi/fPPP3K5t7e35OLiIvn7++cZy/nz5/Oso1KppMmTJ7/JW/t/S5c+zabRaKQOHTpIQ4YM0Spft26dvM5funRJcnFxkQIDAyVJkqT09HTp559/liRJkp4+fSq5uLhI3t7eWu0zMzMlFxcXaefOnQV+f2+L2CN5R2bNmoVarWbixIkoFAq5XF9fn6lTp2JlZQXApUuXMDc3l6dXqlSJQYMGac2rTJkytGzZkvXr1yO9dM/Nhw8fUrp0aXne2R49ekRycrL82sTEhMTERK049PSyvg6SJLFw4ULc3d3p3LlzQd/6f5aBgQE9e/bk0qVL3Lp1K8f0gwcP0rJlSwwMDOSyOnXq4OLiwpo1a3LUP3PmDLVq1QK0+y67/YvzeZmhoWGedQwNDeXpwqvp0qfZzp49S6lSpfjnn394/PixXN69e3etdf5FRkZG9O7dG0Be/16um12e/e/76P2N7D/Ez8+P48eP07Nnz1y/UPr6+vTo0QOAunXrMnnyZHbv3o1GowGgc+fOGBkZabUZMWIE/v7+nDp1Sqt8y5YtORIPQNeuXVm5ciU3btxAqVRy//59Bg8enKNeRkYGM2fOpFGjRnTo0EHXt/z/Rrt27XB0dGTt2rVa5RcuXKBevXo5+k2hUDBs2DDOnz/P/fv3tabt3r2bXr16vfWYhVd70z7NtnfvXlavXk2pUqX47bff5PJSpUq9cnmvm/4hEInkHcg+TlGhQgWtcpVKxb59+5g6dSpff/01ly9fZunSpdSoUYNZs2bRpUsXjh8/joODQ44tynr16lG3bl2tL3toaCh6enrY2dnliGH48OH06tWLAQMGMGnSJL799lssLS216mRkZDB69GjMzMxo165dYb39/zQ9PT2GDRvG6dOn8fPzk8t37txJv379cm3TuXNn7O3ttfru+vXrVKtWDVNT07ces/BquvTpw4cPKVeuHCVLlqRv374cPHhQa4//TezYsYNvv/1W6+99JxLJO5A9pPTygU4jIyN69OjBw4cPUSqVNGzYECsrK7Zs2cLKlStRqVSMHz+ekSNHolKpcsx3xIgR+Pr6ygfgtmzZwhdffJFrDGq1Gmtra9auXcv9+/eZMmVKjoP1BgYGlClTht9//529e/cWxlv/f+HTTz/FxsaGdevWAXDv3j0cHBwoXrx4rvUNDAwYMmQIx44dIzAwEIDff/8dDw8PnWPIa+gkv9MFbW/ap9u2baN///4A9O3bl4yMDPbs2aPTsvv168c333yj9fe+E4nkHXB1dQXg7t27uU43NzfHzMwMgKdPnwLQqVMnjh49yqhRo/j7779ZtWpVjnatWrXCxcWFtWvXEhcXR2xsLE5OTrku49tvv8XR0ZGmTZuyfft27ty5w+bNm7XqKBQKFixYIH+Rd+/erfN7/v/EyMiIwYMHc/ToUUJCQti6dSsDBw58ZZvPPvuMkiVLsn79eh4/foy1tbV8nEwX2XusqampOaYlJyeLPZ039CZ9GhMTw+3bt9mxYwdLly5ly5YtODo6sm3bNnl4+r9OJJJ3oFmzZjg5ObF//36tA9652b9/v/x/Q0NDJk2aRP369QkICMhRN3u8/eLFi8ycOfOVW7QHDx6kYsWKADg4ODB58mR8fHxyneecOXMYNGgQs2fP5o8//sjv2/x/rU+fPpiZmbFw4UJMTU3lEx7yYmJiwoABAzh48CBLlizJ9bhWfly9ehXIOgEDsoY3X/bkyRMcHBx0mv//Z/nt0+3btzN//nymTp0q/3333XeEhoZy+vTpdxx10RCJ5B3Q19fnxx9/BGDatGk5thpfPPPq8OHDWj/w6enpxMTEaB2zSE9Pl/+fPd6emJhI3bp1gaxz3V/8F6BGjRrcuXNHfq1QKKhdu7b8Wq1Wa209ff3113zxxRfMnTuXDRs26PS+/+syMzPlz9jc3Jx+/fpx9uxZrZMYMjMztYYQX+w7Dw8PjIyMKFGiBPb29gBy3Rf7Lvv/Lw9FBgQEcP36dQDs7Oxwd3dny5YtWhsr8fHxrFmzRpx9l09v2qfJycncuXMHNzc3rfm4ublRvXr1HOtOXn35qmnZw9ovfifeN3mfTygUqsqVK3Po0CE2b97M6NGjcXZ2xszMjGfPnlGrVi35IF5aWhoDBgygcePG2NvbExERwaBBg+jRowdKpZJTp05x/vx5du7cSbt27bC2tmbIkCGUK1cOyLqA6cCBAwB4eXnh6OjIRx99xNKlS1m+fDlxcXGYmZkRFxfHsGHDgKwLEk+dOkVMTAybNm2ia9eulCpVCjs7OyRJYsmSJVy8eJHPPvuMTp06Fcnn9765evUqXl5eWFlZUaJECWrUqMGgQYOIiIjA0dGRjIwMTp48ybVr10hOTmb//v0olUrOnz/PoUOHcHd3x8LCgr59+9KtWzcA/P39+f3334GsM7hKlCiBRqNh586dAEyfPh1HR0cAEhMTuXLlChs3bpRjWr58OStWrGDo0KHY29vLp4tOmjQJGxubd/fhfKDetE89PT25dOkS0dHRXLx4kcaNG8vz8vX1JS0tjbt377JgwQKGDx/Os2fP5OHibdu24eHhIQ9F+/v7s337diBrD6d48eLUqVOHkJAQ+ViLl5cXFSpU0FrO+0IhvXwhgiAIgiC8ATG0JQiCIBSISCSCIAhCgYhEIgiCIBTIe5VITp48WdQhCIIgCG+oSM7aOn/+PJ6enkRHR8unnEqSRHR0NLdv3y6KkARBEAQdFUkimTZtGh07dqR79+5ad9E8d+5cUYQjCIIgFECRJJKyZcvyv//9L0d5o0aN3n0w/9JoNKSlpWFiYvJe365ZeD3Rl/8Noh8/HEVyHcn169eJjY2lbdu2WuXHjh0rsluXp6SkcP/+fYbMP8SjoJhCn79CAdUrleZuQBRv6xOPu7r67cyYrKHH1JRkTIuZvbUbAJoU0maN3Jcr/uFRqG53YH0VhQKqO5TkblD82+vLE7PeynzfRT9C4fRldj+O3h6If3T66xu8IQVQ1c6E++FpvK0fwbBNeT8Ns6Dep3WySPZI5s+fT3h4ON9//71cJkkSz549+88+A0NPocDQQA89hYLMD/QaUHHtapYPvS9FP2ZRKMBAT4FCwVvbIHjb3pe+LJJE0qhRI0qXLk3JkiXlTKpWqzlz5kxRhCMIgiAUQJEkkv79+1O2bNkc454tWrQoinAEQRCEAiiSRFKuXDm8vb3ZunUr4eHhODs7M3ToUGrUqFEU4QiCIAgFUCSnQhw6dIiRI0cCWcNc1tbWzJs3j7NnzxZFOIIgCEIBFMkeye7duzl8+DCVKlWSyyRJYtGiRbRs2bIoQhIEQRB0VCR7JHXr1tVKIpD1oCXxXGlBEIQPT5EkEqVSSUZGhlbZ33//zY0bN4oiHEEQBKEAimRoq1OnTnTu3JkqVaqgVqt59OgRkZGR/Pzzz0URjiAIglAARbJHUr9+fTZs2EDZsmXJyMigefPmHDhwQJz+KwiC8AEqsme2Ozg48NVXX2mVRUZGYmtrW0QRCYIgCLp4J4nk2LFj1K5dW04SBw4cyFFHkiTOnDnDjz/++C5CEgRBEArJO0kka9asYeTIkXTs2BGAnTt34u/vT4kSJbTqRUVFvYtwBEEQhEL0ThLJ/v37tV7369ePdu3aUaxYMa1y8YREQRCED0+RHGyvVq1ajiTy+PFj6tevXxThCIIgCAVQJInk6NGjOcoqVarElClTiiAaQRAEoSDe6Vlbv/zyC5cuXSIkJAQfHx+taQkJCcTHx7/LcARBEIRC8E4TyZgxY8jMzESj0dCgQQOtaUZGRrRp0+ZdhqMTQwN95ozrSmqairKlLVm26S+ehDzLUa+yQ2kmf9GeoLBYnBxK88v2U6DJuppfX1+POWO6kKmRMDM1JjgiltXbTuWYR6cWNXG0L0Vg6DMu3nxMfGJKgWJXZaiZv/oQpiZGhEXFMWVIRyqVt8lXvYrlSsnTD52+wT/X/dFoJGpXKY9H18byNLU6k91/XWX55uNc3TunQPG+TYYGeswZ6k5qWgZlbUqwbLs3T8LictQ7tmowDaqV0yr7cdcFDpy+ib6egjlDWv/bj0YERyawes8lud6wrvWY2KcppiYGHDr3gJlrjpOari6U+PPblwD/+PixeMOfTB/WiSZ1nXJMV6aks2WfN5YliuFoX4qm9Zy1pqemqXAftIQl03vRrJ5LocRfmAz19fj6s1qkqjIpa2nKKq+7BEYpc9Q7NLM99Z1KaZXtOv+IyVuu0b+lE4sHaf8mRSekUmuS9vHdDrXtcbAx52m0kit+0cQnqwocv67r5eQvOlDGyhSAzfu8mfz9Tq36NlbFeXQs6+GBf52/zcWbj7G3tcQvMJLBPZpS3cm+wLFne+fXkYwfP54mTZpQr149rfLExMQcZ3G9j76b3JOHTyLYsPsc5ctY8sfK0bQasBhVxvMfCAN9PXYsH8nA6et5EBCBvW1JTm2Zxpg5mwCY8kUHFAoF838+CMCulaNJSk5j6/5/5HksnNiDp6HP8NxReA/7mrl8L64VyzC8d0uCwmPpM9GTv3+bjrGR4Wvrnfl1GgBXbz9h9bZTHNs4BYVCQY9xq3Eoa03z+lk/MEHhsaSp1PgHvd9n4H03uj0Pn0az4ZAP5Utb8MfCPrQauxFVRqZcp0qFUlx/GMacdSdJ/7f8m8Gt8PJ+CMDkfs2y+nHTaQB2fduXpJR0th69QRM3ByrZW9Hrmx3UcrZj6fiOpKoymOl5olDiz29fxiUkIyFx2TcAKZcHyoZHxzN67m8s/7pvnono+3VHCY3MmWTfF/P61eVRWAJbTvthb12M375sRcf5f6FSa+Q6LmUtuPkkhgW7rpP+b/lX3d34514YAG6OVnisOENMUtYjfetWssbVvqTWcub2qUtQtJL1Jx4WavwFWS+PeI6hmBncuh/ErpWjKWVpDsC1O4HcDwgHICZeyUJPL87//hUKhYKgsBh6T/Tk0q7Ce5xzkRwjeTmJAKSmprJo0SKd5xkTE8PChQtZv349S5YsQa0unC2/F1mXNGdw96YcPJV1T7DgiDjSVWo+bVNbq16Tuk442pfiQUAEAKGR8TwJfUanVln1BnZrwh2/ULn+4TM3GefxfG9szOfumJsZs373uUKL/VlcElv2/8OnbeoA4GBnhbGRAQdP3cxXvUOns+qt3HqCzq1qyTfY7Ni8Bss3H5PbVypvQ+sGVQot7rfB2qIYgzvX5eC5BwAERyWQnpHJp82ratVLTs3g61+Oc/luCDcfhXPbPwKbksW4/jDrx6d/p9rcCYiU6x/2fsC4Xo0AMDY0YKbnCe4HRrPzhC8bD12jVZ2KhRJ/fvsSwNLCjGb1XChlWTzHNLU6k36T1/LVyI/zTCJeZ27h5lqOkiWK5Tq9qFkVN6Z/Sye8rgUDEBqTgkqtoXN9B616yekZzNnhw1X/Z/gGxnI3KA7rEiY8DInDUF+PpQd8OXM7HN/AWHwDY6lcpgReV4Pk9iPaV8HcxIDNpx8VavwFXS+PnL2NKkPNVyM7065pdepUq0CdahXwD4qi2791g8JieBabRIY6a2PIxNiQRGVqob6PIkkk27Zto379+lStWlX+a9WqFYcOHdJ5nhMnTqRHjx4MHz6csmXL4unpWYgRZ2nxkQvpGWqiY5PkMr+nkfLWeDbzYiYYGuhT2vr5yhsSHotTBdt/pxtTtnRJeVpweBxOFUpjamyIlYUZX434mNDIONbMG8juVaOpXVV7pdDFuauPMDY0oLT1870+5wq2nL/2KF/1zl19hEaj4eyVh1Qoa/18mqMtF28+lr+kAHp67/ddnFvUdiRdpSY6Plku8wuOoXltR616wVEJ2u3qVOT8rafya3NTI8qWev45BUcm4FTOGlNjA874BGi1fRoRn2N+uspvX74otz7ZeuACqWkqLlz3p9uYn5i2eBfJqeny9JCIOK7cfsJnHd7fsymbVbFFpdbwLDFNLvMPT6RZVe07ZITGaA8LN6tqy4UHWRsBGZkaohLStKY3cLbh4sOsvWorc2OmdqtJWGwKPw5rzLZJrXBztCqU+Au6Xv5zIwAjQwPKlLKQyyVJ4tLNxzStmzVEWdOlHBbFTZn47Q7U6kx+O3SRpTP6FEr82Yokkfz111/Mnz+fwYMH4+npyZYtWxg9ejTLli3TaX4PHjwgICCAatWqAdCkSRO2bduGRqN5Tcs3Y29rSVxCslaZMjmdsqUttcqu+AaQkJTCxEHtgazE4VTBlnRV1l7SiX/uMah7UyyKZ41v1qnmgFqdSYY6k09a1yJRmcr2w5cYNfdX/J5GceDncVhamBUo9tDIuBzzMDczJiwqLp/14olPSiUlTYXVC9PNi5mQrlITE59zTPp9ZW9Tgrgk7S0yZWo6ZW1ybrW/qGvzKhw8d19+ffKqP4M618HC3ASAOi52qDM1ZKhzfu8aVi+P574rhRB9/vvydXb9eZWGtSoxYUBbNn8/hBP/3JXH2TMzNSzfcoyvRnxcKDG/LWWtihGnTNcqU6ZlYGf56j2ozvUdOHItKNdp9SuX4kZADBopayiwY91yJKao+MM7gAkbLvI4IpE/prpjaWZU4PgLtF4WMyYiOufGyRXfJ9StXgF9/ayfdwMDfXavGsPV209o0f8HKtqX4uOWbgWO/UX5SiTXr18v1IU2a9aMjz/+mKFDhxIZGUnDhg0ZPXo0Gzdu1Gl+N27cwMbm+a55mTJliI+PJygo9y/Kq+jpgb6eItc/PQWkpWdolRkZ6ZOZmalVFpeQTO+Jnjg5lGb9gkF4dGlE1cplCQ57hr6egmmL/+DEP3fZ/P0Qvhr+MS3qu/Ak5BmSJFHdqSz+T6OIiE5AX0/Bqq3HMS9mwiet3PKMK/tPkqS8/wBTY0OtMlVGJgb6+vmqZ2iQVQ/A2Oj5dNW/ydFAX0+rDfDqeF76exv08upHPUhLV2v3o6EBmZmaPD9bQwM9ajvbceNhmPxdmLH6GCeu+LN5Vg++GtCCFnUceRIWiyRJWm1dK5QiTaXm/M3A1/ZhofZljv7Q7pN7j8NoWtcZfX09SpYoxtBezdl73AdVhprV204x7LMW8nJya/+u+lJPkfefQgFpGZlaZUaGeqgzNXm2MdBTULOCJTefxOQ6/ZOPHPC6FiS/rlauJI8jkoiIT0FPAauP3MXcxICOdcu9MjY9RT4+r/z2Za711BgY6OWY58FTN+jWpo5WWUJSCmM83HFvVJVJ3+/k4g3/Qu3LfB1sDw0N5fDhw5iZmdG6detcj3G8icePH7NmzRp69epFYGAge/bsITY2VueElZCQgIXF8107Q8Osg1TJycl5NcmTc3lrTI0Nc52mr5CwLmmOm/Pz3eZytiVJVKZqlQFkpKfyvWfWGR/N67uir6fgUUAwNZ1s0UgSOw6d/zdWfYb3acGePy/j5myLrbU5FsVNtOYXm6CkWiXbHMt4WUpy3nsFNhamxCUma9WJT1BiY2mmVZZ3vWIUM9bDxNiQyOgYUpKzEvez2DhMjA0x1tfIbVJTU14bz8vMzF+9N6AL57LFMTXSz1GujwZrC1PcKj7fkyxnY06iMk2r7EV1XO159DQSt4qW6CkUVLIzBxTs+PMqkHU23/Bu9dlz8pbWPIwM9RnVswmeey7kOe/cFEZfvkjSaEhLSyUlWUlaWtbemFqdSUpKitzGubw1mZkaIqOe8f26I6z69fmJAQnKVDymrqVn+7osnND1lbEXdl9WtjHGxDD3bV59SY21uTE1yprKZfaWJiSlqLTKXlSrYin8Q2OpUdaUiqWMAdC88JvZqpotB7zvy+1tihtiYaqvNb/YpHSq2JnluYxsr1sHCrReJiop9W+9Fx8KeOH6I74a2lauG5+UyvBZWzi2YTwG+voY6EkMnLGBi9unYWry6r0q05L568t8JZIuXbrQpUsXkpOTOX36tFZS0eVq9HHjxrF8+XJiY2MZPXo048eP586dO4wYMeKN5wVgaWlJevrz3dvU1KwV5cXkkl9+wTH4BcXmOi00OpnpI7oQGp0sD+XYWFnw64GL+PpF5trGQF+PH+d+wYotx7l+L4Tb/pFkvvCtHd+/DdGxSSz45Qip6RmcverHjNrOWvNLScvgzBW/PJeRrZiZeZ7T2jaryaRFu0lRSfKB1yehMfTs8JFWu7zrdcDExJTWDavwNCJBbhMUmUizes6YF38+dmtqmv7aeN4Fv7Ak/EITc5SHxt5l+iB3QmPTiUnISno2lsX59c9b+D7JfXiof+eGbPS6ge+TOPT1FIDE7cB4uS/H92pEdFwyC7ack0/x1dNT8NXAlkxbfSLHUNrrFEZfvkihp4eJiak8vZiZOTVdyhH0Ql+am5tR2qo45cracu2lU7c7DF3Owok9aNXAlWJm7/bA++PodPyj03OdFpYYzOQe9QhL1BD77xCXjYUZv597wp2w3D/zfu62bP07QJ5+JyxVTiS1K1pz2f8ZvqHP23o/iKaBq53W/FJVmZy7/yzPZWR73TpQsPUylvEeLSlmZi4nEp+7gdSp5kjxF86APXHJj+LmppQokfV7OGdcdw6evk1wlLJQjr/CGx4jMTMzo0uXLvzvf/9jzJgxhIWFMXfuXBYvXsy1a9fyPZ8KFSqwatUqnJ2dKVGiBFu3bsXHx4du3bq9afwAuLm5ER4eLr8ODQ3FxsYGe/s3P09ao4FMjZTrX1RsEnuP+9C2aXUyNRL2ZaxQ6Ck4ePomdapVYESfVjnafDu5Jz53A1my8U80kva0hrUq0atTA/pNXosyVUWmRmLXn1dRZ2poWKsSmRoJO5usPZ4TF+7lGVf2X/bjinP7s7EqQc/29TjufVc+BVDSSHR1r821O4F47jjzynpdWtdGoVAw5vPWHDt/R57vqQv3mTiovdayXvSqmPJqU1g0efVjXDJ7z9ylbQOnrH4sbYFCoeDgufvUcS3LiG4fadXXSBK1nMtw5V7oC2XPvycNq5enV5ua9JuzC2VqBpmarKGIecPbcOySH6YmhpQrbUGnJi40quHw2n4srL588S97mOLFsi8HtsXrzC3UmRoUCgWXbgUwxsMdhUJBuTJWWn/6+nrYWJljaWH2zvtSI+X99ywpnYOXA2lTyx6NBPbWZigUcMQnmNoVrRna1lWrvgS4VbDm2uOYXOf3cb3yHL4apFW299JTMjUSHznboJHAzrIYSakZnL4T/srYNNLrv/8FWS81GomPW9TQmt+h07fo1rauVllNl3I8DYshOVUl9491STOcKtgWWl/qfB2JmZkZXbt2pWvXriiVSk6fPs3cuXOZN2/ea9tKksSlS5eIiorSGk/X9TbyVatWxc7OjkePHuHi4sK1a9f4/PPP38qXesaSXSz4sgd2pSwoV8aSvpPWkJmpoV4NRz7rWB/PHWcwMzWibZPq1KpSHm8fPw6cvPHvVmyWpnWdqeFij5WFGZ2Gr9A6FS85VUWvL39h+rBO1HApR6VyNgyYvr5Qxp4XTevN7FX7CH+WQEhEHDtXjMLAQB+fO4Hs+esaYz53f2U9VXpW7D071Gf2yn1IEnzepRFNX7jILSwqnu1elwHYsPscvT9ugIX5q3f/i8KM1X+xYGRb7KzNKWdjQd/Zf5CpkahXpSyfudfQOjDeuIYDl+4E55hHUzcHqlYsjVWJYnSatJXE5OdbzRtmdqd7y2qM7tFQLotPSsW1z8pCiT+/fZmapsLr71tExSSx74QP5cpYUrpk1skBnVvVIjw6gelLduHkUBqVSs3kwe0LJb536ZvffZjTuw62JU2xtyrGwFVnydRI1KlUiu6NHLWu+2jgbMMVv+g859XQpTTf7bmlVZaSrsZjxRkmd61JDQdLHEsXZ+jP5yisw0E6r5fLR2Kgrz10e/GGP3PHag89VnYozcqZ/fhm+V7qVq9AdFwS307qSXEzk8J5A4BC0uEXas6cOcydOxd9/Zzjz/kxcuRIvL29KVWqlNY8YmNjuXnzpk7zDAkJYc2aNTg7OxMfH8+4cePeKL6UlBTu37/PkPmHeBQUo1MMr6Kvp8DN2RZfP+2hrcIUd3X1W5kvZCX6lGSl1m50YTMppMtj5b5c8Q+PchnaKih9PQVuFS3xfRL39vryROFdLPaid9GPUDh9md2Po7cH5jm0VRB6CqhR1lRraKuwhW36/O3MmPdrndSpu5OTk/nhhx+wsLCga9euODi82TjbzZs3OX36dI6nIRbkNvLlypVj4cKFOrcXBEEQdKNTIvn2228xMTEhISEBLy8vgoKCqFGjBh06dMDI6PXnVnfp0gUDg5yLrlq1ai61BUEQhPeZTokkNTUVExMTTExMMDMz4/bt2/z222+cPn2aFStWvLa9i4sLCxYsoFWrVnKZeNSuIAjCh0mnRPL9999jbm6Ol5cXxYoVo3v37ixZsiTfZ0nt27ePx48f4+vrK5dpNBqePct5F11BEATh/aZTIvHy8qJFixY0atSIFi1a0K1bt1yHqvIycOBA2rVrJ184mO3EicK5M6ogCILw7uiUSObPn89nn30GZN3nasWKFZQuXZqePXtibv76i9A+/jj3+/e4uLx/zzoQBEEQXk2nRJJ94aBSqeT27dvcuHEDX19f7t69y+LFi3PU37JlC82bN6dy5cpA1pMSc7uh4oULF9i+fbsuIQmCIAhFRKdEMm1a1kOOTp8+jb29Pd27d+fHH3+kVKlSuda/cuUKTk5OciLx8fEhIiICKyvtWzEHBATk1lwQBEF4j+mUSE6ePEmXLl3YtGlTvm7g+Msvv2i9HjBgAE2aNMlxqvDVq1d1CUcQBEEoQjqftfXJJ5/ovNAXT/t9kbW1da7lgiAIwvtLp0RSkCQCWbc+OHLkCNHR0VrHSsQxEkEQhA9PId3d6M0MHz6cp0+f4ujoqHWPmMDAwKIIRxAEQSiAIkkkAQEBnDp1imLFtJ9rcO7cuaIIRxAEQSgAnZ7ZnphYsDuqtm/fHpVKlaO8UqVKBZqvIAiC8O7pfPrvzJkzqVChgk4LnTZtGsuXL8fN7fkD6MW9tgRBED5MOiUSJycn9u7dS0REBO3bt6dNmzZvdD/8qVOn4u3tzenTp9HTe75TJO61JQiC8OEp0AWJGRkZHD9+nKlTp+Ls7Mxnn32W50WJL7px4wZ//vkn5cuX1yo/evSoLuEIgiAIRahAB9sNDQ0xNDQkICCAv//+mydPnmBiYkLfvn1f+WyRDh065HrNSMOGDXOpLQiCILzPdEokmzZtwsrKio0bNxIVFcWAAQMYOHAgJUqUICUlhYULF9KkSZM8rzdp06YN69evp0mTJnKZJEn8+eefzJ07V7d3IgiCIBQJnZ7ZXqVKFaytrRk0aBAeHh6YmZlpTT9w4ABLly7F29s71/ZdunTBz88vZzAKBffv33/TcApF9vOhKzlXxfSl05ILw7t4vrLlR+Peynzh3TxzPvVG4TxzPrsvyzg4YWTydvoyPTUZY1Ozt9aXDi0mvZX5vot+hMLpy+x+NLKugJ6hSSFEpU2SJDSqVPSMTN9aP9b/5Ku3Ml94v9ZJnfZI2rZty6JFi3IkkGzm5uavHKbq06cPbdu2pUyZMnKZJEns2LFDl3AEQRCEIqRTIvnuu++0kohKpdK6AWPbtm1p27Ztnu3v3btHhQoVtBKJQqGgX79+uoQjCIIgFCGdLki8e/cunTp1Ijo6GoA7d+6wYsUKUlNT89X+8uXLOW4hDxAXF6dLOIIgCEIR0imRrFy5kpYtW2JhYQFA3bp1qVGjBvPnz89X+1mzZnHp0iVCQ0MJCwsjLCyM4OBgVq8unDFyQRAE4d3RaWirUaNGTJqkfTDQ0tKSkydP8v3337+2/bfffktISAhLly6VyyRJQqFQMGfOHF1CEgRBEIqITolEpVKRmpqKqakpkPXI3Z9++gk7O7t8te/Vqxf169fH1tZWPltCkiT27NmjSziCIAhCEdIpkfTo0YOePXvi5OSESqXi2rVrZGRksGbNmny19/DwwNjYmKSkJKysrFAqlZibmzNs2DBdwhEEQRCKkE7HSJydndm2bRu1a9fGzs6OESNGcPToURo3bpyv9sHBwXTs2JEZM2YAEBoayoIFC3K9I7AgCILwftP5FilWVlYMGTJEfh0UFMTly5fzdZuTuXPn0qpVK/mUYVdXV5o0acLs2bP5+eefdQ1JEARBKAI6JZLHjx/zxx9/oFQqyb4wPj09HR8fH86ePfva9s7OzsyePZutW7c+D8TAgMuXL+sSjiAIglCEdBramjFjBk+ePOHRo0dyWXBwMAMHDsxX++y7/mYfaNdoNGzevBkHBwddwhEEQRCKkE57JE2aNGHy5MncunWL9PR0GjRoQHh4ODt37sx3+zlz5pCUlERycjJeXl6EhISwbt06XcIRBEEQipBOeyTx8fFERkZSq1Ytjh07RmpqKhqNJt+n77q5uTFu3DiqV69OVFQUXbp0wcvLS9xGXhAE4QOk0x5JnTp1cHd3Z8OGDXTu3JmWLVuSnp5OtWrV8tX+zJkztG7dWut030ePHuHr66v1+F1BEATh/adTImnVqhWXL1/G3NwcgD179vDw4UOt54u8iq+vL61bt9YqK126NP3798fLy0uXkARBEIQiolMi6dmzJ6NGjaJ3794AODg45OtA+S+//IKnpydqtTrXixdr1aqlSziCIAhCEdIpkbi5ueW693Hr1q1XJoMxY8ZQs2ZNjhw5Qo8ePbSmGRkZUaVKFV3CEQRBEIqQTomkUqVKTJ8+XSuZaDQaTpw4weHDh1/Ztnnz5ri4uGBra6vLooucKkPN/NWHMDUxIiwqjilDOlKpvM1r603+ogNlrEzl6YdO3+Cf6/5oNBK1q5THo2vOuwKkpqlwH7SEJdN70ayeS4FjNzTQZ864rqSmqShb2pJlm/7iScizHPUqO5Rm8hftCQqLxcmhND9tO8ldv1AA9PX1mDP2EzI1EmamxgRHxLJ62ym5bbsm1fikdW3Co+NxsLNm9qr9xMQrCxx7YVNlqFm09gimJoaERycwfkBbHMvl7MdLN/2Zs3IfweGx1KvhyHdTelHe7vkjEI7+fYtLtx4jaSRqupaj98fPTxg5eeEuV24FULZ0SR4HReHRtTFVKpctlPjz25dOFUoz7LMWPA6KolwZS67fe0pQSAQABvp6LJnemx7t6xGfmMLsVfs5dPpmjnl0alETR/tSBIY+4+LNx8QnphTKeygsGRlqVm/9CxNjI6JiEhjSuzXly5bKUc/ndgBL1h4iLDIWtyoV+GpMN+z+XScTlSl8//MBLvg8xMrCnFH929OhZc6N4rT0DAZOWs30UV2p71a5UOLXdb38Zfsp0GQAYFHclOVf96Vt42pExybx3Zoj7DvhI7cd1qsFEwe1w9TYiEOnbzBz+V5S0zMKJX7QMZHcunWLhISEHBcQPnuW883n5kNNIgAzl+/FtWIZhvduSVB4LH0mevL3b9MxNjJ8bb0jnmMoZgZXbz9h9bZTHNs4BYVCQY9xq3Eoa03z+trJ4vt1RwmNLLxntHw3uScPn0SwYfc5ypex5I+Vo2k1YDGqDLVcx0Bfjx3LRzJw+noeBERgb1uSk1um0XrAIgAmD+6AQqFg/s8HAdi1cjRJyWls3f8PlcrbsGR6bz76bAEZ6ky6ta3D70uH03HYikJ7D4Vl/k8HcHYsw6AezQiJiGXwjPUcWT8FY6Pnq0R8Ugpb93uzeHofklNVfL10FyNmbeLPjVMBuH43kHV/nGH/L1+iUCjwmOxJuTJWNKnrTGy8kiXrj/LXpqkoFAqCw2MZNH0dp38rnEev5qcvAdbOH8SAaesJi4pHoVBwZfcsZi7dCUTi0bUxWw9cYM6PB/h+ymesmTeQkxfukZL2/FZFCyf24GnoMzx3nCmUuN+G5Ru8qFjelt6fNCY8Ko4v/7eFbavGY2T4vC8TlSnsPnKRWeN7kpqWzner9zPtu21sWzocgI07T+PepAZDerdm+0FvZi/biYO9NVWdymkta+3vJ4h8Fl+o8eu6Xp7aMo0xczYBMHVoRw6fvsnyTccY/bk76xYM4nFwFLceBNOkrhOVytvQ68tfqFXFgaUzepOansHM5XsL7T3odPqvh4cHe/fu5bffftP6e/G28O+aSqVi9+7ddOjQ4a0t41lcElv2/8OnbeoA4GBnhbGRAQdP3cxXvSNnbwOwYstxOreqJV+Q2bF5DZZvPqY1D68zt3BzLUfJEoXzzHHrkuYM7t6Ug6duABAcEUe6Ss2nbWpr1WtS1wlH+1I8CMjaag2NjCcw5BkeXbL2mPp/2pg7/+6dABw+c5NxHm0A6Nu5AU9Cn5GhzgTg6Nnb1KvuSAO3ioXyHgpLTLyS3w9f5ONWWVuc5cpYYWRowNG/b2nVexIczeLpfaldrQJN6znzvwnduecfRuy/e1i//H6KDs1ryv3Ytml1Vm87CUBwRCzP4pLkz8LE2JCk5LRCiT+/fQng4liGksWzvkOSJKHRSHKy/OPoFW7eDyIpOY3V206iztSgkZ4/+3vM5+6Ymxmzfve5Qon7bYhLULLvzyu0aVoDALvSlhgZGnDK+7ZWvaDQZ8ya0JMaruX5qJYTU0Z0we9JuLx31bieK+2au+Fc0Y5vxvfAumRxrvkGaM3jzIU7uFYuSwlzUwpLQdbLJ6HP6NQqq96pC/c5cPIGd/3D+PLb7UTGJMobpsaGBsxcvpf7j8PZeeQyG3efo1UD10J7D6BjInF3d8fExESrLC0tjcjIyEIJShfJycmULl2awMDAt7aMc1cfYWxoQGnrEnKZcwVbzl97lK96/9wIQKPRcPbKQyqUtX4+zdGWizcfyz86IRFxXLn9hM861C+02Ft85EJ6hpro2CS5zO9pZI69IPNiJhga6FPaurhcFhwRSw0X+3+nG1O2dMnn08LjcKpQGlNjQ8yLmWhNU2WoiYpNoqaL9lZdUfvHxw8jQwNsrJ6/RyeH0ly47qdVr061ChQ3e/49L29nTQlzE4qbm6LRaPD28aO83fN+rOxgy1XfADLUmVR3ssfC3JSvluxCrc7kjyOX+HbyZ4USf377EmDfcR9++d8ArEua07y+C0fO+sp7uWkvDG3UcC7H9CW75TIrCzO+GvExoZFxrJk3kN2rRlO76vt354mrtx5jaKiPteXzvnQsZ8NV38da9Wq4OmBe7Hlf2pexwtzMBPNixgA0quMsTzPQ16d0KQvsXvguR0TH4/sgiI4taxdq/AVZL0PCY3GqkDW68/eVB3J5ZqaGsKh4gsNjAThz+YHWvJ6GxcjTCotOiaRNmzY5/lq0aJHvK9tv3br1+kpvyNLSkkqVKhX6fF8UGhmHpYWZVpm5mTFhUXGvr1fMmIjoBOISU0hJU2H1wnTzYiakq9TExCvJzNSwfMsxvhrxcaHGbm9rSVxCslaZMjmdsqUttcqu+AaQkJTCxEHt5bidHGzlH5iTF+4xqHtTLIpnbZXVqeaAWp1JhjqTkxfu4eJYho9bZl0LVN7OCuuSZoU6FlsYwqPisXxpT8+smDHh0fGvbHf1dgCDujfH0ECf+KRUUtNUWJZ4sR+NSVepiY1XYmCgz9YlI7l+N5BOQ5fhULYU7ZvVKJT489uXANOX7CI0Mo5TW6bStnFVvvXUPoZpZWHGpMHtWTCxO4YGz38OPmldi0RlKtsPX2LU3F/xexrFgZ/H5fheF7XIZwlYvNSXxUyNiXqW8Mp2N+8G0rtzYwwM9HNMU6akkZauokXDrOviMjM1bN51hpGfty28wP9VoPWygi3pKu2hTIDiZiYUMzHiz3O3c0wDaFirEp47/i6cN/AvnY6RVK9ePcd1IOfPn8/3beTHjh1Lr1696NOnD2XKlNElhFxlDzEUhCRJ8o0oc0wDTI0NtaarMjIx0NfXKsu9nhoDAz25zNjo+XTVv18GA309Vm87xbDPWmi1lyTyjOlF+np5v389RdYW6It1jIz0yczM1CqLS0im90RPpg7pyPoFg7h2J5BqTnYc+fsmegoFM5bsYsaIzmz+fghXbj2hYa1KPAl5hiRJnL3ygLHzfmN0v1a0bliFhKQUjI0M8X8a+crYADI1r39/byqvz01CwiS3fjTQz/NzTlepOX3xHqtmeWh9R4yNDJ73Y8bzfpQkiURlCsN7tyIgJJqZy3ZRplQJPnLL38ZOYfQlgJmpETfvB3Ho1A2Wz+xHVEwil64/kOspU9I48c8dHO2t+XGWB4+eRHDtTiDVncri/zSKiOgE9PUUrNp6nBG9W/JJKze2H770ytgLuy9fuU5Kkta6BJChVst9kBtVhhrvqw+YP6U3kpSZo972A+eZPPwTDP/9Pmzbf45enRtj/NJ3pqDrJBRsvaxauSzXfP1zLGPs5+58s2Jvrt8HpwpZG4Xnrz18bWxvQqdEMmPGDOzt7bXKGjRowMaNG/PVfv369RgbG7N161bi4+P55JNPaNq0qS6hFLq0tBQkSZPrNBsLU+ISk0lJfn4WUnyCEhtLM62yXOslKillaYapYdZ4eWR0DCnJWWcJPYuNw8TYEGN9Dd+vO8KqX0/I7RKUqXhMXUvP9nVZOKHrK2N3c877JAZ9hYR1SXOtOuVsS5KoTM3RLiM9le899wPQvL4r+np63HkQSKVyWVtJOw6dB8DQUJ/hfVqw58/L8jzu+z1lzoqnAIwb0J6noc/ISM+5jJfdeBjxyum6UKWn5tqXNiVNiU9MIT31+ZZgYpISm5LFtMpetOrXU0wb0hZ91KSnZlDcRB8TY0OexcSRnprVj3FxCZgYG2JqKBEV9YwJ83/j4C9jMNDXx1BPYuTszZzeMhlTE6PXxl5Yfbl4xues2X6SgOAo/rdqD99O6cPitVl9+/x4iIYte85Qu2p5urethSo9FVtrcyyKm2jNLzZBSbVKtu+8L6WMdK1jNy8qbVmMpKQUNKpUuUypTKGUpZlW2Ys27jjD+AHumOhnoslIR1KARNaP6q0HQZQoZkT9qvZy+3XbT/Lr3ud3NU9KTmPKwl/5uKUbU4d1emXsr/usCrZeKngUEExNJ1v586nuXA4TIwUJCQk52hsZGjDq87Z4bj/x2rjelE6J5OUkAqBWqzly5Ei+nrletWpVICshpaens3jxYubPn0/fvn3p2bMnJUqUeM0c3h4Tk2KYFsv9AHfbZjWZtGg3KSqJUv+OyT4JjaFnh48oZmb+mnqxjPdoSTEzc9wbVuFpRILcJigykWb1nDEvXoJre7U/vw5Dl7NwYg9aNXClmNmrD7z7+uV9jCo0OpnpI7oQGp0sn45rY2XBrwcu5tnOQF+PH+d+wfLNxzhz1Z+aTrbc9o+UtzjH929DdGwSC345kmP4qlwZSzq0qEX/qeteGdfbZGRsipFJzgOjLRvV4Ktl+1CmZ63EAIGhsUwYWB9j05xDN9sPXaRDi9q4VM46RpC9Jdq8vgtPIxLkNkGRiTSqXRlTs+KcvhqAuZkpZuZZ3+XpI7vidfYOwVFKarqWf23shdGXVhZm1K9ZiaPn76PKUOPrF0md6pWwtiyp1Y/ZvK/5c+tBCL5+kZy96seM2s5a80tJy+DMFb933p8KQ2P0DE1yndagbhWSUw+SkJqJpcW/61N4LENbuKNnlLPv9/11hRaNa1Khgj2SJKGQQGFoikKhIDAkmjv+kQzo0UKrzd61U7VeD5nmyaShnWlQ2ynXZbzodZ9VQdbLFVuOc/1eiNyXTg6lsbK0YIHn0Rxt9PQUfDWiM9MW7ybuLZy+rfPB9hePj7Ru3ZrOnTvn+6aLMTExANy5c4eJEyfyxx9/ULNmTZycnPjxxx9ZtmwZGRlFM66uUCjy/LOxKkHP9vU47n0XhUJBUFgMkkaiq3ttrt0JxHPHmTzraTQSH7eogUKhYMzn7hw7f0ee76kL95k4qD0KhYJyZay0/vT19bCxMsfSwuyVsSkUCjI1Up5/UbFJ7D3uQ9um1cnUSNiXsUKhp+Dg6ZvUqVaBEX1a5Wjz7eSe+NwNZNGGP8nUSGik59Ma1qpEr04N6Dd5LcpUlVa7YqbGrJk3iK+X7eHvKw9fGVf239vpy9z7s5Rlcbq2qcvpi/fkU3M1kkSnlm7cuPeUjbvPynV/P3QRIyMDrC2LExIRx/W7T9l19AoKhYJhvVty6sJdue7fl+8z1qMtCoWC6k72BIfHkJKqkodcrSzMqORQ+rX9WFh9GR2n5GnoM2q6ltNqf88/lEyNRDUne8xMjcnUSBgaGlDJwYZDZ26RqZHY9edV1JkaGtaqRKZGws4mayv5xIV777wvX/U5WZUsToeWtfC++hCFQkFYZBySJOHetAZ3Hgaz/aC3XHffX1cwNjLAqqQ54VFx3H4YxOHTN7O+A2Ex7PK6QNtmNQmPiuNp6DM27DyFRiNRxqak1p++ngJLCzMsihcrUD8WdL1csvFPeZ2sYF+KYb1bsv/kDcraWlKxvA2Th3RAImuofd6E7hzzvoOpqTHl7Kzo1NKNRrWdCq0vddojqVq1Km3bPj/wpKenh42NTb7vtTVt2jQyMzPx8fHh008/5ejRo/ItVpo3b86ePXuYNWsWixYteqO48jNmWVCLpvVm9qp9hD9LICQijp0rRmFgoI/PnUD2/HWNMZ+7515v+UgM9LMO7DWt50zPDvWZvXIfkgSfd2lE07pObz32GUt2seDLHtiVsqBcGUv6TlpDZqaGejUc+axjfTx3nMHM1Ii2TapTq0p5vH38OHAy67TE7PHUpnWdqOpkj5WFGZ2GryBR+Xz4wKGsNY1rVaKGazm+Xr6Xm/eD3vp70tX8L3uw8JeDRD5LJDQyjs0/DMfAQJ8b955y4OR1hvVuxa/7vZm1Iue59gfXfAlAo9pOdG0TzcKfDyJJ0LtTQxrWzrpIrWJ5G36Y2pt5qw9Qu6oDMXFK5ozrpnXmUEHkpy8B+kxaw+Qv2lPD2R59fX0u3vDnvl8wALPHdKFONQf+PHebZ3FKrbO2klNV9PryF6YP60QNl3JUKmfDgOnr38k69qamjezKyo1HiY5NJCI6nhVzBmOgr8+dh0EcO3sLj27N2X3kIos8D+Zou+mHoYRExDL8q7XExCWx+8jz4z+ffdwIfX2dtrXfiK7rZfY6WaGsNUfWTaRMKQuG9Xq+N7Vxzzk0GolN3w2he7u6jO73/Lh2fGIKrh1nFtp7UEg6fDMCAwNxdHTUeaHVq1end+/ejBgxAjs7uxzTt27dyi+//PJGT0xMTExkz549LFq0iKVLl9KhQwf5Ub75kZKSwv3796nkXDXPoa2CkCSJlGQlxczMC+WkgNxYfjTurcwXshKJm7Mtvn45h0QKS+qN1YUyn+y+LOPghJHJ2+nL9NRkjE3N3lpfOrSY9Fbm+y76EQqnL7P70ci6Qp5DWwUhSRIaVSp6RqZvrR/rf1I4F6Dm5n1aJ3XaI0lNTWXYsGEsWbIES0tLLl68yIMHDxg8eHC+OuR///sfvXr1ynO6u7t7rsdhXqVEiRIMGTJE6znygiAIwtun037bvHnzMDU1xdg462Kexo0bY2lpyeLFi/PVPq8k4uvrC2Q9ivfFoTNBEATh/aXTHkndunWZPn26VpmjoyM//PADM2bMyFF/zpw5+Tp4fv36dY4dO/baeoIgCML7Q6c9kpeHryRJYuvWrVhYWORaPzExkfDwcDSa3K/PyJ6HIAiC8OHRaY+kdevW9OjRg4YNG6JSqTh79ixhYWEsWbIk1/pDhgzBycmJYq85iP3w4UNdwhEEQRCKkE57JPXr12fJkiWoVCqCg4Np0qQJO3bsoHPnzrnWd3Nz00oic+bMwdvbO0c9V9fCvSOlIAiC8PbptEcCULlyZWbPng1AZGTkGz1j5J9//qFPnz45ymNjY7GyssqlhSAIgvC+0mmP5MiRI9SpU4fw8HAg63Tg//3vf/IV668za9YsLl26RGhoKGFhYYSFhREcHMzq1YVzHYEgCILw7ui0R/Lbb78xefJk+c69jo6OtG3bljlz5vDzzz+/tv23335LSEiI1oOwJElCoVDk615dgiAIwvtDp0TSrFkzBgwYoFWmr6/PpUuvvr10tl69elG/fn1sbW3lM8AkSWLPnj26hCMIgiAUIZ0SSXJystZxkaCgIH744QecnZ1f0zKLh4cHxYoVQ0/v+chaUFAQffv21SUcQRAEoQjplEgGDhzIsGHDMDIyQqVSERAQQMmSJfP9PBIDAwNOnz6NUvn8eR2pqans3btX7JUIgiB8YHRKJHZ2duzdu5czZ84QHByMnZ0dLVu2xNzc/PWNgYkTJ3LlyhUMDQ0xM8t6loNSqcz3begFQRCE94fOp/8aGRnRoUMHrbLTp0/j7u7+2rYWFhZcvXqVM2fO4OTkhKOjIzdu3CAsLEzXcARBEIQiUmg32/f29ua7777LV107Ozv09fVp1aoVe/dmPe+hevXqrFq1qrDCEQRBEN4RnfdIAFQqFV5eXvz222/cv38/3/f0T09Pp3379ixduhRHR0c8PDxISUlBrVYXJBxBEAShCOiUSKKioti+fTu7du0iPj6eZs2a8eWXX3L79u18tZ8+fTqNGjXCyckJNzc39PX1uXPnDp999pku4QiCIAhF6I0Sya1bt/j11185duwYJiYmdO/enfT0dObPnw9AgwYN8jUfhUKBg4MDt27donHjxlSuXBl3d3dKlCjx5u9AEARBKFL5TiTjx4/n5MmTVKxYkZkzZ9KtWzeKFSvG8uXL5Tqvu7tvtiNHjjBjxgwaN25M48aNcXFxYd68eXh4eFC9evU3fxeFIPsW9+lpqa+pqRtJkkhPT0Oh0Htrj/V0cbB+K/MF0NODcqVLkJqewSueBlAgGo1G69qigswHIEOVVuB55UaSIEOV/m9fvpVFvLW+fBf9CIXTl9n9qFGnF0ZIOUiShKRWoVEoxDqZh5SUFExMTF7bl/lOJCtXruTo0aMcOXKEhIQE0tPT8504XrZhwwaWLVvGkydPADA2NqZr167MmTNHPvj+rqWnZ31ZQ4MDi2T5hWHTnK5FHUKBpKWl6fydelF2X8ZEhBR4XkVF9OXzflQnRBRGSEXiQ+/H+/fvU7Vq1df2Zb4Tib6+Pl26dKFLly74+Pjw3XffYW5urnWAPC4uDktLy9fOq0mTJnTo0IGtW7fKZdHR0Tx9+jS/4RQ6CwsLHB0dMTY2LpStYuHNmZiYFMp8RF8WvcLoS9GP74f89KVOB9vr1atHvXr1CAkJYdu2bUyZMoXu3btz/fp1JkyY8Nr25ubmqFQqeXcyJCSEVatWUbduXV3CKRQGBgZYW7+93VDh3RF9+d8g+vHDoZAK4Rm3SqWS7du3s2bNGq5fv/7a+tHR0Xz33Xc8ffoUCwsLfHx8cHBwYO3atdjb2xc0HEEQBOEdKpREku3AgQN069YtX3UlSeL27duEhoZia2uLm5sbBgYFuqxFEARBKAKFmkgEQRCE/3/EESxBEAShQEQiEQRBEApEJBJBEAShQEQiEQRBEApEJBJBEAShQEQiEQRBEApEJJJ3ICYmhoULF7J+/XqWLFnywT13RaVSsXv37hxPxPz/SPTlf8eH3JfvWz+KRPIOTJw4kR49ejB8+HDKli2Lp6dnUYf0RpKTkyldujSBgYFFHUqRE3353/Eh9+X71o8ikbxlDx48ICAggGrVqgFZN6zctm2bfIvsD4GlpSWVKlUq6jCKnOjL/44PvS/ft34UieQtu3HjBjY2NvLrMmXKEB8fT1BQUBFG9ebe1vMaPiSiL/87/gt9+T71o0gkb1lCQgIWFhbya0NDQyBr11T4sIi+/O8QfVm4RCJ5yywtLeUH9ACkpmY9gfHFL7HwYRB9+d8h+rJwiUTylrm5uREeHi6/Dg0NxcbGRtwu/wMk+vK/Q/Rl4RKJ5C2rWrUqdnZ2PHr0CIBr167x+eefv1fjm/khbhIt+vK/5L/Ql+9TP4pE8g4sXbqUX3/9la1btxITE8PIkSOLOqQ3kpiYyIkTJwA4fPgwKpWqiCMqOqIv/zs+5L583/pRPI9EEARBKBCxRyIIgiAUiEgkgiAIQoGIRCIIgiAUiEgkgiAIQoGIRCIIgiAUiEgkgiAIQoGIRCIIgiAUiEgkgiAIQoGIRCIIgiAUiEgkgiAIQoGIRCIIgiAUiEgkgiAIQoGIRCIIgiAUiEgkgiAIQoGIRCIIgiAUiEgkgiAIQoGIRCIIgiAUiEgkwgcnNDSU5s2bExoaWtShFLpHjx4xbdo0Zs2a9dq6wcHBREZGvoOo/rsyMzPZs2cPXbt25fLly+9kmTdu3Hgny3mXDIo6AOE5tVrNxIkTWb16dVGH8l6zsbFh3Lhx2NjYFHUoha5EiRIEBwfj6Oj4ynpnzpwhPT2djh07vpvAXkOSJEaPHk316tUZP358nvU2bNhAbGwsSqWSxo0b06lTJ3na5cuXOXDgAPb29gQEBDBq1ChcXFy02qvVanbv3g1A2bJladCgAaampjrHraenR40aNXj48KHO83hTJUuWZOXKlUyYMAE9vf/Gtvx/4138R/z555+cOHHiP7nFUpiMjIzo06cPRkZGctnPP/9chBHllJSUxG+//fbG7cqUKUP58uVfWefu3bt4e3u/N0kEYMuWLdy5c+eVdbZt24a/vz/Tp09n3rx5bNy4Uf6uh4SEMGXKFL755hvGjRvHhAkT+OKLL4iOjpbbJyUlMXr0aKpVq0a/fv1o2bJlnkkkODiYw4cPvzZuhUKRI1m9bRUrVqRWrVqsXLnynS73bRKJ5D1y5MgRKlasyK+//lrUoXxQzp8/j6enZ1GHIUtLS2PSpEnEx8fr1F5fX/+V0+fMmUPv3r11mvfbcO3aNfT19alYsWKedTIzM1m9ejUff/wxkPUD3qpVK3nve9++fZQuXRpzc3MAHB0dKVOmDDt27ACy9njGjh1L7969qVWr1ivjiY+PZ8KECWRkZOQr/qLYK2jdujX//PMP/v7+73zZb4NIJO+Ja9euUbNmTQYMGMDx48dzHfsOCwtj0aJF/PTTT/Tt2xcvLy+t9osXL2bRokX06dOHe/fu8eTJE8aMGYO7uzuQtdU3YcIE+fWpU6cYOnQoq1at4ssvv6RVq1bExsayf/9+5syZw7Jly+jZs6fWl/3Ro0csWrSIFStW0Lt3by5cuEBCQgJjx47F1dWVDRs2yHUXL17M8OHDc/ygnj17lkaNGvHTTz8BcPHiRZo0acJPP/2EUqlk06ZNuLu7c/36dUaNGkWdOnXkPY7k5GTWrVuHu7s7ISEhRERE4OXlRUZGBitWrODUqVMA3Lp1C09PT2bOnEmvXr24d+8eSqWSNWvW0KZNG06fPo27uztff/01v/32G126dOHQoUN07dqVL774gm3btuHq6srly5dRq9Xs2LFDfv3gwQO+/vprRowYweHDh2nWrBmtW7fmr7/+AuCvv/7i8ePHXLp0iRUrVpCcnIxKpWLz5s14enrSu3dvlixZgiRJAKSkpDB37lxWrFjBrFmzXrllf/XqVSIiInB1dQWQ35O7uzu+vr5MmjSJevXqMXPmTOLj45k8eTL169dn7NixZGZmAhAYGMjUqVPx9PTEw8ND3nO6f/8+/fv3x9XVlb/++ovIyEhatmzJ1q1b84wnNjaWo0ePMnDgwDzrQNZeVFxcHA4ODnJZ5cqVuXr1Kmq1mqSkJCIjI+XPBKB8+fLyZ3Hw4EGePn1KSEgI48aNY+rUqUREROS6rEOHDhEcHMzx48flRJWYmMgPP/zAqlWrGD9+PLNnzyYlJSXX9tnf+8OHD6NSqdBoNOzcuZN169bRv39/Zs6cSVpaGn5+fsycOZPhw4dz8uRJOnbsSIsWLbh79y4AGo2G5cuXs3nzZkaNGsXQoUO1ltOgQQM2b978ys/tgyEJ74UpU6ZIMTExklKplOrWrSstX75ca3paWpr0ySefSKGhoZIkSdLWrVslNzc3KTMzU/L395e6d+8uZWZmSpIkSWPHjpWGDBkiSZIk7d27V2rdurU8nxdfp6SkSJ06dZL69OkjBQUFSTt27JASExOlKlWqSGFhYZIkSdLQoUOlBQsWSJIkSTExMVLHjh2lpKQkSZIk6bvvvpPat28vSZIkJSUlSY0aNZL27dsnL2vp0qVSQEBAru+3f//+0o8//pjjtVqtlnx9fSUXFxfJ09NTSk1NlY4cOSJVq1ZNSklJkdRqteTj4yO5uLhIwcHBkiRJ0qVLlyQXFxd5XhEREdKsWbPk1/PmzZNat24tpaenS1evXpVcXFykdevWSb6+vtLff/8thYSESC4uLtL8+fMlPz8/6ejRo5IkSZKLi4t06dIleT7ZrzMzM6V58+ZJbdq0kc6ePSulpKRIkydPltzc3OT+efn9/fDDD5K/v78kSZIUGRkpVatWTdq1a5ckSZI0bdo0adu2bZIkSZJarZY6deokzZgxI9fPbfHixVL//v3l12q1Wrp27Zrk4uIibdu2Tes9/vTTT5JSqZQiIiKk6tWrS+fPn5ckSZLGjx8vrV69WpIkSTpy5IhUt25deX5xcXFSs2bNpO+//17y9vaW48pNZmamNGfOHCkxMTHX9/yiP//8U3JxcZHi4uLksrNnz0ouLi5SVFSUdOHCBcnFxUXavn27JEmSlJCQIH366afSuHHjJEmSJA8PD2nChAlSWlqapFKppP79+0sdO3aUMjIycl1e69atpb1798qvhwwZIp08eVKSJEnSaDRSv379pEmTJsnTs/vWz89PmjlzppSWliZP+/XXX6Vz585JkiRJSqVSatKkibRixQpJrVbL3wNvb29Jo9FIQ4cOlSZPnixJkiT9/fff0uzZs+XPatGiRVox7tq1S2rSpEmen++HRBxsfw8EBwdjZmaGlZUVAN27d+ePP/5gzJgxGBsbA1kHVw0NDSlbtiwAHh4etGnTBj09PX7//XcaNGgg76L/8MMPqFSq1y7X1NQUKysrGjRoQPny5enbty+QdUDUzs6OmzdvEhcXJx/U3r9/P05OTvLww+TJkxkyZAgA5ubmDB48mE2bNtGtWzcyMjIIDw9/5XBHbvT19SlZsiQAn3zyCSYmJlSvXh21Wk1cXBxly5Z97UH2Q4cOkZiYyJYtW4CsYyoVK1YkMTERW1tbADp27Cgfi5D+3Qpu164dTk5OODk5vXL+enp6WFpaYmdnR4sWLQCYPn06Xl5eeHt75xh2kiSJw4cPY2try/nz5wFo0aIFSUlJBAcHc+jQIaZMmSK//5o1a+a57ICAACwtLbU+r9KlSwPQsmVLjIyMqFOnDgAfffQRZmZmmJmZUapUKZ49ewbA2LFjsbKyIjo6mtu3b6NUKuX5lSxZkoULFzJmzBiSk5NZsGBBnrFs3LiRPn36ULx48Vd+XpA1lAVgYmIil2UPPRkYGNC4cWNWrlzJzp07uX37NtWqVcPPz4/WrVsDWXtLkyZNkteHUaNGMWTIEHx8fGjYsOErl/3gwQO8vb1ZtWqVHEv//v2ZNGkSX331lfz53b17l5s3b7J06VKt4287duygZ8+ePH78GMjak1CpVPJ31c7OjqZNmwJQvXp1+biPmZkZ+/btw9bWlkGDBvHFF19oxWVjY8OzZ89ISkrK12f4PhOJ5D2wbds21Go1S5cuBSA9PZ34+HgOHz7MZ599BmQlm/T0dLmNvr4+9vb28rRy5crJ07J/6PNDoVDIK3k2ExMT5s2bR4cOHXB2dpZ/aF+OwdjYWP5hhqzktnHjRo4fP05GRgYdOnTIdxwvx/Si7GMGGo0m1+kvCw0NxcXFhcGDB+eYFhISkmMe2f9/3XxfxdbWlpIlS8o/1i+KjY0lPj6eAQMGyO8lO7bjx48jSRJmZmY54slNenp6jgPMeX1eL9LT05M/vzJlyrBmzRocHBxo0KABmzZt0qrbsmVLnJ2duXv3Lmq1GgOD3H8mVq1axdq1a+XXKSkp3Lx5k+PHj+c40G1nZwdAQkKCnEyUSiWmpqZYWFgA0KlTJ/ksrv3796PRaOjRoweQdYxFrVbL86tatSoAcXFxucb2ooCAAACt9hUqVAAgIiJCTiQ+Pj5cuXKFyMhIrRMeQkND+fjjj+X38KKXP3sDAwN5falfvz4LFy5kyZIlbNmyha+//lp+P4CcFP8LiUQcIyliSqWS6Ohovv32W6ZOncrUqVNZsGABzZs31zrrx87OjoCAAAIDA+WyJ0+eEBERgZ2dHWfPnpXHwCHruANk/YC8WP46T58+ZdSoUUyZMoVGjRppTbOzs+PatWskJibKZT4+PnJyMTc3p3///nh6esrHIPLypnG9CVtbW44cOaL1w/HgwQOtuPPjxR/f/FCpVLmetluyZEkUCgVHjhzRKr9y5Yr8A/Lo0aN8LcPKyirPsf38Gj9+PJUqVaJfv34UK1Ysx/SdO3cyceJE4uPjtRLFy/766y8OHDgg/9WoUYO+ffuyfv36HHWrVauGjY0Nfn5+ctmTJ09o1KhRjoPdycnJ/PTTT4wZM0b+Qa9atSpPnjyR62QnN2dn59e+3+yNrJdP8TU0NNTqr4EDB9KgQQO+/PJLrT16W1tbDhw4oNX2ypUrr11uUFAQn376KcePH6dbt2588803BAcHy9PT0tKArFO+P3QikRSx7du3061btxzln3/+OQ8ePJCHQlq1aoWlpSXjx4/nwoULnD9/ns2bN1OmTBl69OhBWFgYU6ZM4caNG+zfv5979+4Bz3efAwMDCQkJ4fz58yQmJmr9GL34g/7w4UPS0tKIj48nLCwMf39/0tLSCAwMpHPnzqjVasaNG8e1a9c4fvw4f//9t7xlBTBo0CCCgoKoXLnyK88+KlWqFL6+vqSnp3Pu3DnCw8OJiYkhIyND/vGWXjjw+uLrl//NHoaIi4vj4cOHfPLJJ4SEhDB06FDOnj3LyZMn+eOPP7RW2NwSxMtlpUqVwsfHh7S0NPbv3w9ATEyMnKCioqLkujdu3MDS0pI2bdrIMcXHxxMbG0tcXBzdunVj7ty5bNq0iatXr7J06VIUCgV16tTB3t6eZcuWkZycTEZGBmFhYfJn8bKaNWsSHh7+ys/l5fKXX9+5c4fY2FhUKhWXLl0CIDw8nISEBO7fv09cXBytWrVi/vz5eHp6yt+ll5UrV07rz9jYmBIlSlCmTBkAdu3axeLFi8nMzMTAwIBBgwbJJ0NoNBrOnz/PqFGjtOapUqmYPn06bdq0YezYsXL5qFGjOH36tPy9vXbtGu7u7lSuXDnX2AwNDYmPj+fp06e4uLhQt25dfv/9d3m6j48Pffr0oUSJElqf3/fff09CQgJz586V6/bo0YPVq1ezcuVKrly5wvr16+XTkjMzM/P8nG/fvs25c+cwMzPjm2++yZEwIiIicHR0fKMRhPeVSCRF6MCBA3h6enL9+nViY2Pl8uTkZG7fvg3A3LlzOXnyJObm5mzYsAFTU1PGjh3L9u3b5Qu/ateuzZIlS7h79y6jRo3iwYMH8tBJkyZNaN26Nb169WLDhg00btwYR0dHjh49ire3N48ePeLkyZPyuG6TJk2oXr06vXr1YufOnXTo0AEfHx/Cw8MpV64ca9asIS4ujpEjR3Lq1KkcPwQWFha0adOGXr16vfK9jx49msePH9O5c2d5Sz77fe/btw/IOlMnMjJSHiY5cOAAKSkp8vQDBw6QmppKlSpVqF27Nh4eHqSmplK+fHnWrl1LQkICkyZNYu/evYwbNw6lUilfzLZp0yaePXtGRkaGvOe3Y8cOrS3G6dOns3nzZgYPHoybmxtWVlbcu3dPHk7JyMjgp59+YsuWLezatYstW7bISbVr164cOnSIX375BWtra77++mu6du3K2rVrmTFjBk5OTnz00UeYmJiwZs0a1Go1nTp1YsGCBRQvXhwjIyNu3ryZ43Nr164dQUFB8hZzamqqnOQOHDhAbGws27dvB+Do0aNERUVx6NAhoqKiOHXqFKGhoYwYMYI1a9YwevRoGjRogJWVFVu3biUsLIwxY8bIQ6alSpXC0NCQCRMmyHu4b+Ls2bPs27ePs2fPAjB06FDMzc1ZuXIl3333HWPGjKF27dpA1vDR4cOHWbZsGX369OGbb77R2lNp2bIlU6ZMYf78+WzdupULFy7www8/5Lnsnj17smbNGv78809MTEz46aef0Gg0TJgwgVWrVhEbG8tXX31Fenq6fFbasWPHSE9Pp02bNuzbt4/Zs2cTHBzMsGHDGDZsGHv27GHy5MkAdO7cmYCAAC5evIi/vz8XL17k8ePHXLlyBT8/P3mPZdKkSSxatIhVq1YxYcIErSGzBw8eaF2Q+SFTSC+nU0EogOTkZBYtWsT8+fOLOpS36qeffuLKlSs6XXRYUHPmzKFNmza0bNnynS/7TXl5eVG2bFnq1q1b1KG8VzIzM+nevTtbtmyRT7L5kImD7UKhOHnyJEqlksuXL9O/f/+iDuetkyQpx5DGuzJ9+nRmzZpFkyZNMDQ0LJIY8uPhw4fExcXxySefFHUo7519+/bJZ8/9F4ihLaFQHD16lCVLltCoUSOqV69e1OG8Vb6+vly4cAF/f3/OnTv3zpdvbm7ON998w++//17gA+9vU/HixRkwYEBRh/HeuXDhAlZWVjqf1fg+EkNbgvABS05O1jp1WHj/KZXK/8QB9heJRCIIgiAUiBjaEgRBEApEJBJBEAShQEQiEQRBEApEJBJBEAShQEQiEQRBEApEJBJBEAShQEQiEQRBEApEJBJBEAShQP4P5EsOzb44yQoAAAAASUVORK5CYII=",
      "text/plain": [
       "<Figure size 420x170 with 3 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "fig, axs = plt.subplots(1, 3, figsize=(4.2, 1.7))\n",
    "sns.despine(fig)\n",
    "\n",
    "def round_down(x, decimals=2):\n",
    "    x = np.asarray(x, dtype=float)\n",
    "    f = 10**decimals\n",
    "    return np.floor(x * f) / f\n",
    "\n",
    "for didx, dataset in enumerate([\"gsm8k\", \"mmlu\", \"math\"]):\n",
    "    ax = axs[didx]\n",
    "    disp = ConfusionMatrixDisplay(cm_dict[dataset], display_labels=[0,1])\n",
    "    disp.plot(ax=ax, colorbar=False, values_format='.3f', cmap='Blues')\n",
    "    ax.set_title(dataset.upper(), fontsize=11)\n",
    "    ax.set_xlabel(None); ax.set_ylabel(None)\n",
    "    if didx > 0:\n",
    "        ax.set_yticklabels([])\n",
    "\n",
    "fig.supxlabel(\"Accuracy uniterrupted (max 4,096 tokens)\", fontsize=11, y=-0.1)\n",
    "fig.supylabel(\"Accuracy w/\\nearly termination\", fontsize=11, x=-0.01)\n",
    "\n",
    "# fig.tight_layout()\n",
    "plt.show()"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "reasoning",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.11"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
