{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "/teamspace/studios/this_studio\n",
      "/teamspace/studios/this_studio/embedding-text-structure/project\n",
      "/teamspace/studios/this_studio/embedding-text-structure/project\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/zeus/miniconda3/envs/cloudspace/lib/python3.10/site-packages/IPython/core/magics/osm.py:417: UserWarning: This is now an optional IPython functionality, setting dhist requires you to install the `pickleshare` library.\n",
      "  self.shell.db['dhist'] = compress_dhist(dhist)[-100:]\n"
     ]
    }
   ],
   "source": [
    "!pwd\n",
    "%cd embedding-text-structure/project/\n",
    "!pwd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "\n",
    "from pathlib import Path\n",
    "\n",
    "from needle_haystack_similarity_plotting import * "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "WARNING: (other) intfloat_e5-mistral-7b-instruct not found\n",
      "WARNING: google-bert_bert-base-uncased not found\n"
     ]
    }
   ],
   "source": [
    "DATA_PATH = \"./data\"\n",
    "\n",
    "\n",
    "model_dirs = filter(\n",
    "    lambda x: x.is_dir(), Path(DATA_PATH).glob(\"*\")\n",
    ")  # Note the path here jic\n",
    "models = list(map(lambda x: x.parts[-1], model_dirs))\n",
    "\n",
    "cs_model_keywords = [\"embed-english-v3.0\", \"text-embedding-3-small\"] # \"embed-english-v3.0\", \n",
    "os_model_keywords = [\n",
    "    \"BAAI_bge-m3\",\n",
    "    \"jinaai_jina-embeddings-v2-base-en\",\n",
    "    \"dwzhu_e5rope-base\",\n",
    "    \"mosaicml_mosaic-bert-base-seqlen-1024\",\n",
    "    \"nomic-ai_nomic-embed-text-v1.5\",\n",
    "    \"intfloat_e5-large-v2\",\n",
    "]\n",
    "model_keywords = cs_model_keywords + os_model_keywords\n",
    "\n",
    "relevant_models = []\n",
    "for model in models: \n",
    "    if model in model_keywords:\n",
    "        relevant_models.append(model)\n",
    "    else: \n",
    "        print(f\"WARNING: {model} not found\")\n",
    "# graph_total_avgs(relevant_models, mode=\"insert\") # insert or remove\n",
    "# graph_total_avgs(relevant_models, mode=\"remove\") # insert or remove\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "mode = 'insert'\n",
    "model_names = relevant_models\n",
    "inserts = [0.05, 0.1, 0.2, 0.5, 1]\n",
    "removes = [0.05, 0.1, 0.2, 0.5]\n",
    "input_sizes = inserts if mode == 'insert' else removes\n",
    "posns = [0, 0.5, 1]\n",
    "\n",
    "# Get the average data for the models\n",
    "total_avgs = get_total_avgs(model_names, posns, input_sizes, mode=mode)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'dwzhu_e5rope-base': [0.83150995, 0.9620588, 0.9610531],\n",
       " 'BAAI_bge-m3': [0.93733865, 0.97115064, 0.9787945],\n",
       " 'intfloat_e5-large-v2': [0.9522503, 0.9647754, 0.97599393],\n",
       " 'text-embedding-3-small': [0.9232778, 0.9691427, 0.9637714],\n",
       " 'jinaai_jina-embeddings-v2-base-en': [0.985457, 0.99956316, 0.999718],\n",
       " 'nomic-ai_nomic-embed-text-v1.5': [0.90284675, 0.98397774, 0.9883496],\n",
       " 'embed-english-v3.0': [0.9394447, 0.96336883, 0.9760959],\n",
       " 'mosaicml_mosaic-bert-base-seqlen-1024': [0.9960022, 0.9965006, 0.9972786]}"
      ]
     },
     "execution_count": 17,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# total_avgs.keys()\n",
    "total_avgs[.1]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Begin</th>\n",
       "      <th>Mid</th>\n",
       "      <th>End</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>dwzhu_e5rope-base</th>\n",
       "      <td>0.831510</td>\n",
       "      <td>0.962059</td>\n",
       "      <td>0.961053</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BAAI_bge-m3</th>\n",
       "      <td>0.937339</td>\n",
       "      <td>0.971151</td>\n",
       "      <td>0.978795</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>intfloat_e5-large-v2</th>\n",
       "      <td>0.952250</td>\n",
       "      <td>0.964775</td>\n",
       "      <td>0.975994</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>text-embedding-3-small</th>\n",
       "      <td>0.923278</td>\n",
       "      <td>0.969143</td>\n",
       "      <td>0.963771</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>jinaai_jina-embeddings-v2-base-en</th>\n",
       "      <td>0.985457</td>\n",
       "      <td>0.999563</td>\n",
       "      <td>0.999718</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>nomic-ai_nomic-embed-text-v1.5</th>\n",
       "      <td>0.902847</td>\n",
       "      <td>0.983978</td>\n",
       "      <td>0.988350</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>embed-english-v3.0</th>\n",
       "      <td>0.939445</td>\n",
       "      <td>0.963369</td>\n",
       "      <td>0.976096</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>mosaicml_mosaic-bert-base-seqlen-1024</th>\n",
       "      <td>0.996002</td>\n",
       "      <td>0.996501</td>\n",
       "      <td>0.997279</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                          Begin       Mid       End\n",
       "dwzhu_e5rope-base                      0.831510  0.962059  0.961053\n",
       "BAAI_bge-m3                            0.937339  0.971151  0.978795\n",
       "intfloat_e5-large-v2                   0.952250  0.964775  0.975994\n",
       "text-embedding-3-small                 0.923278  0.969143  0.963771\n",
       "jinaai_jina-embeddings-v2-base-en      0.985457  0.999563  0.999718\n",
       "nomic-ai_nomic-embed-text-v1.5         0.902847  0.983978  0.988350\n",
       "embed-english-v3.0                     0.939445  0.963369  0.976096\n",
       "mosaicml_mosaic-bert-base-seqlen-1024  0.996002  0.996501  0.997279"
      ]
     },
     "execution_count": 24,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df = pd.DataFrame.from_dict(total_avgs[.1], orient='index', columns=['Begin', 'Mid', 'End'])\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Begin</th>\n",
       "      <th>Mid</th>\n",
       "      <th>End</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>count</th>\n",
       "      <td>8.000000</td>\n",
       "      <td>8.000000</td>\n",
       "      <td>8.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>mean</th>\n",
       "      <td>0.933516</td>\n",
       "      <td>0.976317</td>\n",
       "      <td>0.980132</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>std</th>\n",
       "      <td>0.051344</td>\n",
       "      <td>0.015065</td>\n",
       "      <td>0.014203</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>min</th>\n",
       "      <td>0.831510</td>\n",
       "      <td>0.962059</td>\n",
       "      <td>0.961053</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25%</th>\n",
       "      <td>0.918170</td>\n",
       "      <td>0.964424</td>\n",
       "      <td>0.972938</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50%</th>\n",
       "      <td>0.938392</td>\n",
       "      <td>0.970147</td>\n",
       "      <td>0.977445</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>75%</th>\n",
       "      <td>0.960552</td>\n",
       "      <td>0.987108</td>\n",
       "      <td>0.990582</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>max</th>\n",
       "      <td>0.996002</td>\n",
       "      <td>0.999563</td>\n",
       "      <td>0.999718</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "          Begin       Mid       End\n",
       "count  8.000000  8.000000  8.000000\n",
       "mean   0.933516  0.976317  0.980132\n",
       "std    0.051344  0.015065  0.014203\n",
       "min    0.831510  0.962059  0.961053\n",
       "25%    0.918170  0.964424  0.972938\n",
       "50%    0.938392  0.970147  0.977445\n",
       "75%    0.960552  0.987108  0.990582\n",
       "max    0.996002  0.999563  0.999718"
      ]
     },
     "execution_count": 25,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df.describe()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "dict_keys([0.05, 0.1, 0.2, 0.5, 1])"
      ]
     },
     "execution_count": 26,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "total_avgs.keys()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Begin</th>\n",
       "      <th>Mid</th>\n",
       "      <th>End</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>dwzhu_e5rope-base</th>\n",
       "      <td>0.809360</td>\n",
       "      <td>0.946518</td>\n",
       "      <td>0.948495</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BAAI_bge-m3</th>\n",
       "      <td>0.857652</td>\n",
       "      <td>0.939189</td>\n",
       "      <td>0.950730</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>intfloat_e5-large-v2</th>\n",
       "      <td>0.929681</td>\n",
       "      <td>0.952526</td>\n",
       "      <td>0.966022</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>text-embedding-3-small</th>\n",
       "      <td>0.896385</td>\n",
       "      <td>0.948343</td>\n",
       "      <td>0.931394</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>jinaai_jina-embeddings-v2-base-en</th>\n",
       "      <td>0.982490</td>\n",
       "      <td>0.998748</td>\n",
       "      <td>0.999269</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>nomic-ai_nomic-embed-text-v1.5</th>\n",
       "      <td>0.861660</td>\n",
       "      <td>0.976784</td>\n",
       "      <td>0.984089</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>embed-english-v3.0</th>\n",
       "      <td>0.906600</td>\n",
       "      <td>0.947951</td>\n",
       "      <td>0.959628</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>mosaicml_mosaic-bert-base-seqlen-1024</th>\n",
       "      <td>0.986083</td>\n",
       "      <td>0.989727</td>\n",
       "      <td>0.991884</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                          Begin       Mid       End\n",
       "dwzhu_e5rope-base                      0.809360  0.946518  0.948495\n",
       "BAAI_bge-m3                            0.857652  0.939189  0.950730\n",
       "intfloat_e5-large-v2                   0.929681  0.952526  0.966022\n",
       "text-embedding-3-small                 0.896385  0.948343  0.931394\n",
       "jinaai_jina-embeddings-v2-base-en      0.982490  0.998748  0.999269\n",
       "nomic-ai_nomic-embed-text-v1.5         0.861660  0.976784  0.984089\n",
       "embed-english-v3.0                     0.906600  0.947951  0.959628\n",
       "mosaicml_mosaic-bert-base-seqlen-1024  0.986083  0.989727  0.991884"
      ]
     },
     "execution_count": 29,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model_sums = {}\n",
    "model_counts = {}\n",
    "\n",
    "# Iterate through the outer dictionary (by size)\n",
    "for size, inner_dict in total_avgs.items():\n",
    "    for model, values in inner_dict.items():\n",
    "        if model not in model_sums:\n",
    "            model_sums[model] = np.zeros(len(values))\n",
    "            model_counts[model] = 0\n",
    "        model_sums[model] += np.array(values)\n",
    "        model_counts[model] += 1\n",
    "\n",
    "# Calculate the average for each model\n",
    "model_avgs = {model: model_sums[model] / model_counts[model] for model in model_sums}\n",
    "\n",
    "# Convert the result to a DataFrame\n",
    "df_avgs = pd.DataFrame.from_dict(model_avgs, orient='index', columns=['Begin', 'Mid', 'End'])\n",
    "\n",
    "# Display the DataFrame with the averages\n",
    "df_avgs"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['dwzhu_e5rope-base',\n",
       " 'BAAI_bge-m3',\n",
       " 'intfloat_e5-large-v2',\n",
       " 'text-embedding-3-small',\n",
       " 'jinaai_jina-embeddings-v2-base-en',\n",
       " 'nomic-ai_nomic-embed-text-v1.5',\n",
       " 'embed-english-v3.0',\n",
       " 'mosaicml_mosaic-bert-base-seqlen-1024']"
      ]
     },
     "execution_count": 33,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "list(df_avgs.index)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 42,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Begin</th>\n",
       "      <th>Mid</th>\n",
       "      <th>End</th>\n",
       "      <th>posn_encoding</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>dwzhu_e5rope-base</th>\n",
       "      <td>0.809360</td>\n",
       "      <td>0.946518</td>\n",
       "      <td>0.948495</td>\n",
       "      <td>ROPE</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>BAAI_bge-m3</th>\n",
       "      <td>0.857652</td>\n",
       "      <td>0.939189</td>\n",
       "      <td>0.950730</td>\n",
       "      <td>APE</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>intfloat_e5-large-v2</th>\n",
       "      <td>0.929681</td>\n",
       "      <td>0.952526</td>\n",
       "      <td>0.966022</td>\n",
       "      <td>APE</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>text-embedding-3-small</th>\n",
       "      <td>0.896385</td>\n",
       "      <td>0.948343</td>\n",
       "      <td>0.931394</td>\n",
       "      <td>NA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>jinaai_jina-embeddings-v2-base-en</th>\n",
       "      <td>0.982490</td>\n",
       "      <td>0.998748</td>\n",
       "      <td>0.999269</td>\n",
       "      <td>ALIBI</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>nomic-ai_nomic-embed-text-v1.5</th>\n",
       "      <td>0.861660</td>\n",
       "      <td>0.976784</td>\n",
       "      <td>0.984089</td>\n",
       "      <td>ROPE</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>embed-english-v3.0</th>\n",
       "      <td>0.906600</td>\n",
       "      <td>0.947951</td>\n",
       "      <td>0.959628</td>\n",
       "      <td>NA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>mosaicml_mosaic-bert-base-seqlen-1024</th>\n",
       "      <td>0.986083</td>\n",
       "      <td>0.989727</td>\n",
       "      <td>0.991884</td>\n",
       "      <td>ALIBI</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                          Begin       Mid       End  \\\n",
       "dwzhu_e5rope-base                      0.809360  0.946518  0.948495   \n",
       "BAAI_bge-m3                            0.857652  0.939189  0.950730   \n",
       "intfloat_e5-large-v2                   0.929681  0.952526  0.966022   \n",
       "text-embedding-3-small                 0.896385  0.948343  0.931394   \n",
       "jinaai_jina-embeddings-v2-base-en      0.982490  0.998748  0.999269   \n",
       "nomic-ai_nomic-embed-text-v1.5         0.861660  0.976784  0.984089   \n",
       "embed-english-v3.0                     0.906600  0.947951  0.959628   \n",
       "mosaicml_mosaic-bert-base-seqlen-1024  0.986083  0.989727  0.991884   \n",
       "\n",
       "                                      posn_encoding  \n",
       "dwzhu_e5rope-base                              ROPE  \n",
       "BAAI_bge-m3                                     APE  \n",
       "intfloat_e5-large-v2                            APE  \n",
       "text-embedding-3-small                           NA  \n",
       "jinaai_jina-embeddings-v2-base-en             ALIBI  \n",
       "nomic-ai_nomic-embed-text-v1.5                 ROPE  \n",
       "embed-english-v3.0                               NA  \n",
       "mosaicml_mosaic-bert-base-seqlen-1024         ALIBI  "
      ]
     },
     "execution_count": 42,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model_to_posn_encoding = {\n",
    "    \"BAAI_bge-m3\": \"APE\",\n",
    "    \"jinaai_jina-embeddings-v2-base-en\": \"ALIBI\",\n",
    "    \"dwzhu_e5rope-base\": \"ROPE\",\n",
    "    \"mosaicml_mosaic-bert-base-seqlen-1024\": \"ALIBI\",\n",
    "    \"nomic-ai_nomic-embed-text-v1.5\": \"ROPE\",\n",
    "    \"intfloat_e5-large-v2\": \"APE\",\n",
    "    \"text-embedding-3-small\": \"NA\",\n",
    "    \"embed-english-v3.0\": \"NA\",\n",
    "}\n",
    "# df[\"posn_encoding\"] = df_avgs.index.apply(lambda x: model_to_posn_encoding[x])\n",
    "df_avgs[\"posn_encoding\"] = df_avgs.index.to_series().apply(lambda x: model_to_posn_encoding[x])\n",
    "df_avgs\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 44,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Begin</th>\n",
       "      <th>Mid</th>\n",
       "      <th>End</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>posn_encoding</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>ALIBI</th>\n",
       "      <td>0.984286</td>\n",
       "      <td>0.994237</td>\n",
       "      <td>0.995577</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>APE</th>\n",
       "      <td>0.893666</td>\n",
       "      <td>0.945857</td>\n",
       "      <td>0.958376</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>NA</th>\n",
       "      <td>0.901493</td>\n",
       "      <td>0.948147</td>\n",
       "      <td>0.945511</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ROPE</th>\n",
       "      <td>0.835510</td>\n",
       "      <td>0.961651</td>\n",
       "      <td>0.966292</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                  Begin       Mid       End\n",
       "posn_encoding                              \n",
       "ALIBI          0.984286  0.994237  0.995577\n",
       "APE            0.893666  0.945857  0.958376\n",
       "NA             0.901493  0.948147  0.945511\n",
       "ROPE           0.835510  0.961651  0.966292"
      ]
     },
     "execution_count": 44,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_avgs_grouped = df_avgs.groupby('posn_encoding').mean()\n",
    "df_avgs_grouped"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "research",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
