{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# P-BERT: Computing Inverted Computational Complexity Ratio, Number of Operations (Normalized), Estimated Inference Time\n",
    "This notebook illustrates the computations of the above three metrics for P-BERT. The results are as depicted in the paper Tables 1-4."
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Setup\n",
    "The data is the results obtained from our methodology."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "data = {\n",
    "    \"rte\": [\n",
    "        [[12, 58, 49, 52, 26, 27, 26, 29, 66, 18, 5], [0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0]],\n",
    "        [[12, 58, 49, 52, 26, 27, 26, 67, 67, 18, 5], [0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0]], \n",
    "        [[13, 23, 20, 53, 15, 21, 36, 25, 37, 65, 5], [2, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1]], \n",
    "        [[34, 24, 57, 17, 57, 66, 58, 56, 68, 34, 55], [1, 1, 1, 0, 0, 1, 0, 0, 1, 0, 1]],\n",
    "        [[34, 39, 2, 30, 32, 8, 52, 29, 44, 39, 13], [2, 2, 1, 1, 1, 1, 1, 0, 2, 0, 2]], \n",
    "        [[55, 24, 62, 56, 57, 66, 59, 67, 68, 64, 57], [1, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1]], \n",
    "    ], \n",
    "    \"mrpc\": [\n",
    "        [[4, 4, 2, 7, 25, 2, 57, 4, 31, 38, 36], [1, 1, 2, 1, 2, 1, 1, 0, 0, 0, 1]], \n",
    "        [[22, 3, 2, 42, 27, 7, 16, 49, 56, 38, 39], [1, 1, 1, 1, 0, 1, 1, 2, 0, 1, 1]], \n",
    "        [[22, 3, 2, 42, 27, 7, 17, 49, 56, 38, 40], [1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1]],\n",
    "        [[22, 3, 3, 42, 27, 61, 61, 66, 56, 38, 40], [1, 1, 0, 1, 0, 1, 0, 0, 0, 1, 1]], \n",
    "        [[23, 31, 4, 4, 21, 64, 37, 45, 37, 12, 45], [1, 2, 1, 1, 0, 1, 1, 0, 1, 0, 1]],\n",
    "        [[25, 21, 47, 23, 15, 51, 67, 67, 37, 35, 62], [1, 1, 1, 1, 2, 1, 2, 1, 0, 0, 1]], \n",
    "        [[45, 31, 4, 23, 15, 5, 62, 49, 38, 13, 61], [1, 1, 1, 1, 2, 1, 2, 0, 1, 0, 1]], \n",
    "        [[54, 57, 3, 14, 54, 59, 61, 1, 40, 19, 34], [0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0]], \n",
    "        [[54, 57, 3, 14, 54, 59, 61, 1, 41, 5, 34], [0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1]], \n",
    "        [[54, 57, 3, 14, 54, 59, 61, 66, 35, 5, 63], [1, 2, 0, 1, 0, 0, 0, 0, 0, 0, 1]], \n",
    "    ], \n",
    "    \"stsb\": [\n",
    "        [[7, 27, 63, 42, 36, 31, 44, 4, 44, 2, 24], [1, 2, 1, 0, 0, 0, 0, 0, 0, 0, 0]],\n",
    "        [[8, 27, 63, 42, 36, 31, 44, 6, 44, 14, 23], [1, 2, 1, 2, 1, 0, 0, 0, 0, 0, 1]], \n",
    "        [[9, 40, 13, 42, 35, 33, 63, 6, 7, 28, 64], [1, 1, 1, 2, 2, 0, 0, 0, 0, 0, 0]],\n",
    "        [[10, 9, 20, 1, 15, 59, 21, 14, 44, 65, 48], [1, 2, 0, 1, 2, 0, 0, 0, 0, 0, 2]], \n",
    "        [[14, 46, 34, 28, 56, 13, 46, 43, 23, 26, 53], [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]], \n",
    "        [[15, 63, 33, 42, 35, 33, 63, 7, 7, 28, 64], [1, 1, 1, 2, 2, 0, 0, 0, 0, 0, 0]],\n",
    "        [[15, 63, 33, 42, 56, 32, 63, 44, 7, 28, 64], [1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0]], \n",
    "        [[19, 1, 58, 45, 35, 44, 22, 58, 64, 57, 4], [1, 2, 1, 2, 1, 2, 2, 2, 2, 2, 2]],\n",
    "        [[48, 51, 11, 6, 20, 48, 50, 3, 9, 27, 26], [1, 1, 1, 1, 0, 0, 0, 2, 0, 0, 0]],\n",
    "        [[54, 7, 20, 1, 15, 48, 52, 14, 67, 7, 39], [1, 2, 2, 1, 1, 0, 0, 0, 2, 0, 2]],\n",
    "    ], \n",
    "    \"cola\": [\n",
    "        [[1, 24, 7, 13, 55, 65, 19, 40, 2, 12, 18], [0, 0, 2, 0, 1, 1, 1, 0, 0, 0, 0]], \n",
    "        [[4, 16, 17, 15, 21, 3, 49, 33, 53, 24, 2], [1, 2, 2, 0, 1, 1, 0, 0, 1, 0, 1]], \n",
    "        [[4, 18, 6, 13, 21, 6, 5, 33, 49, 24, 38], [1, 2, 2, 1, 1, 1, 0, 0, 1, 0, 1]],\n",
    "        [[5, 25, 63, 11, 11, 8, 11, 42, 4, 2, 18], [0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0]], \n",
    "        [[5, 26, 63, 11, 10, 64, 11, 41, 1, 67, 24], [0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0]], \n",
    "        [[11, 18, 19, 64, 22, 53, 50, 46, 3, 1, 7], [2, 0, 1, 2, 0, 1, 2, 1, 0, 0, 0]], \n",
    "        [[11, 18, 19, 64, 22, 53, 50, 46, 3, 1, 21], [2, 0, 1, 2, 1, 1, 0, 1, 0, 0, 0]], \n",
    "        [[13, 18, 17, 8, 4, 3, 50, 31, 3, 1, 4], [1, 0, 1, 0, 0, 1, 2, 1, 0, 0, 0]], \n",
    "        [[13, 18, 17, 8, 4, 44, 5, 31, 1, 1, 40], [1, 0, 1, 1, 0, 1, 2, 1, 0, 0, 0]],\n",
    "        [[23, 18, 4, 15, 23, 5, 50, 52, 2, 5, 4], [1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0]], \n",
    "        [[42, 18, 18, 62, 21, 53, 47, 46, 1, 1, 21], [2, 0, 1, 2, 1, 1, 0, 1, 0, 0, 0]],\n",
    "        [[45, 23, 15, 17, 12, 64, 11, 41, 15, 68, 38], [0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0]], \n",
    "    ]\n",
    "}"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Inverted Computational Complexity Ratio Function"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "BERT_COMPUTATIONAL_COMPLEXITY = 1165824\n",
    "BITS_OPTIONS = [4, 8, 16, 32]\n",
    "\n",
    "def compute_inverted_computational_complexity_ratio(states, bits): \n",
    "    computational_complexity = 0\n",
    "    states_removed = 0\n",
    "    for layer in range(11):\n",
    "        states_removed += states[layer]\n",
    "        computational_complexity += (layer + 1) * (768 - states_removed) * BITS_OPTIONS[bits[layer]]\n",
    "    return BERT_COMPUTATIONAL_COMPLEXITY / computational_complexity "
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Number of Operations (Normalized) & Estimated Inference Time Functions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "NUM_LAYERS_L = 12\n",
    "SEQUENCE_LENGTH_S = 512\n",
    "NUMBER_OF_EXAMPLES = {\"rte\": 3000 + 2490 + 277, \n",
    "                      \"mrpc\": 1725 + 3668 + 408, \n",
    "                      \"stsb\": 1379 + 5749 + 1500, \n",
    "                      \"cola\": 1063 + 8551 + 1043\n",
    "                      } \n",
    "    \n",
    "def self_attention_layer(s, i, k):\n",
    "    return 3*s*i*k/1000000 + 2*(s**2)*k/1000000 + 2*(s**2)/1000000\n",
    "\n",
    "def add_norm_later(s, k): \n",
    "    return (s**2)*k/1000000\n",
    "\n",
    "def feed_forward_layer(s, k, d):\n",
    "    return 2*(2*s*k*d/1000000 + 2*(s**2)*k/1000000)\n",
    "\n",
    "def layer(s, i, k, d):\n",
    "    return self_attention_layer(s, i, k) + \\\n",
    "        add_norm_later(s, k) + \\\n",
    "            feed_forward_layer(s, k, d)\n",
    "\n",
    "def compute_number_of_operations(task, states):\n",
    "    num_hidden_states_k = 768\n",
    "    embedding_size_i = num_hidden_states_k\n",
    "    intermediate_size_d = 4 * num_hidden_states_k \n",
    "    \n",
    "    num_of_example = NUMBER_OF_EXAMPLES[task]\n",
    "    operations = layer(SEQUENCE_LENGTH_S, embedding_size_i, num_hidden_states_k, intermediate_size_d)\n",
    "    \n",
    "    for i in range(NUM_LAYERS_L - 1):\n",
    "        num_hidden_states_k -= states[i]\n",
    "        embedding_size_i = num_hidden_states_k\n",
    "        intermediate_size_d = 4 * num_hidden_states_k \n",
    "        operations += layer(SEQUENCE_LENGTH_S, embedding_size_i, num_hidden_states_k, intermediate_size_d) \n",
    "    operations *= num_of_example\n",
    "    return operations\n",
    "\n",
    "BERT_OPERATIONS = {\"rte\": 494643777.11001617, \"mrpc\": 497560005.3780481, \"stsb\": 740035808.7229443, \"cola\": 914066019.1887363}\n",
    "\n",
    "def compute_number_of_operations_ratio(operations, task):\n",
    "    return round(operations / BERT_OPERATIONS[task], 3)\n",
    "\n",
    "def compute_estimated_inference_time(operations):\n",
    "    return round(operations / 19.5 / 1000000, 1)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Applying the Functions & Obtaining the Results"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "final_table = {\"task\": [], \"inverted computational complexity ratio\": [], \"# of operations ratio\": [], \"est. inference time (s)\": []}\n",
    "\n",
    "for task, lst in data.items():\n",
    "    for pair in lst:\n",
    "        states, bits = pair\n",
    "        final_table[\"task\"].append(task)\n",
    "        final_table[\"inverted computational complexity ratio\"].append(round(compute_inverted_computational_complexity_ratio(states, bits), 2))\n",
    "        operations = compute_number_of_operations(task, states)\n",
    "        final_table[\"# of operations ratio\"].append(compute_number_of_operations_ratio(operations, task))\n",
    "        final_table[\"est. inference time (s)\"].append(compute_estimated_inference_time(operations))\n",
    "        \n",
    "final_df = pd.DataFrame(final_table)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### RTE"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>task</th>\n",
       "      <th>inverted computational complexity ratio</th>\n",
       "      <th># of operations ratio</th>\n",
       "      <th>est. inference time (s)</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>rte</td>\n",
       "      <td>3.38</td>\n",
       "      <td>0.678</td>\n",
       "      <td>17.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>rte</td>\n",
       "      <td>5.02</td>\n",
       "      <td>0.704</td>\n",
       "      <td>17.9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>rte</td>\n",
       "      <td>7.21</td>\n",
       "      <td>0.553</td>\n",
       "      <td>14.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>rte</td>\n",
       "      <td>7.27</td>\n",
       "      <td>0.589</td>\n",
       "      <td>14.9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>rte</td>\n",
       "      <td>7.37</td>\n",
       "      <td>0.606</td>\n",
       "      <td>15.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>rte</td>\n",
       "      <td>7.64</td>\n",
       "      <td>0.475</td>\n",
       "      <td>12.1</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "  task  inverted computational complexity ratio  # of operations ratio  \\\n",
       "4  rte                                     3.38                  0.678   \n",
       "2  rte                                     5.02                  0.704   \n",
       "3  rte                                     7.21                  0.553   \n",
       "1  rte                                     7.27                  0.589   \n",
       "0  rte                                     7.37                  0.606   \n",
       "5  rte                                     7.64                  0.475   \n",
       "\n",
       "   est. inference time (s)  \n",
       "4                     17.2  \n",
       "2                     17.9  \n",
       "3                     14.0  \n",
       "1                     14.9  \n",
       "0                     15.4  \n",
       "5                     12.1  "
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "rte_df = final_df[final_df['task'] == 'rte']\n",
    "sorted_rte_df = rte_df.sort_values(by='inverted computational complexity ratio')\n",
    "\n",
    "sorted_rte_df"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### MRPC"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>task</th>\n",
       "      <th>inverted computational complexity ratio</th>\n",
       "      <th># of operations ratio</th>\n",
       "      <th>est. inference time (s)</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>mrpc</td>\n",
       "      <td>3.58</td>\n",
       "      <td>0.847</td>\n",
       "      <td>21.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>mrpc</td>\n",
       "      <td>3.67</td>\n",
       "      <td>0.755</td>\n",
       "      <td>19.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>mrpc</td>\n",
       "      <td>3.73</td>\n",
       "      <td>0.682</td>\n",
       "      <td>17.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>mrpc</td>\n",
       "      <td>4.18</td>\n",
       "      <td>0.622</td>\n",
       "      <td>15.9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>mrpc</td>\n",
       "      <td>4.54</td>\n",
       "      <td>0.709</td>\n",
       "      <td>18.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>mrpc</td>\n",
       "      <td>5.01</td>\n",
       "      <td>0.754</td>\n",
       "      <td>19.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>mrpc</td>\n",
       "      <td>5.83</td>\n",
       "      <td>0.669</td>\n",
       "      <td>17.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>mrpc</td>\n",
       "      <td>7.33</td>\n",
       "      <td>0.559</td>\n",
       "      <td>14.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>mrpc</td>\n",
       "      <td>7.54</td>\n",
       "      <td>0.589</td>\n",
       "      <td>15.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>mrpc</td>\n",
       "      <td>8.53</td>\n",
       "      <td>0.586</td>\n",
       "      <td>15.0</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    task  inverted computational complexity ratio  # of operations ratio  \\\n",
       "6   mrpc                                     3.58                  0.847   \n",
       "7   mrpc                                     3.67                  0.755   \n",
       "12  mrpc                                     3.73                  0.682   \n",
       "11  mrpc                                     4.18                  0.622   \n",
       "10  mrpc                                     4.54                  0.709   \n",
       "8   mrpc                                     5.01                  0.754   \n",
       "9   mrpc                                     5.83                  0.669   \n",
       "15  mrpc                                     7.33                  0.559   \n",
       "14  mrpc                                     7.54                  0.589   \n",
       "13  mrpc                                     8.53                  0.586   \n",
       "\n",
       "    est. inference time (s)  \n",
       "6                      21.6  \n",
       "7                      19.3  \n",
       "12                     17.4  \n",
       "11                     15.9  \n",
       "10                     18.1  \n",
       "8                      19.2  \n",
       "9                      17.1  \n",
       "15                     14.3  \n",
       "14                     15.0  \n",
       "13                     15.0  "
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "mrpc_df = final_df[final_df['task'] == 'mrpc']\n",
    "sorted_mrpc_df = mrpc_df.sort_values(by='inverted computational complexity ratio')\n",
    "\n",
    "sorted_mrpc_df"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### STSB"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>task</th>\n",
       "      <th>inverted computational complexity ratio</th>\n",
       "      <th># of operations ratio</th>\n",
       "      <th>est. inference time (s)</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>stsb</td>\n",
       "      <td>2.47</td>\n",
       "      <td>0.633</td>\n",
       "      <td>24.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>stsb</td>\n",
       "      <td>3.57</td>\n",
       "      <td>0.690</td>\n",
       "      <td>26.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>stsb</td>\n",
       "      <td>3.96</td>\n",
       "      <td>0.771</td>\n",
       "      <td>29.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>stsb</td>\n",
       "      <td>5.05</td>\n",
       "      <td>0.682</td>\n",
       "      <td>25.9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>stsb</td>\n",
       "      <td>5.15</td>\n",
       "      <td>0.645</td>\n",
       "      <td>24.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>stsb</td>\n",
       "      <td>5.25</td>\n",
       "      <td>0.661</td>\n",
       "      <td>25.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>stsb</td>\n",
       "      <td>5.51</td>\n",
       "      <td>0.612</td>\n",
       "      <td>23.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>stsb</td>\n",
       "      <td>6.97</td>\n",
       "      <td>0.651</td>\n",
       "      <td>24.7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>stsb</td>\n",
       "      <td>8.49</td>\n",
       "      <td>0.577</td>\n",
       "      <td>21.9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>stsb</td>\n",
       "      <td>8.67</td>\n",
       "      <td>0.637</td>\n",
       "      <td>24.2</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    task  inverted computational complexity ratio  # of operations ratio  \\\n",
       "23  stsb                                     2.47                  0.633   \n",
       "25  stsb                                     3.57                  0.690   \n",
       "19  stsb                                     3.96                  0.771   \n",
       "18  stsb                                     5.05                  0.682   \n",
       "17  stsb                                     5.15                  0.645   \n",
       "24  stsb                                     5.25                  0.661   \n",
       "21  stsb                                     5.51                  0.612   \n",
       "16  stsb                                     6.97                  0.651   \n",
       "22  stsb                                     8.49                  0.577   \n",
       "20  stsb                                     8.67                  0.637   \n",
       "\n",
       "    est. inference time (s)  \n",
       "23                     24.0  \n",
       "25                     26.2  \n",
       "19                     29.3  \n",
       "18                     25.9  \n",
       "17                     24.5  \n",
       "24                     25.1  \n",
       "21                     23.2  \n",
       "16                     24.7  \n",
       "22                     21.9  \n",
       "20                     24.2  "
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# stsb\n",
    "\n",
    "stsb_df = final_df[final_df['task'] == 'stsb']\n",
    "sorted_stsb_df = stsb_df.sort_values(by='inverted computational complexity ratio')\n",
    "\n",
    "sorted_stsb_df"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### CoLA"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>task</th>\n",
       "      <th>inverted computational complexity ratio</th>\n",
       "      <th># of operations ratio</th>\n",
       "      <th>est. inference time (s)</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>cola</td>\n",
       "      <td>3.79</td>\n",
       "      <td>0.828</td>\n",
       "      <td>38.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>cola</td>\n",
       "      <td>4.08</td>\n",
       "      <td>0.814</td>\n",
       "      <td>38.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>cola</td>\n",
       "      <td>4.12</td>\n",
       "      <td>0.784</td>\n",
       "      <td>36.7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>cola</td>\n",
       "      <td>4.22</td>\n",
       "      <td>0.822</td>\n",
       "      <td>38.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>cola</td>\n",
       "      <td>4.39</td>\n",
       "      <td>0.678</td>\n",
       "      <td>31.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>cola</td>\n",
       "      <td>5.00</td>\n",
       "      <td>0.677</td>\n",
       "      <td>31.7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>cola</td>\n",
       "      <td>5.17</td>\n",
       "      <td>0.776</td>\n",
       "      <td>36.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>cola</td>\n",
       "      <td>5.18</td>\n",
       "      <td>0.741</td>\n",
       "      <td>34.7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>cola</td>\n",
       "      <td>5.23</td>\n",
       "      <td>0.632</td>\n",
       "      <td>29.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>cola</td>\n",
       "      <td>5.35</td>\n",
       "      <td>0.761</td>\n",
       "      <td>35.7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>cola</td>\n",
       "      <td>5.89</td>\n",
       "      <td>0.693</td>\n",
       "      <td>32.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>cola</td>\n",
       "      <td>6.42</td>\n",
       "      <td>0.677</td>\n",
       "      <td>31.7</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    task  inverted computational complexity ratio  # of operations ratio  \\\n",
       "28  cola                                     3.79                  0.828   \n",
       "34  cola                                     4.08                  0.814   \n",
       "27  cola                                     4.12                  0.784   \n",
       "33  cola                                     4.22                  0.822   \n",
       "31  cola                                     4.39                  0.678   \n",
       "32  cola                                     5.00                  0.677   \n",
       "35  cola                                     5.17                  0.776   \n",
       "26  cola                                     5.18                  0.741   \n",
       "36  cola                                     5.23                  0.632   \n",
       "29  cola                                     5.35                  0.761   \n",
       "30  cola                                     5.89                  0.693   \n",
       "37  cola                                     6.42                  0.677   \n",
       "\n",
       "    est. inference time (s)  \n",
       "28                     38.8  \n",
       "34                     38.1  \n",
       "27                     36.7  \n",
       "33                     38.5  \n",
       "31                     31.8  \n",
       "32                     31.7  \n",
       "35                     36.4  \n",
       "26                     34.7  \n",
       "36                     29.6  \n",
       "29                     35.7  \n",
       "30                     32.5  \n",
       "37                     31.7  "
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "cola_df = final_df[final_df['task'] == 'cola']\n",
    "sorted_cola_df = cola_df.sort_values(by='inverted computational complexity ratio')\n",
    "\n",
    "sorted_cola_df"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
