{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Index(['layer_idx', 'layer_name', 'compression_ratio', 'length', 'weights'], dtype='object')\n",
      "   layer_idx layer_name  compression_ratio  length\n",
      "0          0     q_proj           0.035318    4096\n",
      "1          0     k_proj           0.032586    4096\n",
      "2          0     v_proj           0.136755    4096\n",
      "3          0     o_proj           0.195188    4096\n",
      "4          0  gate_proj           0.465770    4096\n",
      "5          0    up_proj           0.464270    4096\n",
      "6          0  down_proj           0.661998    4096\n",
      "7          1     q_proj           0.119843    4096\n",
      "8          1     k_proj           0.120274    4096\n",
      "9          1     v_proj           0.423415    4096\n"
     ]
    }
   ],
   "source": [
    "import json \n",
    "import pandas as pd\n",
    "import torch\n",
    "import numpy as np\n",
    "\n",
    "exp_name = \"eval_thresh.json\"\n",
    "\n",
    "with open(f'data/{exp_name}') as f:\n",
    "    compression_stats = json.load(f) \n",
    "\n",
    "df = pd.read_json(f'data/{exp_name}')\n",
    "\n",
    "print(df.columns)\n",
    "print(df[['layer_idx', 'layer_name', 'compression_ratio', 'length']].head(10).to_string())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Mean Compression Ratio by Layer Index:\n"
     ]
    }
   ],
   "source": [
    "import pandas as pd\n",
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns \n",
    "import matplotlib.colors as mcolors\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "\n",
    "sns.set_theme(style=\"whitegrid\")\n",
    "\n",
    "# 1. Convert layer_idx # 1. Convert layer_idx column to an integer from string\n",
    "df['layer_idx'] = df['layer_idx'].astype(int)\n",
    "\n",
    "# 2. Group by layer_idx and print the mean compression ratio\n",
    "mean_compression_ratio = df.groupby('layer_idx')['compression_ratio'].mean()\n",
    "def sigmoid(x):\n",
    "    return 1 / (1 + np.exp(-x))\n",
    "\n",
    "df['sigmoid_weights'] = df['weights'].apply(lambda x: sigmoid(np.array(x)))\n",
    "\n",
    "print(\"Mean Compression Ratio by Layer Index:\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'0': {'q_proj': 133,\n",
       "  'k_proj': 128,\n",
       "  'v_proj': 500,\n",
       "  'o_proj': 773,\n",
       "  'gate_proj': 2049,\n",
       "  'up_proj': 2001,\n",
       "  'down_proj': 2818},\n",
       " '1': {'q_proj': 470,\n",
       "  'k_proj': 470,\n",
       "  'v_proj': 1743,\n",
       "  'o_proj': 1474,\n",
       "  'gate_proj': 2687,\n",
       "  'up_proj': 2891},\n",
       " '2': {'q_proj': 963, 'k_proj': 992},\n",
       " '3': {'q_proj': 1269, 'k_proj': 1198},\n",
       " '4': {'q_proj': 1047, 'k_proj': 1085},\n",
       " '5': {'q_proj': 1096, 'k_proj': 1032},\n",
       " '6': {'q_proj': 1061, 'k_proj': 1147},\n",
       " '7': {'q_proj': 1036, 'k_proj': 1052},\n",
       " '8': {'q_proj': 1012, 'k_proj': 1024},\n",
       " '9': {'q_proj': 1081, 'k_proj': 1085},\n",
       " '10': {'q_proj': 974, 'k_proj': 984},\n",
       " '11': {'q_proj': 1039, 'k_proj': 1099},\n",
       " '12': {'q_proj': 1032, 'k_proj': 970},\n",
       " '13': {'q_proj': 1000, 'k_proj': 981},\n",
       " '14': {'q_proj': 949, 'k_proj': 972},\n",
       " '15': {'q_proj': 1085, 'k_proj': 1083},\n",
       " '16': {'q_proj': 1040, 'k_proj': 803},\n",
       " '17': {'q_proj': 1129, 'k_proj': 1056},\n",
       " '18': {'q_proj': 1027, 'k_proj': 988},\n",
       " '19': {'q_proj': 1248, 'k_proj': 1056},\n",
       " '20': {'q_proj': 1017, 'k_proj': 881},\n",
       " '21': {'q_proj': 1096, 'k_proj': 979, 'v_proj': 1955},\n",
       " '22': {'q_proj': 1127, 'k_proj': 1138},\n",
       " '23': {'q_proj': 1185, 'k_proj': 1035},\n",
       " '24': {'q_proj': 910, 'k_proj': 849},\n",
       " '25': {'q_proj': 1136, 'k_proj': 1001},\n",
       " '26': {'q_proj': 908, 'k_proj': 911},\n",
       " '27': {'q_proj': 1295, 'k_proj': 1149},\n",
       " '28': {'q_proj': 1210, 'k_proj': 1319},\n",
       " '29': {'q_proj': 783, 'k_proj': 751},\n",
       " '30': {'q_proj': 1305, 'k_proj': 1220, 'o_proj': 1958},\n",
       " '31': {'q_proj': 792, 'k_proj': 880, 'o_proj': 1758}}"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "def get_mapping_dict(compression_stats):\n",
    "    def sigmoid(x):\n",
    "        return 1 / (1 + np.exp(-x))\n",
    "\n",
    "    df = pd.DataFrame(compression_stats)\n",
    "    df['sigmoid_weights'] = df['weights'].apply(lambda x: sigmoid(np.array(x)))\n",
    "    df['topk'] = df['sigmoid_weights'].apply(lambda x: (x > 0.50).sum())\n",
    "\n",
    "    mapping = {}\n",
    "    for _, row in df.iterrows():\n",
    "        if row['layer_name'] in ['q_proj', 'k_proj', 'v_proj', 'o_proj']:\n",
    "            m = n = 4096\n",
    "        else:\n",
    "            m = 4096\n",
    "            n = 11008\n",
    "\n",
    "        compression_rate = row['topk'] * (m + n) / (m * n)\n",
    "        if compression_rate > 0.97:\n",
    "            continue \n",
    "\n",
    "        if row['layer_idx'] not in mapping: \n",
    "            mapping[row['layer_idx']] = {} \n",
    "\n",
    "        mapping[row['layer_idx']][row['layer_name']] = row['topk']\n",
    "\n",
    "    return mapping \n",
    "\n",
    "get_mapping_dict(compression_stats)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "\n",
    "def detect_boundary_vectorized(L, window_size=20, threshold=0.30):\n",
    "    if isinstance(L, list):\n",
    "        L = torch.FloatTensor(L)\n",
    "    elif isinstance(L, np.ndarray):\n",
    "        L = torch.from_numpy(L)\n",
    "        \n",
    "    N = len(L)\n",
    "    if window_size > N:\n",
    "        raise ValueError(\"Window size must be less than or equal to the length of the vector\")\n",
    "    \n",
    "    # Calculate cumulative sum\n",
    "    cumsum = torch.cumsum(L, dim=0)\n",
    "    \n",
    "    # Calculate moving average\n",
    "    moving_avg = (cumsum[window_size:] - cumsum[:-window_size]) / window_size\n",
    "    \n",
    "    # Find the first index where moving average is below threshold\n",
    "    below_threshold = (moving_avg < threshold).nonzero(as_tuple=True)[0]\n",
    "    \n",
    "    return below_threshold[0].item() if len(below_threshold) > 0 else N\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 41,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Mean topk compression: 0.8544524943709769\n"
     ]
    }
   ],
   "source": [
    "from functools import partial\n",
    "\n",
    "transf = partial(detect_boundary_vectorized, window_size=30, threshold=0.30)\n",
    "df['topk'] = df['sigmoid_weights'].apply(lambda x: detect_boundary_vectorized(x, window_size=30, threshold=0.30))\n",
    "\n",
    "compression_rates = []\n",
    "mapping = {}\n",
    "for idx, row in df.iterrows():\n",
    "    if row['layer_name'] in ['q_proj', 'k_proj', 'v_proj', 'o_proj']:\n",
    "        m = n = 4096\n",
    "    else:\n",
    "        m = 4096\n",
    "        n = 11008\n",
    "\n",
    "    compression_rate = row['topk'] * (m + n) / (m * n)\n",
    "    if compression_rate > 0.96:\n",
    "        compression_rate = 1. \n",
    "\n",
    "    compression_rates.append(compression_rate)\n",
    "    if row['layer_idx'] not in mapping: \n",
    "        mapping[row['layer_idx']] = {} \n",
    "\n",
    "    mapping[row['layer_idx']][row['layer_name']] = row['topk']\n",
    "\n",
    "df['topk_compression'] = compression_rates\n",
    "subdf = df[['layer_name', 'layer_idx', 'topk', 'topk_compression']]\n",
    "print('Mean topk compression:', subdf.topk_compression.mean())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 48,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "\n",
    "with open('data/mapping_tv.json', 'w') as f:\n",
    "    json.dump(mapping, f)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "mlp",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.18"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
