{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "677b961b-0971-43a7-9f9c-c8cdc7487864",
   "metadata": {},
   "source": [
    "# Pythia-410M transcoder-vs.-SAE interpretability challenge!"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "41bb7b5f-31e7-47bd-80d0-617c66174cb5",
   "metadata": {},
   "outputs": [],
   "source": [
    "from transcoder_circuits.circuit_analysis import *\n",
    "from transcoder_circuits.feature_dashboards import *\n",
    "from transcoder_circuits.replacement_ctx import *"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "989bda79-57c3-477c-98cf-0994db1e90f6",
   "metadata": {},
   "source": [
    "Now, import the SAE/transcoder code, along with the model that we'll be analyzing (GPT2-small)."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "b3e4c6bf-2f7a-4420-a0c8-dae13b0a723f",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Special tokens have been added in the vocabulary, make sure the associated word embeddings are fine-tuned or trained.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Loaded pretrained model pythia-410m into HookedTransformer\n"
     ]
    }
   ],
   "source": [
    "from sae_training.sparse_autoencoder import SparseAutoencoder\n",
    "from transformer_lens import HookedTransformer, utils\n",
    "import os\n",
    "import torch\n",
    "\n",
    "model = HookedTransformer.from_pretrained('pythia-410m')"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "412c64ef-d644-49d4-9695-6d97dbe64ed4",
   "metadata": {
    "id": "N3D_0qDmBY5K"
   },
   "source": [
    "Now, load in a corpus of text that we'll use for our analysis. We'll be drawing from OpenWebText, which is similar to the dataset on which GPT2-small was trained."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "c0d05463-ccc7-4c0b-97f0-618df0ea4498",
   "metadata": {
    "jupyter": {
     "source_hidden": true
    }
   },
   "outputs": [],
   "source": [
    "# This function was stolen from one of Neel Nanda's exploratory notebooks\n",
    "# Thanks, Neel!\n",
    "import einops\n",
    "def tokenize_and_concatenate(\n",
    "    dataset,\n",
    "    tokenizer,\n",
    "    streaming = False,\n",
    "    max_length = 1024,\n",
    "    column_name = \"text\",\n",
    "    add_bos_token = True,\n",
    "):\n",
    "    \"\"\"Helper function to tokenizer and concatenate a dataset of text. This converts the text to tokens, concatenates them (separated by EOS tokens) and then reshapes them into a 2D array of shape (____, sequence_length), dropping the last batch. Tokenizers are much faster if parallelised, so we chop the string into 20, feed it into the tokenizer, in parallel with padding, then remove padding at the end.\n",
    "\n",
    "    This tokenization is useful for training language models, as it allows us to efficiently train on a large corpus of text of varying lengths (without, eg, a lot of truncation or padding). Further, for models with absolute positional encodings, this avoids privileging early tokens (eg, news articles often begin with CNN, and models may learn to use early positional encodings to predict these)\n",
    "\n",
    "    Args:\n",
    "        dataset (Dataset): The dataset to tokenize, assumed to be a HuggingFace text dataset.\n",
    "        tokenizer (AutoTokenizer): The tokenizer. Assumed to have a bos_token_id and an eos_token_id.\n",
    "        streaming (bool, optional): Whether the dataset is being streamed. If True, avoids using parallelism. Defaults to False.\n",
    "        max_length (int, optional): The length of the context window of the sequence. Defaults to 1024.\n",
    "        column_name (str, optional): The name of the text column in the dataset. Defaults to 'text'.\n",
    "        add_bos_token (bool, optional): . Defaults to True.\n",
    "\n",
    "    Returns:\n",
    "        Dataset: Returns the tokenized dataset, as a dataset of tensors, with a single column called \"tokens\"\n",
    "\n",
    "    Note: There is a bug when inputting very small datasets (eg, <1 batch per process) where it just outputs nothing. I'm not super sure why\n",
    "    \"\"\"\n",
    "    for key in dataset.features:\n",
    "        if key != column_name:\n",
    "            dataset = dataset.remove_columns(key)\n",
    "\n",
    "    if tokenizer.pad_token is None:\n",
    "        # We add a padding token, purely to implement the tokenizer. This will be removed before inputting tokens to the model, so we do not need to increment d_vocab in the model.\n",
    "        tokenizer.add_special_tokens({\"pad_token\": \"<PAD>\"})\n",
    "    # Define the length to chop things up into - leaving space for a bos_token if required\n",
    "    if add_bos_token:\n",
    "        seq_len = max_length - 1\n",
    "    else:\n",
    "        seq_len = max_length\n",
    "\n",
    "    def tokenize_function(examples):\n",
    "        text = examples[column_name]\n",
    "        # Concatenate it all into an enormous string, separated by eos_tokens\n",
    "        full_text = tokenizer.eos_token.join(text)\n",
    "        # Divide into 20 chunks of ~ equal length\n",
    "        num_chunks = 20\n",
    "        chunk_length = (len(full_text) - 1) // num_chunks + 1\n",
    "        chunks = [\n",
    "            full_text[i * chunk_length : (i + 1) * chunk_length]\n",
    "            for i in range(num_chunks)\n",
    "        ]\n",
    "        # Tokenize the chunks in parallel. Uses NumPy because HuggingFace map doesn't want tensors returned\n",
    "        tokens = tokenizer(chunks, return_tensors=\"np\", padding=True)[\n",
    "            \"input_ids\"\n",
    "        ].flatten()\n",
    "        # Drop padding tokens\n",
    "        tokens = tokens[tokens != tokenizer.pad_token_id]\n",
    "        num_tokens = len(tokens)\n",
    "        num_batches = num_tokens // (seq_len)\n",
    "        # Drop the final tokens if not enough to make a full sequence\n",
    "        tokens = tokens[: seq_len * num_batches]\n",
    "        tokens = einops.rearrange(\n",
    "            tokens, \"(batch seq) -> batch seq\", batch=num_batches, seq=seq_len\n",
    "        )\n",
    "        if add_bos_token:\n",
    "            prefix = np.full((num_batches, 1), tokenizer.bos_token_id)\n",
    "            tokens = np.concatenate([prefix, tokens], axis=1)\n",
    "        return {\"tokens\": tokens}\n",
    "\n",
    "    tokenized_dataset = dataset.map(\n",
    "        tokenize_function,\n",
    "        batched=True,\n",
    "        remove_columns=[column_name],\n",
    "    )\n",
    "    #tokenized_dataset.set_format(type=\"torch\", columns=[\"tokens\"])\n",
    "    return tokenized_dataset\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "566356a8-ff08-4fce-857e-065245f70dd6",
   "metadata": {},
   "outputs": [],
   "source": [
    "from datasets import load_dataset\n",
    "from huggingface_hub import HfApi\n",
    "import numpy as np\n",
    "\n",
    "dataset = load_dataset('Skylion007/openwebtext', split='train', streaming=True)\n",
    "dataset = dataset.shuffle(seed=42, buffer_size=10_000)\n",
    "tokenized_owt = tokenize_and_concatenate(dataset, model.tokenizer, max_length=128, streaming=True)\n",
    "tokenized_owt = tokenized_owt.shuffle(42)\n",
    "tokenized_owt = tokenized_owt.take(12800*2)\n",
    "owt_tokens = np.stack([x['tokens'] for x in tokenized_owt])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "9015ff5e-b158-47c9-874a-850f5fa41700",
   "metadata": {},
   "outputs": [],
   "source": [
    "owt_tokens_torch = torch.from_numpy(owt_tokens).cuda()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "8c04591d-2d89-4f9f-8ff8-53cb21b8022a",
   "metadata": {},
   "source": [
    "# Load transcoder and SAEs"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "ceee9c39-f092-47c3-a5b8-bed038158906",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pickle"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "263847f2-be18-41d2-84e5-66e5ef6144b6",
   "metadata": {},
   "outputs": [],
   "source": [
    "transcoder_template = \"pythia-transcoders/lr_0.0002_l1_5.5e-05/szsvunrm/final_sparse_autoencoder_pythia-410m_blocks.15.ln2.hook_normalized_32768\"\n",
    "transcoder = SparseAutoencoder.load_from_pretrained(f\"{transcoder_template}.pt\").eval()\n",
    "with open(f\"{transcoder_template}_log_feature_sparsity.pt\", \"rb\") as fp:\n",
    "    tc_sparsity = pickle.load(fp)\n",
    "tc_freqs = tc_sparsity['freqs']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "43706dae-4a5c-4896-90d5-ad216f24e3d9",
   "metadata": {},
   "outputs": [],
   "source": [
    "sae_template = \"./pythia-saes/l1_7e-05/olr1w3lx/final_sparse_autoencoder_pythia-410m_blocks.15.ln2.hook_normalized_32768\"\n",
    "sae = SparseAutoencoder.load_from_pretrained(f\"{sae_template}.pt\").eval()\n",
    "with open(f\"{sae_template}_log_feature_sparsity.pt\", \"rb\") as fp:\n",
    "    sae_sparsity = pickle.load(fp)\n",
    "sae_freqs = sae_sparsity['freqs']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "ae6b83d2-3ea6-42dd-bc74-953ca44bfedb",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAjoAAAGiCAYAAADulWxzAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/bCgiHAAAACXBIWXMAAA9hAAAPYQGoP6dpAAAwSklEQVR4nO3df1jVdZ7//8cR5YQMvAc8Awc2NLc11sItw1lEZ0vLQEZkSjdrcM/mjuE0llxewtVG7SZzXWO2qdm1eVWu62gZRddcZjXpdUZc+8WIP8KhCTXHGg00EEs4Rxg7EL4/f8y397cjVqIQ8uJ+u673Fe/X6/l+n9eL49V5+Hq/3x6Xbdu2AAAADDSorwcAAADQWwg6AADAWAQdAABgLIIOAAAwFkEHAAAYi6ADAACMRdABAADGIugAAABjEXQAAICxCDoAAMBY3Qo6S5cu1Q9/+EPFxMQoISFBt956qw4ePBhWY9u2SktLlZycrKioKE2aNEn79u0LqwmFQlqwYIE8Ho+io6OVl5eno0ePhtU0NzfL5/PJsixZliWfz6eWlpawmrq6Ok2fPl3R0dHyeDwqLCxUe3t7d6YEAAAM1q2g89Zbb+nee+/Vzp07VVFRoS+++EJZWVlqa2tzah577DE9/vjjWrVqlfbs2SOv16tbbrlFp06dcmoWLlyoTZs2qby8XJWVlWptbVVubq46Ozudmvz8fNXU1Mjv98vv96umpkY+n8/p7+zs1LRp09TW1qbKykqVl5dr48aNKioqupjfBwAAMIl9EZqammxJ9ltvvWXbtm2fOXPG9nq99qOPPurUfP7557ZlWfYzzzxj27Ztt7S02EOGDLHLy8udmmPHjtmDBg2y/X6/bdu2vX//fluSvXPnTqemqqrKlmR/8MEHtm3b9pYtW+xBgwbZx44dc2pefPFF2+1224FA4GKmBQAADDH4YkJSIBCQJMXHx0uSDh8+rMbGRmVlZTk1brdbN954o3bs2KGf//znqq6uVkdHR1hNcnKy0tLStGPHDmVnZ6uqqkqWZSkjI8OpGT9+vCzL0o4dO5SamqqqqiqlpaUpOTnZqcnOzlYoFFJ1dbUmT57cZbyhUEihUMjZP3PmjE6ePKlhw4bJ5XJdzK8CAAB8R2zb1qlTp5ScnKxBg7754tQFBx3btrVo0SL96Ec/UlpamiSpsbFRkpSYmBhWm5iYqI8//tipiYyMVFxcXJeaL49vbGxUQkJCl9dMSEgIqzn7deLi4hQZGenUnG3p0qX65S9/2d2pAgCAS1B9fb0uv/zyb6y54KBz33336Y9//KMqKyu79J29OmLb9reumJxdc676C6n5qpKSEi1atMjZDwQCGj58uOrr6xUbG/uN4wMAAJeGYDColJQUxcTEfGvtBQWdBQsW6LXXXtPbb78dlqS8Xq+kv662JCUlOe1NTU3O6ovX61V7e7uam5vDVnWampo0YcIEp+b48eNdXvfEiRNh59m1a1dYf3Nzszo6Orqs9HzJ7XbL7XZ3aY+NjSXoAADQz5zPbSfdeurKtm3dd999evnll7V9+3aNHDkyrH/kyJHyer2qqKhw2trb2/XWW285ISY9PV1DhgwJq2loaFBtba1Tk5mZqUAgoN27dzs1u3btUiAQCKupra1VQ0ODU7N161a53W6lp6d3Z1oAAMBQLtu27fMtnj9/vl544QW9+uqrSk1Nddoty1JUVJQk6b/+67+0dOlSrVu3TqNGjdIjjzyiN998UwcPHnSWmH7xi1/o9ddf1/r16xUfH6/i4mJ99tlnqq6uVkREhCQpJydHn3zyiVavXi1JmjdvnkaMGKHf/va3kv76ePl1112nxMRELVu2TCdPntScOXN066236sknnzyv+QSDQVmWpUAgwIoOAAD9RLc+v7vziJakc27r1q1zas6cOWMvXrzY9nq9ttvttm+44Qb7/fffDzvP6dOn7fvuu8+Oj4+3o6Ki7NzcXLuuri6s5rPPPrNnz55tx8TE2DExMfbs2bPt5ubmsJqPP/7YnjZtmh0VFWXHx8fb9913n/3555+f93wCgYAticfRAQDoR7rz+d2tFR3TsKIDAED/053Pb77rCgAAGIugAwAAjEXQAQAAxiLoAAAAYxF0AACAsQg6AADAWAQdAABgLIIOAAAwFkEHAAAYi6ADAACMNbivB2CyKx7YHLZ/5NFpfTQSAAAGJlZ0AACAsQg6AADAWAQdAABgLIIOAAAwFkEHAAAYi6ADAACMRdABAADGIugAAABjEXQAAICxCDoAAMBYBB0AAGAsgg4AADAWQQcAABiLoAMAAIxF0AEAAMYi6AAAAGMRdAAAgLEIOgAAwFgEHQAAYCyCDgAAMBZBBwAAGIugAwAAjEXQAQAAxiLoAAAAY3U76Lz99tuaPn26kpOT5XK59Morr4T1u1yuc27Lli1zaiZNmtSl/8477ww7T3Nzs3w+nyzLkmVZ8vl8amlpCaupq6vT9OnTFR0dLY/Ho8LCQrW3t3d3SgAAwFDdDjptbW269tprtWrVqnP2NzQ0hG2//vWv5XK5NHPmzLC6goKCsLrVq1eH9efn56umpkZ+v19+v181NTXy+XxOf2dnp6ZNm6a2tjZVVlaqvLxcGzduVFFRUXenBAAADDW4uwfk5OQoJyfna/u9Xm/Y/quvvqrJkyfrb//2b8Pahw4d2qX2SwcOHJDf79fOnTuVkZEhSVqzZo0yMzN18OBBpaamauvWrdq/f7/q6+uVnJwsSVqxYoXmzJmjJUuWKDY2trtTAwAAhunVe3SOHz+uzZs3a+7cuV36ysrK5PF4dM0116i4uFinTp1y+qqqqmRZlhNyJGn8+PGyLEs7duxwatLS0pyQI0nZ2dkKhUKqrq4+53hCoZCCwWDYBgAAzNXtFZ3uePbZZxUTE6MZM2aEtc+ePVsjR46U1+tVbW2tSkpK9N5776miokKS1NjYqISEhC7nS0hIUGNjo1OTmJgY1h8XF6fIyEin5mxLly7VL3/5y56YGgAA6Ad6Nej8+te/1uzZs3XZZZeFtRcUFDg/p6WladSoURo3bpz27t2r66+/XtJfb2o+m23bYe3nU/NVJSUlWrRokbMfDAaVkpLSvUkBAIB+o9cuXb3zzjs6ePCg7r777m+tvf766zVkyBAdOnRI0l/v8zl+/HiXuhMnTjirOF6vt8vKTXNzszo6Orqs9HzJ7XYrNjY2bAMAAObqtaCzdu1apaen69prr/3W2n379qmjo0NJSUmSpMzMTAUCAe3evdup2bVrlwKBgCZMmODU1NbWqqGhwanZunWr3G630tPTe3g2AACgP+r2pavW1lZ9+OGHzv7hw4dVU1Oj+Ph4DR8+XNJfLwn95je/0YoVK7oc/9FHH6msrEw//vGP5fF4tH//fhUVFWns2LGaOHGiJGn06NGaOnWqCgoKnMfO582bp9zcXKWmpkqSsrKydPXVV8vn82nZsmU6efKkiouLVVBQwEoNAACQdAErOu+++67Gjh2rsWPHSpIWLVqksWPH6uGHH3ZqysvLZdu2fvrTn3Y5PjIyUv/3f/+n7OxspaamqrCwUFlZWdq2bZsiIiKcurKyMo0ZM0ZZWVnKysrSP/zDP2jDhg1Of0REhDZv3qzLLrtMEydO1KxZs3Trrbdq+fLl3Z0SAAAwlMu2bbuvB9FXgsGgLMtSIBDolVWgKx7YHLZ/5NFpPf4aAAAMNN35/Oa7rgAAgLEIOgAAwFgEHQAAYCyCDgAAMBZBBwAAGIugAwAAjEXQAQAAxiLoAAAAY/Xqt5cPdEcuyz+rJdAn4wAAYKBiRQcAABiLoAMAAIxF0AEAAMYi6AAAAGMRdAAAgLEIOgAAwFgEHQAAYCyCDgAAMBZBBwAAGIugAwAAjEXQAQAAxiLoAAAAYxF0AACAsQg6AADAWAQdAABgLIIOAAAwFkEHAAAYi6ADAACMRdABAADGIugAAABjEXQAAICxCDoAAMBYBB0AAGAsgg4AADAWQQcAABiLoAMAAIzV7aDz9ttva/r06UpOTpbL5dIrr7wS1j9nzhy5XK6wbfz48WE1oVBICxYskMfjUXR0tPLy8nT06NGwmubmZvl8PlmWJcuy5PP51NLSElZTV1en6dOnKzo6Wh6PR4WFhWpvb+/ulAAAgKG6HXTa2tp07bXXatWqVV9bM3XqVDU0NDjbli1bwvoXLlyoTZs2qby8XJWVlWptbVVubq46Ozudmvz8fNXU1Mjv98vv96umpkY+n8/p7+zs1LRp09TW1qbKykqVl5dr48aNKioq6u6UAACAoQZ394CcnBzl5OR8Y43b7ZbX6z1nXyAQ0Nq1a7VhwwZNmTJFkvT8888rJSVF27ZtU3Z2tg4cOCC/36+dO3cqIyNDkrRmzRplZmbq4MGDSk1N1datW7V//37V19crOTlZkrRixQrNmTNHS5YsUWxsbHenBgAADNMr9+i8+eabSkhI0FVXXaWCggI1NTU5fdXV1ero6FBWVpbTlpycrLS0NO3YsUOSVFVVJcuynJAjSePHj5dlWWE1aWlpTsiRpOzsbIVCIVVXV59zXKFQSMFgMGwDAADm6vGgk5OTo7KyMm3fvl0rVqzQnj17dNNNNykUCkmSGhsbFRkZqbi4uLDjEhMT1djY6NQkJCR0OXdCQkJYTWJiYlh/XFycIiMjnZqzLV261Lnnx7IspaSkXPR8AQDApavbl66+zR133OH8nJaWpnHjxmnEiBHavHmzZsyY8bXH2bYtl8vl7H/154up+aqSkhItWrTI2Q8Gg4QdAAAM1uuPlyclJWnEiBE6dOiQJMnr9aq9vV3Nzc1hdU1NTc4Kjdfr1fHjx7uc68SJE2E1Z6/cNDc3q6Ojo8tKz5fcbrdiY2PDNgAAYK5eDzqfffaZ6uvrlZSUJElKT0/XkCFDVFFR4dQ0NDSotrZWEyZMkCRlZmYqEAho9+7dTs2uXbsUCATCampra9XQ0ODUbN26VW63W+np6b09LQAA0A90+9JVa2urPvzwQ2f/8OHDqqmpUXx8vOLj41VaWqqZM2cqKSlJR44c0YMPPiiPx6PbbrtNkmRZlubOnauioiINGzZM8fHxKi4u1pgxY5ynsEaPHq2pU6eqoKBAq1evliTNmzdPubm5Sk1NlSRlZWXp6quvls/n07Jly3Ty5EkVFxeroKCAlRoAACDpAoLOu+++q8mTJzv7X97zctddd+npp5/W+++/r+eee04tLS1KSkrS5MmT9dJLLykmJsY5ZuXKlRo8eLBmzZql06dP6+abb9b69esVERHh1JSVlamwsNB5OisvLy/s3+6JiIjQ5s2bNX/+fE2cOFFRUVHKz8/X8uXLu/9bAAAARnLZtm339SD6SjAYlGVZCgQCvbMKVGqdtR/o+dcAAGCA6c7nN991BQAAjEXQAQAAxiLoAAAAYxF0AACAsQg6AADAWAQdAABgLIIOAAAwFkEHAAAYi6ADAACMRdABAADGIugAAABjEXQAAICxCDoAAMBYBB0AAGAsgg4AADAWQQcAABiLoAMAAIxF0AEAAMYi6AAAAGMRdAAAgLEIOgAAwFgEHQAAYCyCDgAAMBZBBwAAGIugAwAAjEXQAQAAxiLoAAAAYxF0AACAsQg6AADAWAQdAABgLIIOAAAwFkEHAAAYi6ADAACMRdABAADGIugAAABjEXQAAICxuh103n77bU2fPl3JyclyuVx65ZVXnL6Ojg79+7//u8aMGaPo6GglJyfrX//1X/XJJ5+EnWPSpElyuVxh25133hlW09zcLJ/PJ8uyZFmWfD6fWlpawmrq6uo0ffp0RUdHy+PxqLCwUO3t7d2dEgAAMFS3g05bW5uuvfZarVq1qkvfX/7yF+3du1f/+Z//qb179+rll1/Wn/70J+Xl5XWpLSgoUENDg7OtXr06rD8/P181NTXy+/3y+/2qqamRz+dz+js7OzVt2jS1tbWpsrJS5eXl2rhxo4qKiro7JQAAYKjB3T0gJydHOTk55+yzLEsVFRVhbU8++aT+8R//UXV1dRo+fLjTPnToUHm93nOe58CBA/L7/dq5c6cyMjIkSWvWrFFmZqYOHjyo1NRUbd26Vfv371d9fb2Sk5MlSStWrNCcOXO0ZMkSxcbGdjlvKBRSKBRy9oPBYPcmDwAA+pVev0cnEAjI5XLp+9//flh7WVmZPB6PrrnmGhUXF+vUqVNOX1VVlSzLckKOJI0fP16WZWnHjh1OTVpamhNyJCk7O1uhUEjV1dXnHMvSpUudS2GWZSklJaUHZwoAAC413V7R6Y7PP/9cDzzwgPLz88NWWGbPnq2RI0fK6/WqtrZWJSUleu+995zVoMbGRiUkJHQ5X0JCghobG52axMTEsP64uDhFRkY6NWcrKSnRokWLnP1gMEjYAQDAYL0WdDo6OnTnnXfqzJkzeuqpp8L6CgoKnJ/T0tI0atQojRs3Tnv37tX1118vSXK5XF3Oadt2WPv51HyV2+2W2+2+oPkAAID+p1cuXXV0dGjWrFk6fPiwKioqznm/zFddf/31GjJkiA4dOiRJ8nq9On78eJe6EydOOKs4Xq+3y8pNc3OzOjo6uqz0AACAganHg86XIefQoUPatm2bhg0b9q3H7Nu3Tx0dHUpKSpIkZWZmKhAIaPfu3U7Nrl27FAgENGHCBKemtrZWDQ0NTs3WrVvldruVnp7ew7MCAAD9UbcvXbW2turDDz909g8fPqyamhrFx8crOTlZ//zP/6y9e/fq9ddfV2dnp7PqEh8fr8jISH300UcqKyvTj3/8Y3k8Hu3fv19FRUUaO3asJk6cKEkaPXq0pk6dqoKCAuex83nz5ik3N1epqamSpKysLF199dXy+XxatmyZTp48qeLiYhUUFHzrChIAABgYXLZt29054M0339TkyZO7tN91110qLS3VyJEjz3ncG2+8oUmTJqm+vl7/8i//otraWrW2tiolJUXTpk3T4sWLFR8f79SfPHlShYWFeu211yRJeXl5WrVqVdjTW3V1dZo/f762b9+uqKgo5efna/ny5ed9H04wGJRlWQoEAr0Tjkqts/YDPf8aAAAMMN35/O520DEJQQcAgP6nO5/ffNcVAAAwFkEHAAAYi6ADAACMRdABAADGIugAAABjEXQAAICxCDoAAMBYBB0AAGAsgg4AADAWQQcAABiLoAMAAIxF0AEAAMYi6AAAAGMRdAAAgLEIOgAAwFgEHQAAYCyCDgAAMBZBBwAAGIugAwAAjEXQAQAAxiLoAAAAYxF0AACAsQg6AADAWAQdAABgLIIOAAAwFkEHAAAYi6ADAACMRdABAADGIugAAABjEXQAAICxCDoAAMBYBB0AAGAsgg4AADAWQQcAABiLoAMAAIzV7aDz9ttva/r06UpOTpbL5dIrr7wS1m/btkpLS5WcnKyoqChNmjRJ+/btC6sJhUJasGCBPB6PoqOjlZeXp6NHj4bVNDc3y+fzybIsWZYln8+nlpaWsJq6ujpNnz5d0dHR8ng8KiwsVHt7e3enBAAADNXtoNPW1qZrr71Wq1atOmf/Y489pscff1yrVq3Snj175PV6dcstt+jUqVNOzcKFC7Vp0yaVl5ersrJSra2tys3NVWdnp1OTn5+vmpoa+f1++f1+1dTUyOfzOf2dnZ2aNm2a2traVFlZqfLycm3cuFFFRUXdnRIAADCVfREk2Zs2bXL2z5w5Y3u9XvvRRx912j7//HPbsiz7mWeesW3btltaWuwhQ4bY5eXlTs2xY8fsQYMG2X6/37Zt296/f78tyd65c6dTU1VVZUuyP/jgA9u2bXvLli32oEGD7GPHjjk1L774ou12u+1AIHBe4w8EArak867vtsWx4RsAALho3fn87tF7dA4fPqzGxkZlZWU5bW63WzfeeKN27NghSaqurlZHR0dYTXJystLS0pyaqqoqWZaljIwMp2b8+PGyLCusJi0tTcnJyU5Ndna2QqGQqqurzzm+UCikYDAYtgEAAHP1aNBpbGyUJCUmJoa1JyYmOn2NjY2KjIxUXFzcN9YkJCR0OX9CQkJYzdmvExcXp8jISKfmbEuXLnXu+bEsSykpKRcwSwAA0F/0ylNXLpcrbN+27S5tZzu75lz1F1LzVSUlJQoEAs5WX1//jWMCAAD9W48GHa/XK0ldVlSampqc1Rev16v29nY1Nzd/Y83x48e7nP/EiRNhNWe/TnNzszo6Orqs9HzJ7XYrNjY2bAMAAObq0aAzcuRIeb1eVVRUOG3t7e166623NGHCBElSenq6hgwZElbT0NCg2tpapyYzM1OBQEC7d+92anbt2qVAIBBWU1tbq4aGBqdm69atcrvdSk9P78lpAQCAfmpwdw9obW3Vhx9+6OwfPnxYNTU1io+P1/Dhw7Vw4UI98sgjGjVqlEaNGqVHHnlEQ4cOVX5+viTJsizNnTtXRUVFGjZsmOLj41VcXKwxY8ZoypQpkqTRo0dr6tSpKigo0OrVqyVJ8+bNU25urlJTUyVJWVlZuvrqq+Xz+bRs2TKdPHlSxcXFKigoYKUGAABIuoCg8+6772ry5MnO/qJFiyRJd911l9avX6/7779fp0+f1vz589Xc3KyMjAxt3bpVMTExzjErV67U4MGDNWvWLJ0+fVo333yz1q9fr4iICKemrKxMhYWFztNZeXl5Yf92T0REhDZv3qz58+dr4sSJioqKUn5+vpYvX9793wIAADCSy7Ztu68H0VeCwaAsy1IgEOidVaBS66z9QM+/BgAAA0x3Pr/5risAAGAsgg4AADAWQQcAABiLoAMAAIxF0AEAAMYi6AAAAGMRdAAAgLEIOgAAwFgEHQAAYCyCDgAAMBZBBwAAGIugAwAAjEXQAQAAxiLoAAAAYxF0AACAsQg6AADAWAQdAABgLIIOAAAwFkEHAAAYi6ADAACMRdABAADGIugAAABjEXQAAICxCDoAAMBYBB0AAGAsgg4AADAWQQcAABiLoAMAAIxF0AEAAMYi6AAAAGMRdAAAgLEIOgAAwFgEHQAAYCyCDgAAMBZBBwAAGKvHg84VV1whl8vVZbv33nslSXPmzOnSN378+LBzhEIhLViwQB6PR9HR0crLy9PRo0fDapqbm+Xz+WRZlizLks/nU0tLS09PBwAA9GM9HnT27NmjhoYGZ6uoqJAk3X777U7N1KlTw2q2bNkSdo6FCxdq06ZNKi8vV2VlpVpbW5Wbm6vOzk6nJj8/XzU1NfL7/fL7/aqpqZHP5+vp6QAAgH5scE+f8Ac/+EHY/qOPPqorr7xSN954o9Pmdrvl9XrPeXwgENDatWu1YcMGTZkyRZL0/PPPKyUlRdu2bVN2drYOHDggv9+vnTt3KiMjQ5K0Zs0aZWZm6uDBg0pNTe3paQEAgH6oV+/RaW9v1/PPP6+f/exncrlcTvubb76phIQEXXXVVSooKFBTU5PTV11drY6ODmVlZTltycnJSktL044dOyRJVVVVsizLCTmSNH78eFmW5dScSygUUjAYDNsAAIC5ejXovPLKK2ppadGcOXOctpycHJWVlWn79u1asWKF9uzZo5tuukmhUEiS1NjYqMjISMXFxYWdKzExUY2NjU5NQkJCl9dLSEhwas5l6dKlzj09lmUpJSWlB2YJAAAuVT1+6eqr1q5dq5ycHCUnJzttd9xxh/NzWlqaxo0bpxEjRmjz5s2aMWPG157Ltu2wVaGv/vx1NWcrKSnRokWLnP1gMEjYAQDAYL0WdD7++GNt27ZNL7/88jfWJSUlacSIETp06JAkyev1qr29Xc3NzWGrOk1NTZowYYJTc/z48S7nOnHihBITE7/2tdxut9xu94VMBwAA9EO9dulq3bp1SkhI0LRp076x7rPPPlN9fb2SkpIkSenp6RoyZIjztJYkNTQ0qLa21gk6mZmZCgQC2r17t1Oza9cuBQIBpwYAAKBXVnTOnDmjdevW6a677tLgwf//S7S2tqq0tFQzZ85UUlKSjhw5ogcffFAej0e33XabJMmyLM2dO1dFRUUaNmyY4uPjVVxcrDFjxjhPYY0ePVpTp05VQUGBVq9eLUmaN2+ecnNzeeIKAAA4eiXobNu2TXV1dfrZz34W1h4REaH3339fzz33nFpaWpSUlKTJkyfrpZdeUkxMjFO3cuVKDR48WLNmzdLp06d18803a/369YqIiHBqysrKVFhY6DydlZeXp1WrVvXGdAAAQD/lsm3b7utB9JVgMCjLshQIBBQbG9vzL1BqnbUf6PnXAABggOnO5zffdQUAAIxF0AEAAMYi6AAAAGMRdAAAgLEIOgAAwFgEHQAAYCyCDgAAMBZBBwAAGIugAwAAjEXQAQAAxiLoAAAAYxF0AACAsQg6AADAWAQdAABgLIIOAAAwFkEHAAAYi6ADAACMRdABAADGIugAAABjEXQAAICxCDoAAMBYBB0AAGAsgg4AADAWQQcAABiLoAMAAIxF0AEAAMYi6AAAAGMRdAAAgLEIOgAAwFgEHQAAYCyCDgAAMBZBBwAAGIugAwAAjEXQAQAAxiLoAAAAY/V40CktLZXL5QrbvF6v02/btkpLS5WcnKyoqChNmjRJ+/btCztHKBTSggUL5PF4FB0drby8PB09ejSsprm5WT6fT5ZlybIs+Xw+tbS09PR0AABAP9YrKzrXXHONGhoanO399993+h577DE9/vjjWrVqlfbs2SOv16tbbrlFp06dcmoWLlyoTZs2qby8XJWVlWptbVVubq46Ozudmvz8fNXU1Mjv98vv96umpkY+n683pgMAAPqpwb1y0sGDw1ZxvmTbtp544gk99NBDmjFjhiTp2WefVWJiol544QX9/Oc/VyAQ0Nq1a7VhwwZNmTJFkvT8888rJSVF27ZtU3Z2tg4cOCC/36+dO3cqIyNDkrRmzRplZmbq4MGDSk1N7Y1pAQCAfqZXVnQOHTqk5ORkjRw5Unfeeaf+/Oc/S5IOHz6sxsZGZWVlObVut1s33nijduzYIUmqrq5WR0dHWE1ycrLS0tKcmqqqKlmW5YQcSRo/frwsy3JqziUUCikYDIZtAADAXD0edDIyMvTcc8/pd7/7ndasWaPGxkZNmDBBn332mRobGyVJiYmJYcckJiY6fY2NjYqMjFRcXNw31iQkJHR57YSEBKfmXJYuXerc02NZllJSUi5qrgAA4NLW40EnJydHM2fO1JgxYzRlyhRt3rxZ0l8vUX3J5XKFHWPbdpe2s51dc676bztPSUmJAoGAs9XX15/XnAAAQP/U64+XR0dHa8yYMTp06JBz387Zqy5NTU3OKo/X61V7e7uam5u/seb48eNdXuvEiRNdVou+yu12KzY2NmwDAADm6vWgEwqFdODAASUlJWnkyJHyer2qqKhw+tvb2/XWW29pwoQJkqT09HQNGTIkrKahoUG1tbVOTWZmpgKBgHbv3u3U7Nq1S4FAwKkBAADo8aeuiouLNX36dA0fPlxNTU361a9+pWAwqLvuuksul0sLFy7UI488olGjRmnUqFF65JFHNHToUOXn50uSLMvS3LlzVVRUpGHDhik+Pl7FxcXOpTBJGj16tKZOnaqCggKtXr1akjRv3jzl5ubyxBUAAHD0eNA5evSofvrTn+rTTz/VD37wA40fP147d+7UiBEjJEn333+/Tp8+rfnz56u5uVkZGRnaunWrYmJinHOsXLlSgwcP1qxZs3T69GndfPPNWr9+vSIiIpyasrIyFRYWOk9n5eXladWqVT09HQAA0I+5bNu2+3oQfSUYDMqyLAUCgd65X6fUOms/0POvAQDAANOdz2++6woAABiLoAMAAIxF0AEAAMYi6AAAAGMRdAAAgLEIOgAAwFgEHQAAYCyCDgAAMBZBBwAAGIugAwAAjEXQAQAAxiLoAAAAYxF0AACAsQg6AADAWAQdAABgLIIOAAAwFkEHAAAYi6ADAACMRdABAADGIugAAABjEXQAAICxCDoAAMBYBB0AAGAsgg4AADAWQQcAABiLoAMAAIxF0AEAAMYi6AAAAGMRdAAAgLEIOgAAwFgEHQAAYCyCDgAAMBZBBwAAGIugAwAAjEXQAQAAxurxoLN06VL98Ic/VExMjBISEnTrrbfq4MGDYTVz5syRy+UK28aPHx9WEwqFtGDBAnk8HkVHRysvL09Hjx4Nq2lubpbP55NlWbIsSz6fTy0tLT09JQAA0E/1eNB56623dO+992rnzp2qqKjQF198oaysLLW1tYXVTZ06VQ0NDc62ZcuWsP6FCxdq06ZNKi8vV2VlpVpbW5Wbm6vOzk6nJj8/XzU1NfL7/fL7/aqpqZHP5+vpKQEAgH5qcE+f0O/3h+2vW7dOCQkJqq6u1g033OC0u91ueb3ec54jEAho7dq12rBhg6ZMmSJJev7555WSkqJt27YpOztbBw4ckN/v186dO5WRkSFJWrNmjTIzM3Xw4EGlpqb29NQAAEA/0+v36AQCAUlSfHx8WPubb76phIQEXXXVVSooKFBTU5PTV11drY6ODmVlZTltycnJSktL044dOyRJVVVVsizLCTmSNH78eFmW5dScLRQKKRgMhm0AAMBcvRp0bNvWokWL9KMf/UhpaWlOe05OjsrKyrR9+3atWLFCe/bs0U033aRQKCRJamxsVGRkpOLi4sLOl5iYqMbGRqcmISGhy2smJCQ4NWdbunSpcz+PZVlKSUnpqakCAIBLUI9fuvqq++67T3/84x9VWVkZ1n7HHXc4P6elpWncuHEaMWKENm/erBkzZnzt+Wzblsvlcva/+vPX1XxVSUmJFi1a5OwHg0HCDgAABuu1FZ0FCxbotdde0xtvvKHLL7/8G2uTkpI0YsQIHTp0SJLk9XrV3t6u5ubmsLqmpiYlJiY6NcePH+9yrhMnTjg1Z3O73YqNjQ3bAACAuXo86Ni2rfvuu08vv/yytm/frpEjR37rMZ999pnq6+uVlJQkSUpPT9eQIUNUUVHh1DQ0NKi2tlYTJkyQJGVmZioQCGj37t1Oza5duxQIBJwaAAAwsPX4pat7771XL7zwgl599VXFxMQ498tYlqWoqCi1traqtLRUM2fOVFJSko4cOaIHH3xQHo9Ht912m1M7d+5cFRUVadiwYYqPj1dxcbHGjBnjPIU1evRoTZ06VQUFBVq9erUkad68ecrNzeWJKwAAIKkXgs7TTz8tSZo0aVJY+7p16zRnzhxFRETo/fff13PPPaeWlhYlJSVp8uTJeumllxQTE+PUr1y5UoMHD9asWbN0+vRp3XzzzVq/fr0iIiKcmrKyMhUWFjpPZ+Xl5WnVqlU9PSUAANBPuWzbtvt6EH0lGAzKsiwFAoHeuV+n1DprP9DzrwEAwADTnc9vvusKAAAYi6ADAACMRdABAADGIugAAABjEXQAAICxCDoAAMBYBB0AAGAsgg4AADAWQQcAABiLoAMAAIxF0AEAAMYi6AAAAGMRdAAAgLEIOgAAwFgEHQAAYCyCDgAAMBZBBwAAGIugAwAAjEXQAQAAxiLoAAAAYxF0AACAsQg6AADAWAQdAABgrMF9PQAAAL5LVzywOWz/yKPT+mgk+C4QdAAAxjo71GDgIegAAAa08wlDrPr0XwQdAIAxWMHB2Qg6AAB8C+7r6b946goAABiLFR1ggOFvpsDF476e/oOgAwDot3rznpwjl+V/++t//sLX951jbISf7x5BBwBglPMJKH32WqVf/jfQ00PB1yDoAEBPKLXO0caH2UU76/d6rhWU7zLY9Jiz/7zwZ6XXEHQAmOtCw8e5juut83yXLrUP0wv4/fTLUHMevrzMxaWtnkfQAWCOCwkWFxpGLrUQcz7645gHCCfAlX6l8VILpv0UQQdA/9BTS/182KO/+JrLdqz6dE+/DzpPPfWUli1bpoaGBl1zzTV64okn9E//9E99PSzgktVl6b9U/fNvjgQWDDDnWvW54vMXCD7fol8HnZdeekkLFy7UU089pYkTJ2r16tXKycnR/v37NXz48L4eHmCMKx7YfO57I/rjfSqAQY5clt8l+Eis+nxVvw46jz/+uObOnau7775bkvTEE0/od7/7nZ5++mktXbq0S30oFFIoFHL2A4G//k86GAz2zgBDdvh+b70O0B1n/7mUvvXP5pnQXxR0ffNxaYt/p9rL5l7s6ABchD+6fipJCpZ088CSoz0/mF705ee2bZ/j/0tns/upUChkR0RE2C+//HJYe2FhoX3DDTec85jFixfbktjY2NjY2NgM2Orr6781L/TbFZ1PP/1UnZ2dSkxMDGtPTExUY2PjOY8pKSnRokWLnP0zZ87o5MmTGjZsmFwuV4+OLxgMKiUlRfX19YqNje3Rc6N7eC8uHbwXlw7ei0sH70X32batU6dOKTk5+Vtr+23Q+dLZAcW27a8NLW63W263O6zt+9//fm8NTZIUGxvLH9xLBO/FpYP34tLBe3Hp4L3oHsuyzquu3357ucfjUURERJfVm6ampi6rPAAAYGDqt0EnMjJS6enpqqioCGuvqKjQhAkT+mhUAADgUtKvL10tWrRIPp9P48aNU2Zmpv7nf/5HdXV1uueee/p6aHK73Vq8eHGXS2X47vFeXDp4Ly4dvBeXDt6L3uWy7fN5NuvS9dRTT+mxxx5TQ0OD0tLStHLlSt1www19PSwAAHAJ6PdBBwAA4Ov023t0AAAAvg1BBwAAGIugAwAAjEXQAQAAxiLo9LAlS5ZowoQJGjp06Nf+q8t1dXWaPn26oqOj5fF4VFhYqPb29u92oAPUn/70J/3kJz+Rx+NRbGysJk6cqDfeeKOvhzVgbd68WRkZGYqKipLH49GMGTP6ekgDWigU0nXXXSeXy6Wampq+Hs6Ac+TIEc2dO1cjR45UVFSUrrzySi1evJjPh4tE0Olh7e3tuv322/WLX/zinP2dnZ2aNm2a2traVFlZqfLycm3cuFFFRUXf8UgHpmnTpumLL77Q9u3bVV1dreuuu065ublf+/1o6D0bN26Uz+fTv/3bv+m9997T73//e+Xn5/f1sAa0+++//7y+Owi944MPPtCZM2e0evVq7du3TytXrtQzzzyjBx98sK+H1r9d5JeI42usW7fOtiyrS/uWLVvsQYMG2ceOHXPaXnzxRdvtdtuBQOA7HOHAc+LECVuS/fbbbzttwWDQlmRv27atD0c28HR0dNh/8zd/Y//v//5vXw8F/58tW7bYf//3f2/v27fPlmT/4Q9/6Oshwbbtxx57zB45cmRfD6NfY0XnO1ZVVaW0tLSwvzVlZ2crFAqpurq6D0dmvmHDhmn06NF67rnn1NbWpi+++EKrV69WYmKi0tPT+3p4A8revXt17NgxDRo0SGPHjlVSUpJycnK0b9++vh7agHT8+HEVFBRow4YNGjp0aF8PB18RCAQUHx/f18Po1wg637HGxsYuXzoaFxenyMhILp/0MpfLpYqKCv3hD39QTEyMLrvsMq1cuVJ+v7/Xv8Ue4f785z9LkkpLS/Uf//Efev311xUXF6cbb7xRJ0+e7OPRDSy2bWvOnDm65557NG7cuL4eDr7io48+0pNPPnlJfK1Rf0bQOQ+lpaVyuVzfuL377rvnfT6Xy9Wlzbbtc7bj253v+2PbtubPn6+EhAS988472r17t37yk58oNzdXDQ0NfT0NI5zve3HmzBlJ0kMPPaSZM2cqPT1d69atk8vl0m9+85s+noUZzve9ePLJJxUMBlVSUtLXQzbWhXyGfPLJJ5o6dapuv/123X333X00cjPwFRDn4dNPP9Wnn376jTVXXHGFLrvsMmd//fr1WrhwoVpaWsLqHn74Yb366qt67733nLbm5mbFx8dr+/btmjx5co+OfSA43/fn97//vbKystTc3KzY2Finb9SoUZo7d64eeOCB3h6q8c73vaiqqtJNN92kd955Rz/60Y+cvoyMDE2ZMkVLlizp7aEa73zfizvvvFO//e1vw/6i1dnZqYiICM2ePVvPPvtsbw/VeN39DPnkk080efJkZWRkaP369Ro0iDWJi9Gvv738u+LxeOTxeHrkXJmZmVqyZIkaGhqUlJQkSdq6davcbjf3iVyg831//vKXv0hSl/9pDBo0yFlhwMU53/ciPT1dbrdbBw8edIJOR0eHjhw5ohEjRvT2MAeE830v/vu//1u/+tWvnP1PPvlE2dnZeumll5SRkdGbQxwwuvMZcuzYMU2ePNlZ5STkXDyCTg+rq6vTyZMnVVdXp87OTuffovi7v/s7fe9731NWVpauvvpq+Xw+LVu2TCdPnlRxcbEKCgrCVhnQ8zIzMxUXF6e77rpLDz/8sKKiorRmzRodPnxY06ZN6+vhDSixsbG65557tHjxYqWkpGjEiBFatmyZJOn222/v49ENLMOHDw/b/973vidJuvLKK3X55Zf3xZAGrE8++USTJk3S8OHDtXz5cp04ccLp83q9fTiy/o2g08MefvjhsKXesWPHSpLeeOMNTZo0SREREdq8ebPmz5+viRMnKioqSvn5+Vq+fHlfDXnA8Hg88vv9euihh3TTTTepo6ND11xzjV599VVde+21fT28AWfZsmUaPHiwfD6fTp8+rYyMDG3fvl1xcXF9PTSgT2zdulUffvihPvzwwy4hk7tMLhz36AAAAGNx8Q8AABiLoAMAAIxF0AEAAMYi6AAAAGMRdAAAgLEIOgAAwFgEHQAAYCyCDgAAMBZBBwAAGIugAwAAjEXQAQAAxvp/L7QQzbplVUEAAAAASUVORK5CYII=",
      "text/plain": [
       "<Figure size 640x480 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "plt.hist(sae_freqs, bins=100)\n",
    "plt.hist(tc_freqs, bins=100)\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "a5f9dd4d-b210-491d-8ea7-57e2347526ca",
   "metadata": {},
   "outputs": [],
   "source": [
    "tc_live = np.arange(len(tc_freqs))[utils.to_numpy(tc_freqs > -4)]\n",
    "sae_live = np.arange(len(sae_freqs))[utils.to_numpy(sae_freqs > -4)]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "6f8d39e3-4a1c-43dd-aef6-3ce7fc6c1c95",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(10403, 9381)"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "len(sae_live), len(tc_live)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "19a7678b-9aa0-40a9-a6e3-912226fa0294",
   "metadata": {},
   "source": [
    "# Generate feature dashboards\n",
    "\n",
    "This code generates a list of feature dashboards for 50 random transcoder features and 50 random SAE features. It saves these dashboards along with a text file containing the features that they correspond to.\n",
    "\n",
    "Note that we found that SAE features might have different ranges of activations than transcoder features. To prevent this from coloring our assessment, we then wrote a short additional script (not included here) to remove all numerical information about feature activations from the feature dashboards."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "ae027264-269b-4809-9db0-27ac5e0035c1",
   "metadata": {},
   "outputs": [],
   "source": [
    "save_dir = 'feature dashboards/'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "fa5beb13-3923-45ff-aa09-731633e131de",
   "metadata": {},
   "outputs": [],
   "source": [
    "import random\n",
    "\n",
    "num_features = 50\n",
    "tc_features = np.random.choice(tc_live[1:], size=num_features, replace=False)\n",
    "sae_features = np.random.choice(sae_live[1:], size=num_features, replace=False)\n",
    "features_list = [(x, 'tc') for x in tc_features] + [(x, 'sae') for x in sae_features]\n",
    "random.shuffle(features_list)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "996bc3d0-f013-48e1-a2ff-163b2876d1b9",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "i: 0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 200/200 [01:54<00:00,  1.75it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "i: 1\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 200/200 [01:54<00:00,  1.74it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "i: 2\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 200/200 [01:54<00:00,  1.74it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "i: 4\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 200/200 [01:54<00:00,  1.75it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "i: 5\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 200/200 [01:54<00:00,  1.74it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "i: 6\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 200/200 [01:54<00:00,  1.74it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "i: 7\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 200/200 [01:54<00:00,  1.74it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "i: 8\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 200/200 [01:54<00:00,  1.75it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "i: 9\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 200/200 [01:54<00:00,  1.75it/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "i: 10\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 92%|█████████▎| 185/200 [01:46<00:08,  1.74it/s]\n",
      "\n",
      "KeyboardInterrupt\n",
      "\n"
     ]
    }
   ],
   "source": [
    "i = 0\n",
    "while i < 2*num_features:\n",
    "    print(f\"i: {i}\")\n",
    "    feature_idx, feature_type = features_list[i]\n",
    "    if feature_type == 'tc':\n",
    "        scores = get_feature_scores(model, transcoder, owt_tokens_torch, feature_idx, batch_size=128)\n",
    "    elif feature_type == 'sae':\n",
    "        scores = get_feature_scores(model, sae, owt_tokens_torch, feature_idx, batch_size=128)\n",
    "        \n",
    "    if (scores>0).sum() < 4:\n",
    "        # replace feature if there are less than four activating examples\n",
    "        new_feature = None\n",
    "        while new_feature is None or (new_feature, feature_type) in features_list:\n",
    "            new_feature = random.choice(tc_live[1:] if feature_type == 'tc' else sae_live[1:])\n",
    "        del features_list[i]\n",
    "        features_list.append((new_feature, feature_type))\n",
    "        continue\n",
    "    \n",
    "    with open(save_dir + f'{i}.html', \"w\") as fp:\n",
    "        fp.write(display_activating_examples_dash(model, owt_tokens_torch, scores, do_display=False))\n",
    "    i += 1\n",
    "\n",
    "with open(save_dir + 'SECRET_FEATURES_LIST.txt', \"w\") as fp:\n",
    "    fp.write(\"\\n\".join([f'{i}: {feature_type}[{feature_idx}]' for i, (feature_type, feature_idx) in enumerate(features_list)]))"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "995ae1b3-1460-46de-afb7-721776cbdc43",
   "metadata": {},
   "source": [
    "# Evaluating results\n",
    "\n",
    "This section shows how we evaluated the results of our interpretability comparison. We load in the list of features and compare them to a list of notes (taken by the human evaluator) for each feature. Then, we can see how many SAE/transcoder features were interpretable, maybe-interpretable, or uninterpretable."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "35cfcf12-71a4-4a5d-93e4-48d0e6eb8183",
   "metadata": {},
   "outputs": [],
   "source": [
    "with open('feature dashboards/SECRET_FEATURES_LIST.txt', 'r') as fp:\n",
    "    feature_strs = fp.readlines()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "6f9628e2-f415-4482-a62e-06a828341a9a",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "is_tc = np.array(['tc' in x for x in feature_strs])\n",
    "is_sae = np.array(['sae' in x for x in feature_strs])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "a4e3d7d0-5eef-4362-8335-34e623369155",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "50"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "is_tc.sum()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "9416dd2e-d55c-4809-b66c-1e53625d493f",
   "metadata": {},
   "source": [
    "The below cell contains the human evaluator's notes on feature interpretability."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "61c92f3b-67f9-444d-a5f8-b8423b246528",
   "metadata": {
    "jupyter": {
     "source_hidden": true
    }
   },
   "outputs": [],
   "source": [
    "interp_strs = \\\n",
    "\"\"\"0 yes\n",
    "1 yes, context-free\n",
    "2 yes\n",
    "3 maybe, context-free\n",
    "4 yes\n",
    "5 yes\n",
    "6 yes\n",
    "7 yes\n",
    "8 yes\n",
    "9 yes\n",
    "10 yes, context-free\n",
    "11 maybe\n",
    "12 maybe\n",
    "13 yes\n",
    "14 yes, context-free\n",
    "15 yes\n",
    "16 yes\n",
    "17 yes, context-free\n",
    "18 yes\n",
    "19 maybe, context-free\n",
    "20 yes\n",
    "21 yes\n",
    "22 yes\n",
    "23 yes, context-free\n",
    "24 maybe, context-free\n",
    "25 yes, context-free\n",
    "26 yes\n",
    "27 yes\n",
    "28 maybe\n",
    "29 yes\n",
    "30 maybe, context-free\n",
    "31 yes\n",
    "32 yes\n",
    "33 maybe\n",
    "34 yes\n",
    "35 yes\n",
    "36 yes\n",
    "37 yes\n",
    "38 maybe\n",
    "39 yes\n",
    "40 yes\n",
    "41 yes, context-free\n",
    "42 no\n",
    "43 no\n",
    "44 maybe\n",
    "45 yes\n",
    "46 yes\n",
    "47 yes, context-free\n",
    "48 yes, context-free\n",
    "49 yes, context-free\n",
    "50 yes\n",
    "51 yes\n",
    "52 yes\n",
    "53 yes\n",
    "54 yes\n",
    "55 maybe\n",
    "56 yes\n",
    "57 no\n",
    "58 maybe\n",
    "59 yes\n",
    "60 yes, context-free\n",
    "61 yes\n",
    "62 yes\n",
    "63 maybe\n",
    "64 yes\n",
    "65 no\n",
    "66 yes\n",
    "67 maybe\n",
    "68 yes\n",
    "69 yes\n",
    "70 yes\n",
    "71 yes, context-free\n",
    "72 maybe\n",
    "73 yes\n",
    "74 yes\n",
    "75 yes, context-free\n",
    "76 yes\n",
    "77 yes\n",
    "78 yes, context-free\n",
    "79 yes\n",
    "80 yes\n",
    "81 yes\n",
    "82 yes, context-free\n",
    "83 yes\n",
    "84 no\n",
    "85 yes\n",
    "86 yes, context-free\n",
    "87 yes\n",
    "88 yes\n",
    "89 yes\n",
    "90 yes\n",
    "91 yes, context-free\n",
    "92 yes\n",
    "93 yes\n",
    "94 yes\n",
    "95 yes\n",
    "96 yes, context-free\n",
    "97 yes\n",
    "98 maybe\n",
    "99 yes\"\"\".split(\"\\n\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "ce9278e7-01ef-4a31-a737-e0b68d71fe53",
   "metadata": {},
   "outputs": [],
   "source": [
    "is_yes = np.array(['yes' in x for x in interp_strs])\n",
    "is_maybe = np.array(['maybe' in x for x in interp_strs])\n",
    "is_no = np.array(['no' in x for x in interp_strs])\n",
    "is_ctx_free = np.array(['context-free' in x for x in interp_strs])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "85d536db-80ba-4fb3-954f-0b7504465c05",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "41"
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.logical_and(is_tc, is_yes).sum()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "881fe686-3395-439d-b2a9-23fea7dda440",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "38"
      ]
     },
     "execution_count": 14,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.logical_and(is_sae, is_yes).sum()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "1f0386c0-9b3a-4484-9edc-5444916d5fd3",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "8"
      ]
     },
     "execution_count": 16,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.logical_and(is_tc, is_maybe).sum()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "e24dd7ae-301b-4742-b85d-2bfa94e1c4da",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "8"
      ]
     },
     "execution_count": 15,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.logical_and(is_sae, is_maybe).sum()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "d284ecd8-a163-4ff3-a1ae-f457af60da37",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "1"
      ]
     },
     "execution_count": 17,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.logical_and(is_tc, is_no).sum()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "cca04b1c-71e6-4420-b9bf-06c2ddd00112",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "4"
      ]
     },
     "execution_count": 18,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.logical_and(is_sae, is_no).sum()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "67fa843d-ed85-4f25-8e1f-ffedf5d42ead",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "6"
      ]
     },
     "execution_count": 19,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.logical_and(is_tc, is_ctx_free).sum()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "1a1ba177-a741-4183-8818-59a3147d1029",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "16"
      ]
     },
     "execution_count": 20,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.logical_and(is_sae, is_ctx_free).sum()"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.16"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
