{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "bf94871b",
   "metadata": {},
   "source": [
    "## This notebook will leverage pre-trained Phoneme2Word decoder to reconstruct sentences from sequences of phonemes"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "f31dcc4b",
   "metadata": {},
   "outputs": [],
   "source": [
    "# from phoneme2text import Phoneme2TextModel, PhonemeTokenizer, VanillaTransformerEncoder\n",
    "from transformers import BartForConditionalGeneration, BartTokenizer, BartConfig\n",
    "import jiwer\n",
    "import nltk\n",
    "from nltk.corpus import cmudict\n",
    "import tqdm\n",
    "import pandas as pd\n",
    "import sys\n",
    "sys.path.append(\"..\")\n",
    "from dataset import PHONE_DEF_SIL\n",
    "import torch\n",
    "from config import PHONEME2TEXT_MODEL\n",
    "import os \n",
    "import ast\n",
    "from phoneme2text import Phoneme2TextModel, NoisyBookCorpusPhonemeDataset\n",
    "from pytorch_lightning.callbacks import ModelCheckpoint, EarlyStopping\n",
    "from pytorch_lightning.loggers import WandbLogger\n",
    "from g2p_en import G2p\n",
    "from pytorch_lightning import Trainer\n",
    "from datasets import load_dataset\n",
    "import numpy as np\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "f388457c",
   "metadata": {},
   "outputs": [],
   "source": [
    "## load the Phoneme2Text model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "ba46e3e0",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Load GPT-2 config and enable cross-attention\n",
    "model = Phoneme2TextModel(learning_rate=1e-4, weight_decay=1e-5)\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "7f354906",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "# Define ModelCheckpoint to save the best model based on validation loss\n",
    "checkpoint_callback = ModelCheckpoint(\n",
    "    monitor=\"val_loss\",  # Ensure your validation step logs \"val_loss\"\n",
    "    mode=\"min\",          # Save the model with the lowest validation loss\n",
    "    save_top_k=1,        # Keep only the best model\n",
    "    dirpath=\"NoisyPhoneme2TextBART/\",  # Directory to save checkpoints\n",
    "    filename=\"best_model\",  # Model filename\n",
    "    verbose=True\n",
    ")\n",
    "\n",
    "# Define EarlyStopping callback with patience of 3 epochs\n",
    "early_stopping_callback = EarlyStopping(\n",
    "    monitor=\"val_loss\",\n",
    "    patience=5,   # Stop training if no improvement in 3 epochs\n",
    "    mode=\"min\",\n",
    "    verbose=True\n",
    ")\n",
    "\n",
    "wandb_logger = WandbLogger(project=\"Phoneme2TextBART\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "836da088",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_268665/1915409509.py:33: FutureWarning: You are using `torch.load` with `weights_only=False` (the current default value), which uses the default pickle module implicitly. It is possible to construct malicious pickle data which will execute arbitrary code during unpickling (See https://github.com/pytorch/pytorch/blob/main/SECURITY.md#untrusted-models for more details). In a future release, the default value for `weights_only` will be flipped to `True`. This limits the functions that could be executed during unpickling. Arbitrary objects will no longer be allowed to be loaded via this mode unless they are explicitly allowlisted by the user via `torch.serialization.add_safe_globals`. We recommend you start setting `weights_only=True` for any use case where you don't have full control of the loaded file. Please open an issue on GitHub for any issues related to this experimental feature.\n",
      "  model.load_state_dict(torch.load(\"NoisyPhoneme2TextBART/best_model.ckpt\")[\"state_dict\"])\n"
     ]
    }
   ],
   "source": [
    "TRAIN = False\n",
    "\n",
    "if TRAIN:\n",
    "    g2p = G2p()\n",
    "\n",
    "    dataset = load_dataset(\"bookcorpus/bookcorpus\", cache_dir = \"/data/HF\")\n",
    "    # This returns a dict with 'train' split\n",
    "    train_data = dataset['train']\n",
    "    \n",
    "    train_size = 1000000\n",
    "    val_size = 10000\n",
    "\n",
    "    train_dataset = NoisyBookCorpusPhonemeDataset(train_data[:train_size][\"text\"], g2p, addInterWordSymbol=True, apply_augmentation=True, corruption_prob=0.5, error_rate=0.3)\n",
    "    val_dataset = NoisyBookCorpusPhonemeDataset(train_data[train_size:train_size+val_size][\"text\"], g2p, addInterWordSymbol=True)\n",
    "\n",
    "    BS = 128\n",
    "    # 4) Wrap in a DataLoader for batching and iteration\n",
    "    train_dataloader = torch.utils.data.DataLoader(train_dataset, batch_size=BS, shuffle=True)\n",
    "    val_dataloader = torch.utils.data.DataLoader(val_dataset, batch_size=BS, shuffle=False)\n",
    "\n",
    "\n",
    "    # 🔹 Define the PyTorch Lightning Trainer\n",
    "    trainer = Trainer(max_epochs=5, accelerator=\"gpu\" if torch.cuda.is_available() else \"cpu\",devices=[2],\n",
    "                    callbacks=[checkpoint_callback, early_stopping_callback], logger=wandb_logger)\n",
    "    \n",
    "\n",
    "\n",
    "    # 🔹 Train the model\n",
    "    trainer.fit(model, train_dataloader,val_dataloader,)\n",
    "\n",
    "\n",
    "else:\n",
    "    model.load_state_dict(torch.load(\"NoisyPhoneme2TextBART/best_model.ckpt\")[\"state_dict\"])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "261655de",
   "metadata": {},
   "outputs": [],
   "source": [
    "def generate_text(model, phoneme_seqs, max_length=10):\n",
    "        \"\"\"\n",
    "        Generate text from a sequence of phonemes\n",
    "        \"\"\"\n",
    "        phoneme_ids = model.phoneme_tokenizer.batch_encode(phoneme_seqs)\n",
    "        phoneme_mask = (phoneme_ids != model.phoneme_tokenizer.vocab[\"[PAD]\"]).long().to(model.device)\n",
    "\n",
    "        # Run through encoder\n",
    "        encoder_outputs = model.encoder(phoneme_ids.to(model.device), phoneme_mask.to(model.device))\n",
    "\n",
    "        #project\n",
    "        encoder_outputs = model.proj_layer(encoder_outputs)\n",
    "\n",
    "        # Decode using GPT-2\n",
    "        output_ids = model.decoder.generate(\n",
    "            encoder_hidden_states=encoder_outputs,\n",
    "            encoder_attention_mask=phoneme_mask,\n",
    "            # max_length=max_length,\n",
    "            max_new_tokens=max_length,\n",
    "            num_beams=1,\n",
    "        )\n",
    "\n",
    "        # Convert token IDs back to text\n",
    "        return model.text_tokenizer.batch_decode(output_ids, skip_special_tokens=True)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "752066f3",
   "metadata": {},
   "source": [
    "## load results from one folder"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "6d19722f",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>True Phonemes</th>\n",
       "      <th>Predicted Phonemes</th>\n",
       "      <th>True Sentence</th>\n",
       "      <th>Day Index</th>\n",
       "      <th>CER</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>['TH', 'IY', 'AA', 'K', 'R', 'AH', 'S', 'IY', ...</td>\n",
       "      <td>['DH', 'R', 'AE', 'K', 'S', 'SIL', 'IH', 'G', ...</td>\n",
       "      <td>Theocracy reconsidered.</td>\n",
       "      <td>0</td>\n",
       "      <td>0.700000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>['R', 'IH', 'CH', 'SIL', 'P', 'ER', 'CH', 'AH'...</td>\n",
       "      <td>['R', 'IY', 'K', 'S', 'SIL', 'P', 'AA', 'SH', ...</td>\n",
       "      <td>Rich purchased several signed lithographs.</td>\n",
       "      <td>0</td>\n",
       "      <td>0.471698</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>['S', 'OW', 'SIL', 'R', 'UW', 'L', 'Z', 'SIL',...</td>\n",
       "      <td>['DH', 'AH', 'SIL', 'R', 'UW', 'L', 'Z', 'SIL'...</td>\n",
       "      <td>So rules we made, in unabashed collusion.</td>\n",
       "      <td>0</td>\n",
       "      <td>0.356322</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>['L', 'AO', 'R', 'IY', 'Z', 'SIL', 'K', 'AA', ...</td>\n",
       "      <td>['K', 'R', 'AO', 'R', 'IY', 'Z', 'SIL', 'K', '...</td>\n",
       "      <td>Lori's costume needed black gloves to be compl...</td>\n",
       "      <td>0</td>\n",
       "      <td>0.297872</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>['DH', 'AH', 'SIL', 'T', 'UW', 'TH', 'SIL', 'F...</td>\n",
       "      <td>['DH', 'AH', 'SIL', 'S', 'UW', 'TH', 'SIL', 'V...</td>\n",
       "      <td>The tooth fairy forgot to come when Roger's to...</td>\n",
       "      <td>0</td>\n",
       "      <td>0.294118</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>875</th>\n",
       "      <td>['Y', 'AO', 'R', 'SIL', 'T', 'Y', 'UW', 'IH', ...</td>\n",
       "      <td>['Y', 'UH', 'R', 'SIL', 'IH', 'F', 'R', 'EY', ...</td>\n",
       "      <td>Your tuition reimbursement.</td>\n",
       "      <td>23</td>\n",
       "      <td>0.175407</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>876</th>\n",
       "      <td>['G', 'EH', 'T', 'IH', 'NG', 'SIL', 'P', 'L', ...</td>\n",
       "      <td>['G', 'EH', 'T', 'IH', 'NG', 'SIL', 'B', 'L', ...</td>\n",
       "      <td>Getting pledge sheets for the Boy Scouts.</td>\n",
       "      <td>23</td>\n",
       "      <td>0.177504</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>877</th>\n",
       "      <td>['IH', 'F', 'SIL', 'Y', 'UW', 'SIL', 'HH', 'AE...</td>\n",
       "      <td>['IH', 'F', 'SIL', 'Y', 'UW', 'SIL', 'HH', 'AE...</td>\n",
       "      <td>If you have any doubts whatsoever.</td>\n",
       "      <td>23</td>\n",
       "      <td>0.176672</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>878</th>\n",
       "      <td>['M', 'IH', 'S', 'T', 'ER', 'IY', 'SIL', 'M', ...</td>\n",
       "      <td>['M', 'AE', 'T', 'ER', 'IY', 'SIL', 'M', 'UW',...</td>\n",
       "      <td>Mystery movies.</td>\n",
       "      <td>23</td>\n",
       "      <td>0.177269</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>879</th>\n",
       "      <td>['AY', 'SIL', 'K', 'AE', 'N', 'T', 'SIL', 'R',...</td>\n",
       "      <td>['AY', 'SIL', 'K', 'AE', 'N', 'T', 'SIL', 'R',...</td>\n",
       "      <td>I can't remember where.</td>\n",
       "      <td>23</td>\n",
       "      <td>0.176127</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>880 rows × 5 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                         True Phonemes  \\\n",
       "0    ['TH', 'IY', 'AA', 'K', 'R', 'AH', 'S', 'IY', ...   \n",
       "1    ['R', 'IH', 'CH', 'SIL', 'P', 'ER', 'CH', 'AH'...   \n",
       "2    ['S', 'OW', 'SIL', 'R', 'UW', 'L', 'Z', 'SIL',...   \n",
       "3    ['L', 'AO', 'R', 'IY', 'Z', 'SIL', 'K', 'AA', ...   \n",
       "4    ['DH', 'AH', 'SIL', 'T', 'UW', 'TH', 'SIL', 'F...   \n",
       "..                                                 ...   \n",
       "875  ['Y', 'AO', 'R', 'SIL', 'T', 'Y', 'UW', 'IH', ...   \n",
       "876  ['G', 'EH', 'T', 'IH', 'NG', 'SIL', 'P', 'L', ...   \n",
       "877  ['IH', 'F', 'SIL', 'Y', 'UW', 'SIL', 'HH', 'AE...   \n",
       "878  ['M', 'IH', 'S', 'T', 'ER', 'IY', 'SIL', 'M', ...   \n",
       "879  ['AY', 'SIL', 'K', 'AE', 'N', 'T', 'SIL', 'R',...   \n",
       "\n",
       "                                    Predicted Phonemes  \\\n",
       "0    ['DH', 'R', 'AE', 'K', 'S', 'SIL', 'IH', 'G', ...   \n",
       "1    ['R', 'IY', 'K', 'S', 'SIL', 'P', 'AA', 'SH', ...   \n",
       "2    ['DH', 'AH', 'SIL', 'R', 'UW', 'L', 'Z', 'SIL'...   \n",
       "3    ['K', 'R', 'AO', 'R', 'IY', 'Z', 'SIL', 'K', '...   \n",
       "4    ['DH', 'AH', 'SIL', 'S', 'UW', 'TH', 'SIL', 'V...   \n",
       "..                                                 ...   \n",
       "875  ['Y', 'UH', 'R', 'SIL', 'IH', 'F', 'R', 'EY', ...   \n",
       "876  ['G', 'EH', 'T', 'IH', 'NG', 'SIL', 'B', 'L', ...   \n",
       "877  ['IH', 'F', 'SIL', 'Y', 'UW', 'SIL', 'HH', 'AE...   \n",
       "878  ['M', 'AE', 'T', 'ER', 'IY', 'SIL', 'M', 'UW',...   \n",
       "879  ['AY', 'SIL', 'K', 'AE', 'N', 'T', 'SIL', 'R',...   \n",
       "\n",
       "                                         True Sentence  Day Index       CER  \n",
       "0                              Theocracy reconsidered.          0  0.700000  \n",
       "1           Rich purchased several signed lithographs.          0  0.471698  \n",
       "2            So rules we made, in unabashed collusion.          0  0.356322  \n",
       "3    Lori's costume needed black gloves to be compl...          0  0.297872  \n",
       "4    The tooth fairy forgot to come when Roger's to...          0  0.294118  \n",
       "..                                                 ...        ...       ...  \n",
       "875                        Your tuition reimbursement.         23  0.175407  \n",
       "876          Getting pledge sheets for the Boy Scouts.         23  0.177504  \n",
       "877                 If you have any doubts whatsoever.         23  0.176672  \n",
       "878                                    Mystery movies.         23  0.177269  \n",
       "879                            I can't remember where.         23  0.176127  \n",
       "\n",
       "[880 rows x 5 columns]"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# results_dir = \"../results/gru_ctc_mfcc/\"\n",
    "results_dir = \"../results/mfcc_sm_gru_ctc_LONGRUN/\"\n",
    "\n",
    "\n",
    "df = pd.read_csv(os.path.join(results_dir, \"results.csv\"))\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "da23ce93",
   "metadata": {},
   "outputs": [],
   "source": [
    "def decode_with_beam(phoneme_seq_beam, return_N=5):\n",
    "    # Step 1: Preprocess phoneme sequences\n",
    "    phoneme_seqs_beam = []\n",
    "    for phoneme_seq in phoneme_seq_beam:\n",
    "        phoneme_seq = [i if i != \"SIL\" else \" \" for i in phoneme_seq]\n",
    "        phoneme_seq = \" \".join(phoneme_seq)\n",
    "        phoneme_seqs_beam.append(phoneme_seq)\n",
    "\n",
    "    # Step 2: Generate beam outputs\n",
    "    generated_beam = model.generate_text(\n",
    "        phoneme_seqs_beam,\n",
    "        num_beams=5,\n",
    "        max_length=40,\n",
    "        do_sample=True,\n",
    "        num_return_sequences=return_N,\n",
    "    )\n",
    "\n",
    "    # Step 3: Expand phoneme sequences to match generated output\n",
    "    expanded_phoneme_seqs_beam = []\n",
    "    for seq in phoneme_seqs_beam:\n",
    "        expanded_phoneme_seqs_beam.extend([seq] * return_N)\n",
    "\n",
    "    # Step 4: Remove duplicate generations and align\n",
    "    unique_pairs = list(dict.fromkeys(zip(generated_beam, expanded_phoneme_seqs_beam)))  # removes duplicates, keeps order\n",
    "    generated_beam, phoneme_seqs_beam = zip(*unique_pairs)  # unzip\n",
    "    generated_beam, phoneme_seqs_beam = list(generated_beam), list(phoneme_seqs_beam)\n",
    "\n",
    "    # Step 5: Score and sort\n",
    "    with torch.no_grad():\n",
    "        scores = []\n",
    "        for phoneme_seq, sentence in zip(phoneme_seqs_beam, generated_beam):\n",
    "            nll, _ = model(phoneme_seq, sentence)\n",
    "            scores.append(-nll.cpu().numpy())\n",
    "\n",
    "        sorted_idx = np.argsort(scores)[::-1]\n",
    "        sorted_generated_beam = [generated_beam[i] for i in sorted_idx]\n",
    "        sorted_scores = [scores[i] for i in sorted_idx]\n",
    "\n",
    "    return sorted_generated_beam[:return_N]\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "c1037452",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Phoneme2TextModel(\n",
       "  (model): BartForConditionalGeneration(\n",
       "    (model): BartModel(\n",
       "      (shared): BartScaledWordEmbedding(50265, 768, padding_idx=1)\n",
       "      (encoder): BartEncoder(\n",
       "        (embed_tokens): BartScaledWordEmbedding(50265, 768, padding_idx=1)\n",
       "        (embed_positions): BartLearnedPositionalEmbedding(1026, 768)\n",
       "        (layers): ModuleList(\n",
       "          (0-5): 6 x BartEncoderLayer(\n",
       "            (self_attn): BartSdpaAttention(\n",
       "              (k_proj): Linear(in_features=768, out_features=768, bias=True)\n",
       "              (v_proj): Linear(in_features=768, out_features=768, bias=True)\n",
       "              (q_proj): Linear(in_features=768, out_features=768, bias=True)\n",
       "              (out_proj): Linear(in_features=768, out_features=768, bias=True)\n",
       "            )\n",
       "            (self_attn_layer_norm): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
       "            (activation_fn): GELUActivation()\n",
       "            (fc1): Linear(in_features=768, out_features=3072, bias=True)\n",
       "            (fc2): Linear(in_features=3072, out_features=768, bias=True)\n",
       "            (final_layer_norm): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
       "          )\n",
       "        )\n",
       "        (layernorm_embedding): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
       "      )\n",
       "      (decoder): BartDecoder(\n",
       "        (embed_tokens): BartScaledWordEmbedding(50265, 768, padding_idx=1)\n",
       "        (embed_positions): BartLearnedPositionalEmbedding(1026, 768)\n",
       "        (layers): ModuleList(\n",
       "          (0-5): 6 x BartDecoderLayer(\n",
       "            (self_attn): BartSdpaAttention(\n",
       "              (k_proj): Linear(in_features=768, out_features=768, bias=True)\n",
       "              (v_proj): Linear(in_features=768, out_features=768, bias=True)\n",
       "              (q_proj): Linear(in_features=768, out_features=768, bias=True)\n",
       "              (out_proj): Linear(in_features=768, out_features=768, bias=True)\n",
       "            )\n",
       "            (activation_fn): GELUActivation()\n",
       "            (self_attn_layer_norm): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
       "            (encoder_attn): BartSdpaAttention(\n",
       "              (k_proj): Linear(in_features=768, out_features=768, bias=True)\n",
       "              (v_proj): Linear(in_features=768, out_features=768, bias=True)\n",
       "              (q_proj): Linear(in_features=768, out_features=768, bias=True)\n",
       "              (out_proj): Linear(in_features=768, out_features=768, bias=True)\n",
       "            )\n",
       "            (encoder_attn_layer_norm): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
       "            (fc1): Linear(in_features=768, out_features=3072, bias=True)\n",
       "            (fc2): Linear(in_features=3072, out_features=768, bias=True)\n",
       "            (final_layer_norm): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
       "          )\n",
       "        )\n",
       "        (layernorm_embedding): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
       "      )\n",
       "    )\n",
       "    (lm_head): Linear(in_features=768, out_features=50265, bias=False)\n",
       "  )\n",
       ")"
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.to(\"cuda:0\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "4a72b9ac",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['i think that s something we might want', 'i think thatis something we might want', 'i think thatso something we might want', 'i think that S something we might want', 'i think thats something we might want']\n",
      "I think that's something we might want.\n"
     ]
    }
   ],
   "source": [
    "idx = 160\n",
    "print(decode_with_beam([df[\"Predicted Phonemes\"].apply(ast.literal_eval).iloc[idx]], return_N=5))\n",
    "print(df[\"True Sentence\"].iloc[idx])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "94958c15",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['in the context it would do well for us to pit in mine the vision of phoenix']\n"
     ]
    }
   ],
   "source": [
    "# df[\"Predicted Phonemes\"].apply(ast.literal_eval).iloc[0]\n",
    "i=0\n",
    "phoneme_batch = df[\"Predicted Phonemes\"][i:i+32]\n",
    "phoneme_batch = phoneme_batch.apply(ast.literal_eval).tolist()\n",
    "print(decode_with_beam(phoneme_batch, return_N=1))\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "2938bcbd",
   "metadata": {},
   "outputs": [],
   "source": [
    "# phoneme_batch.__len__()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "9961d3b3",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 880/880 [00:57<00:00, 15.21it/s]\n"
     ]
    }
   ],
   "source": [
    "pred_texts = []\n",
    "\n",
    "for i in tqdm.trange(0,len(df), 1):\n",
    "    #convert ids to phonemes\n",
    "    phoneme_batch = df[\"Predicted Phonemes\"][i:i+1]\n",
    "    phoneme_batch = phoneme_batch.apply(ast.literal_eval).tolist()\n",
    "\n",
    "\n",
    "    #pass through phoneme2text model\n",
    "    pred_text = decode_with_beam(phoneme_batch, return_N=1)\n",
    "    pred_texts.extend(pred_text)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "b8565ddd",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Predicted Text:  its really important\n",
      "Original Text:  It's really unfortunate.\n"
     ]
    }
   ],
   "source": [
    "idx = 532\n",
    "print(\"Predicted Text: \", pred_texts[idx])\n",
    "print(\"Original Text: \", df[\"True Sentence\"][idx])\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "id": "78ce2bfd",
   "metadata": {},
   "outputs": [],
   "source": [
    "import string\n",
    "import re\n",
    "def preprocess_text(text):\n",
    "    \"\"\"\n",
    "    Remove punctuation, strip, and convert text to lowercase.\n",
    "    \"\"\"\n",
    "    return text.translate(str.maketrans('', '', string.punctuation)).strip().lower()\n",
    "\n",
    "\n",
    "# def preprocess_text(text):\n",
    "#     \"\"\"\n",
    "#     Simplified preprocessing:\n",
    "#     - Lowercase\n",
    "#     - Replace apostrophes with space (so \"I'm\" → \"I m\")\n",
    "#     - Remove punctuation (except what's now handled)\n",
    "#     - Normalize whitespace\n",
    "#     \"\"\"\n",
    "#     text = text.lower()\n",
    "#     text = text.replace(\"'\", \" \")  # <- key change\n",
    "#     text = text.translate(str.maketrans('', '', string.punctuation))\n",
    "#     text = re.sub(r'\\s+', ' ', text)  # Normalize multiple spaces\n",
    "#     return text.strip()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "id": "47f9997d",
   "metadata": {},
   "outputs": [],
   "source": [
    "import jiwer  # For WER\n",
    "import sacrebleu  # For BLEU\n",
    "from rouge_score import rouge_scorer  # For ROUGE\n",
    "from nltk.translate.meteor_score import meteor_score  # For METEOR\n",
    "import bert_score  # For BERTScore\n",
    "import numpy as np\n",
    "\n",
    "def compute_metrics(text_transcriptions, gpt_decoded):\n",
    "    \"\"\"\n",
    "    Compute various NLP evaluation metrics for text generation.\n",
    "\n",
    "    Args:\n",
    "        text_transcriptions (list): List of ground-truth reference sentences.\n",
    "        gpt_decoded (list): List of model-generated sentences.\n",
    "\n",
    "    Returns:\n",
    "        dict: Dictionary containing all computed metrics.\n",
    "    \"\"\"\n",
    "\n",
    "    #remove punctuation, strip and lower case\n",
    "\n",
    "\n",
    "    text_transcriptions = [preprocess_text(text) for text in text_transcriptions]\n",
    "    gpt_decoded = [preprocess_text(text) for text in gpt_decoded]\n",
    "\n",
    "    results = {}\n",
    "\n",
    "    # WER (Word Error Rate)\n",
    "    wer = jiwer.wer(text_transcriptions, gpt_decoded)\n",
    "    results[\"WER\"] = wer\n",
    "\n",
    "    # BLEU Score\n",
    "    bleu = sacrebleu.corpus_bleu(gpt_decoded, [text_transcriptions]).score\n",
    "    results[\"BLEU\"] = bleu\n",
    "\n",
    "    # ROUGE Scores\n",
    "    rouge = rouge_scorer.RougeScorer([\"rouge1\", \"rouge2\", \"rougeL\"], use_stemmer=True)\n",
    "    rouge_scores = [rouge.score(ref, pred) for ref, pred in zip(text_transcriptions, gpt_decoded)]\n",
    "    results[\"ROUGE-1\"] = np.mean([score[\"rouge1\"].fmeasure for score in rouge_scores])\n",
    "    results[\"ROUGE-2\"] = np.mean([score[\"rouge2\"].fmeasure for score in rouge_scores])\n",
    "    results[\"ROUGE-L\"] = np.mean([score[\"rougeL\"].fmeasure for score in rouge_scores])\n",
    "\n",
    "    ##METEOR\n",
    "    tokenized_references = [ref.split() for ref in text_transcriptions]  # Tokenize reference sentences\n",
    "    tokenized_hypotheses = [pred.split() for pred in gpt_decoded]  # Tokenize predicted sentences\n",
    "\n",
    "    meteor_scores = [meteor_score([ref], pred) for ref, pred in zip(tokenized_references, tokenized_hypotheses)]\n",
    "    results[\"METEOR\"] = np.mean(meteor_scores)\n",
    "    # BERTScore (Semantic Similarity)\n",
    "    P, R, F1 = bert_score.score(gpt_decoded, text_transcriptions, lang=\"en\", rescale_with_baseline=True)\n",
    "    results[\"BERTScore_Precision\"] = P.mean().item()\n",
    "    results[\"BERTScore_Recall\"] = R.mean().item()\n",
    "    results[\"BERTScore_F1\"] = F1.mean().item()\n",
    "\n",
    "    ## save also all values without recomputing when possible\n",
    "    results[\"METEOR_scores\"] = meteor_scores\n",
    "    results[\"ROUGE_scores\"] = rouge_scores\n",
    "\n",
    "    results[\"WER_scores\"] = [jiwer.wer([ref], [pred]) for ref, pred in zip(text_transcriptions, gpt_decoded)]\n",
    "    results[\"BERTScore_F1_scores\"] = F1.cpu().numpy().tolist()\n",
    "    return results\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "1ce2829b",
   "metadata": {},
   "outputs": [],
   "source": [
    "sentences = df[\"True Sentence\"].tolist()\n",
    "decoded_sentences = pred_texts"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "id": "ccc75d96",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Some weights of RobertaModel were not initialized from the model checkpoint at roberta-large and are newly initialized: ['roberta.pooler.dense.bias', 'roberta.pooler.dense.weight']\n",
      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "WER: 0.3136\n",
      "BLEU: 46.1677\n",
      "ROUGE-1: 0.7080\n",
      "ROUGE-2: 0.5298\n",
      "ROUGE-L: 0.7080\n",
      "METEOR: 0.6688\n",
      "BERTScore_Precision: 0.5156\n",
      "BERTScore_Recall: 0.5584\n",
      "BERTScore_F1: 0.5371\n"
     ]
    }
   ],
   "source": [
    "\n",
    "metrics = compute_metrics(sentences,decoded_sentences)\n",
    "for metric, score in metrics.items():\n",
    "    if \"scores\" not in metric:\n",
    "        print(f\"{metric}: {score:.4f}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "id": "f0ec6a7b",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "\n",
    "results_df = pd.DataFrame({\n",
    "    \"target_sentence\": sentences,\n",
    "    \"pred_sentence\": decoded_sentences,\n",
    "})\n",
    "\n",
    "#unfold cer_list\n",
    "# cer_list_unfold = [item for sublist in cer_list for item in sublist]\n",
    "\n",
    "results_df[\"WER_scores\"] = metrics[\"WER_scores\"]\n",
    "results_df[\"METEOR_scores\"] = metrics[\"METEOR_scores\"]\n",
    "results_df[\"ROUGE_scores\"] = metrics[\"ROUGE_scores\"]\n",
    "results_df[\"BERTScore_F1_scores\"] = metrics[\"BERTScore_F1_scores\"]\n",
    "\n",
    "results_df.to_csv(f\"{results_dir}/language_results_P2T.csv\", index=False)\n",
    "\n",
    "overall_metrics = {k:v for k,v in metrics.items() if \"scores\" not in k}\n",
    "\n",
    "metrics_df = pd.DataFrame(overall_metrics, index=[0])\n",
    "metrics_df.to_csv(f\"{results_dir}/language_metrics_P2T.csv\", index=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "id": "4cbc5c38",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>target_sentence</th>\n",
       "      <th>pred_sentence</th>\n",
       "      <th>WER_scores</th>\n",
       "      <th>METEOR_scores</th>\n",
       "      <th>ROUGE_scores</th>\n",
       "      <th>BERTScore_F1_scores</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>469</th>\n",
       "      <td>Were thoroughbreds.</td>\n",
       "      <td>we re both abandoned</td>\n",
       "      <td>2.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>{'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....</td>\n",
       "      <td>-0.022317</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>229</th>\n",
       "      <td>Don't collect unemployment.</td>\n",
       "      <td>do nt tell a mannot</td>\n",
       "      <td>1.666667</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>{'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....</td>\n",
       "      <td>-0.025470</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>621</th>\n",
       "      <td>Started investigating.</td>\n",
       "      <td>or a expensivelooking</td>\n",
       "      <td>1.500000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>{'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....</td>\n",
       "      <td>-0.182870</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>58</th>\n",
       "      <td>Those musicians harmonize marvelously.</td>\n",
       "      <td>those emblems are mine i moan nervously</td>\n",
       "      <td>1.500000</td>\n",
       "      <td>0.116279</td>\n",
       "      <td>{'rouge1': (0.14285714285714285, 0.25, 0.18181...</td>\n",
       "      <td>0.084962</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>369</th>\n",
       "      <td>I'm wearing shorts.</td>\n",
       "      <td>i m rehearsing stories</td>\n",
       "      <td>1.333333</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>{'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....</td>\n",
       "      <td>0.061029</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>111</th>\n",
       "      <td>Noise causes air pollution.</td>\n",
       "      <td>mary was guardhis dare solution</td>\n",
       "      <td>1.250000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>{'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....</td>\n",
       "      <td>-0.168450</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>400</th>\n",
       "      <td>Friday afternoon at five thirty.</td>\n",
       "      <td>i do nt want that five lady</td>\n",
       "      <td>1.200000</td>\n",
       "      <td>0.096154</td>\n",
       "      <td>{'rouge1': (0.14285714285714285, 0.2, 0.166666...</td>\n",
       "      <td>-0.175747</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>Academic aptitude guarantees your diploma.</td>\n",
       "      <td>corrected mick abdul to disturb your replacement</td>\n",
       "      <td>1.200000</td>\n",
       "      <td>0.096154</td>\n",
       "      <td>{'rouge1': (0.14285714285714285, 0.2, 0.166666...</td>\n",
       "      <td>-0.038453</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>61</th>\n",
       "      <td>Inflammatory cells were strikingly absent.</td>\n",
       "      <td>in tim or sales were twitchingly apprent</td>\n",
       "      <td>1.200000</td>\n",
       "      <td>0.096154</td>\n",
       "      <td>{'rouge1': (0.14285714285714285, 0.2, 0.166666...</td>\n",
       "      <td>0.089066</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>Primitive tribes have an upbeat attitude.</td>\n",
       "      <td>many times have and a bit had stood</td>\n",
       "      <td>1.166667</td>\n",
       "      <td>0.080645</td>\n",
       "      <td>{'rouge1': (0.125, 0.16666666666666666, 0.1428...</td>\n",
       "      <td>0.008529</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>He talked about unauthentic storylines too.</td>\n",
       "      <td>ii checked about on athletic stores you</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.081967</td>\n",
       "      <td>{'rouge1': (0.14285714285714285, 0.16666666666...</td>\n",
       "      <td>0.034050</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>875</th>\n",
       "      <td>Your tuition reimbursement.</td>\n",
       "      <td>pure frustration resentment</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>{'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....</td>\n",
       "      <td>0.146426</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>Theocracy reconsidered.</td>\n",
       "      <td>rafe suggested</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>{'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....</td>\n",
       "      <td>0.034907</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>624</th>\n",
       "      <td>To upholster chairs.</td>\n",
       "      <td>two offholsto chores</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>{'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....</td>\n",
       "      <td>0.110160</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>612</th>\n",
       "      <td>Golden Retriever.</td>\n",
       "      <td>children rejoice</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>{'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....</td>\n",
       "      <td>-0.007997</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>681</th>\n",
       "      <td>State land grant colleges.</td>\n",
       "      <td>set that rent soldiers</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>{'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....</td>\n",
       "      <td>0.046407</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>272</th>\n",
       "      <td>Increasingly democratically oriented.</td>\n",
       "      <td>incredibly dismissively gordon</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>{'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....</td>\n",
       "      <td>0.215967</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>117</th>\n",
       "      <td>Visionary leaders.</td>\n",
       "      <td>virginia later</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>{'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....</td>\n",
       "      <td>0.064084</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>878</th>\n",
       "      <td>Mystery movies.</td>\n",
       "      <td>mattory movie</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.250000</td>\n",
       "      <td>{'rouge1': (0.5, 0.5, 0.5), 'rouge2': (0.0, 0....</td>\n",
       "      <td>0.377130</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>Rich purchased several signed lithographs.</td>\n",
       "      <td>cheeks parcheis several sighs and lipsoffs</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.098039</td>\n",
       "      <td>{'rouge1': (0.16666666666666666, 0.2, 0.181818...</td>\n",
       "      <td>0.051935</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                 target_sentence  \\\n",
       "469                          Were thoroughbreds.   \n",
       "229                  Don't collect unemployment.   \n",
       "621                       Started investigating.   \n",
       "58        Those musicians harmonize marvelously.   \n",
       "369                          I'm wearing shorts.   \n",
       "111                  Noise causes air pollution.   \n",
       "400             Friday afternoon at five thirty.   \n",
       "19    Academic aptitude guarantees your diploma.   \n",
       "61    Inflammatory cells were strikingly absent.   \n",
       "13     Primitive tribes have an upbeat attitude.   \n",
       "10   He talked about unauthentic storylines too.   \n",
       "875                  Your tuition reimbursement.   \n",
       "0                        Theocracy reconsidered.   \n",
       "624                         To upholster chairs.   \n",
       "612                            Golden Retriever.   \n",
       "681                   State land grant colleges.   \n",
       "272        Increasingly democratically oriented.   \n",
       "117                           Visionary leaders.   \n",
       "878                              Mystery movies.   \n",
       "1     Rich purchased several signed lithographs.   \n",
       "\n",
       "                                        pred_sentence  WER_scores  \\\n",
       "469                              we re both abandoned    2.000000   \n",
       "229                               do nt tell a mannot    1.666667   \n",
       "621                             or a expensivelooking    1.500000   \n",
       "58            those emblems are mine i moan nervously    1.500000   \n",
       "369                            i m rehearsing stories    1.333333   \n",
       "111                   mary was guardhis dare solution    1.250000   \n",
       "400                       i do nt want that five lady    1.200000   \n",
       "19   corrected mick abdul to disturb your replacement    1.200000   \n",
       "61           in tim or sales were twitchingly apprent    1.200000   \n",
       "13                many times have and a bit had stood    1.166667   \n",
       "10            ii checked about on athletic stores you    1.000000   \n",
       "875                       pure frustration resentment    1.000000   \n",
       "0                                      rafe suggested    1.000000   \n",
       "624                              two offholsto chores    1.000000   \n",
       "612                                  children rejoice    1.000000   \n",
       "681                            set that rent soldiers    1.000000   \n",
       "272                    incredibly dismissively gordon    1.000000   \n",
       "117                                    virginia later    1.000000   \n",
       "878                                     mattory movie    1.000000   \n",
       "1          cheeks parcheis several sighs and lipsoffs    1.000000   \n",
       "\n",
       "     METEOR_scores                                       ROUGE_scores  \\\n",
       "469       0.000000  {'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....   \n",
       "229       0.000000  {'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....   \n",
       "621       0.000000  {'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....   \n",
       "58        0.116279  {'rouge1': (0.14285714285714285, 0.25, 0.18181...   \n",
       "369       0.000000  {'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....   \n",
       "111       0.000000  {'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....   \n",
       "400       0.096154  {'rouge1': (0.14285714285714285, 0.2, 0.166666...   \n",
       "19        0.096154  {'rouge1': (0.14285714285714285, 0.2, 0.166666...   \n",
       "61        0.096154  {'rouge1': (0.14285714285714285, 0.2, 0.166666...   \n",
       "13        0.080645  {'rouge1': (0.125, 0.16666666666666666, 0.1428...   \n",
       "10        0.081967  {'rouge1': (0.14285714285714285, 0.16666666666...   \n",
       "875       0.000000  {'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....   \n",
       "0         0.000000  {'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....   \n",
       "624       0.000000  {'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....   \n",
       "612       0.000000  {'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....   \n",
       "681       0.000000  {'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....   \n",
       "272       0.000000  {'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....   \n",
       "117       0.000000  {'rouge1': (0.0, 0.0, 0.0), 'rouge2': (0.0, 0....   \n",
       "878       0.250000  {'rouge1': (0.5, 0.5, 0.5), 'rouge2': (0.0, 0....   \n",
       "1         0.098039  {'rouge1': (0.16666666666666666, 0.2, 0.181818...   \n",
       "\n",
       "     BERTScore_F1_scores  \n",
       "469            -0.022317  \n",
       "229            -0.025470  \n",
       "621            -0.182870  \n",
       "58              0.084962  \n",
       "369             0.061029  \n",
       "111            -0.168450  \n",
       "400            -0.175747  \n",
       "19             -0.038453  \n",
       "61              0.089066  \n",
       "13              0.008529  \n",
       "10              0.034050  \n",
       "875             0.146426  \n",
       "0               0.034907  \n",
       "624             0.110160  \n",
       "612            -0.007997  \n",
       "681             0.046407  \n",
       "272             0.215967  \n",
       "117             0.064084  \n",
       "878             0.377130  \n",
       "1               0.051935  "
      ]
     },
     "execution_count": 35,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "results_df.sort_values(\"WER_scores\", ascending=False).head(20)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 41,
   "id": "b5e84641",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>target_sentence</th>\n",
       "      <th>pred_sentence</th>\n",
       "      <th>WER_scores</th>\n",
       "      <th>METEOR_scores</th>\n",
       "      <th>ROUGE_scores</th>\n",
       "      <th>BERTScore_F1_scores</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>434</th>\n",
       "      <td>I'm not sure how to go about it.</td>\n",
       "      <td>i m not sure how to go about it</td>\n",
       "      <td>0.25</td>\n",
       "      <td>0.862938</td>\n",
       "      <td>{'rouge1': (0.7777777777777778, 0.875, 0.82352...</td>\n",
       "      <td>0.733860</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>433</th>\n",
       "      <td>I can't really think of anything else offhand.</td>\n",
       "      <td>i cant really think of anything s offfriend</td>\n",
       "      <td>0.25</td>\n",
       "      <td>0.748264</td>\n",
       "      <td>{'rouge1': (0.75, 0.75, 0.75), 'rouge2': (0.71...</td>\n",
       "      <td>0.354997</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>702</th>\n",
       "      <td>Sometimes it will skip.</td>\n",
       "      <td>sometimes it will accept</td>\n",
       "      <td>0.25</td>\n",
       "      <td>0.736111</td>\n",
       "      <td>{'rouge1': (0.75, 0.75, 0.75), 'rouge2': (0.66...</td>\n",
       "      <td>0.574604</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>701</th>\n",
       "      <td>Buying of our fish.</td>\n",
       "      <td>mykking of our fish</td>\n",
       "      <td>0.25</td>\n",
       "      <td>0.736111</td>\n",
       "      <td>{'rouge1': (0.75, 0.75, 0.75), 'rouge2': (0.66...</td>\n",
       "      <td>0.457258</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>721</th>\n",
       "      <td>To find a mountain.</td>\n",
       "      <td>to find a manand</td>\n",
       "      <td>0.25</td>\n",
       "      <td>0.736111</td>\n",
       "      <td>{'rouge1': (0.75, 0.75, 0.75), 'rouge2': (0.66...</td>\n",
       "      <td>0.560610</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>487</th>\n",
       "      <td>How different the people there really are.</td>\n",
       "      <td>how different the people there really are</td>\n",
       "      <td>0.00</td>\n",
       "      <td>0.998542</td>\n",
       "      <td>{'rouge1': (1.0, 1.0, 1.0), 'rouge2': (1.0, 1....</td>\n",
       "      <td>1.000001</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>492</th>\n",
       "      <td>How to do things.</td>\n",
       "      <td>how to do things</td>\n",
       "      <td>0.00</td>\n",
       "      <td>0.992188</td>\n",
       "      <td>{'rouge1': (1.0, 1.0, 1.0), 'rouge2': (1.0, 1....</td>\n",
       "      <td>1.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>497</th>\n",
       "      <td>They didn't fight together.</td>\n",
       "      <td>they didnt fight together</td>\n",
       "      <td>0.00</td>\n",
       "      <td>0.992188</td>\n",
       "      <td>{'rouge1': (1.0, 1.0, 1.0), 'rouge2': (1.0, 1....</td>\n",
       "      <td>1.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>501</th>\n",
       "      <td>If you do decide to go with child care.</td>\n",
       "      <td>if you do decide to go with child care</td>\n",
       "      <td>0.00</td>\n",
       "      <td>0.999314</td>\n",
       "      <td>{'rouge1': (1.0, 1.0, 1.0), 'rouge2': (1.0, 1....</td>\n",
       "      <td>1.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>632</th>\n",
       "      <td>Because you don't know.</td>\n",
       "      <td>because you dont know</td>\n",
       "      <td>0.00</td>\n",
       "      <td>0.992188</td>\n",
       "      <td>{'rouge1': (1.0, 1.0, 1.0), 'rouge2': (1.0, 1....</td>\n",
       "      <td>1.000000</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>400 rows × 6 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                    target_sentence  \\\n",
       "434                I'm not sure how to go about it.   \n",
       "433  I can't really think of anything else offhand.   \n",
       "702                         Sometimes it will skip.   \n",
       "701                             Buying of our fish.   \n",
       "721                             To find a mountain.   \n",
       "..                                              ...   \n",
       "487      How different the people there really are.   \n",
       "492                               How to do things.   \n",
       "497                     They didn't fight together.   \n",
       "501         If you do decide to go with child care.   \n",
       "632                         Because you don't know.   \n",
       "\n",
       "                                   pred_sentence  WER_scores  METEOR_scores  \\\n",
       "434              i m not sure how to go about it        0.25       0.862938   \n",
       "433  i cant really think of anything s offfriend        0.25       0.748264   \n",
       "702                     sometimes it will accept        0.25       0.736111   \n",
       "701                          mykking of our fish        0.25       0.736111   \n",
       "721                             to find a manand        0.25       0.736111   \n",
       "..                                           ...         ...            ...   \n",
       "487    how different the people there really are        0.00       0.998542   \n",
       "492                             how to do things        0.00       0.992188   \n",
       "497                    they didnt fight together        0.00       0.992188   \n",
       "501       if you do decide to go with child care        0.00       0.999314   \n",
       "632                        because you dont know        0.00       0.992188   \n",
       "\n",
       "                                          ROUGE_scores  BERTScore_F1_scores  \n",
       "434  {'rouge1': (0.7777777777777778, 0.875, 0.82352...             0.733860  \n",
       "433  {'rouge1': (0.75, 0.75, 0.75), 'rouge2': (0.71...             0.354997  \n",
       "702  {'rouge1': (0.75, 0.75, 0.75), 'rouge2': (0.66...             0.574604  \n",
       "701  {'rouge1': (0.75, 0.75, 0.75), 'rouge2': (0.66...             0.457258  \n",
       "721  {'rouge1': (0.75, 0.75, 0.75), 'rouge2': (0.66...             0.560610  \n",
       "..                                                 ...                  ...  \n",
       "487  {'rouge1': (1.0, 1.0, 1.0), 'rouge2': (1.0, 1....             1.000001  \n",
       "492  {'rouge1': (1.0, 1.0, 1.0), 'rouge2': (1.0, 1....             1.000000  \n",
       "497  {'rouge1': (1.0, 1.0, 1.0), 'rouge2': (1.0, 1....             1.000000  \n",
       "501  {'rouge1': (1.0, 1.0, 1.0), 'rouge2': (1.0, 1....             1.000000  \n",
       "632  {'rouge1': (1.0, 1.0, 1.0), 'rouge2': (1.0, 1....             1.000000  \n",
       "\n",
       "[400 rows x 6 columns]"
      ]
     },
     "execution_count": 41,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "results_df.sort_values(\"WER_scores\", ascending=False).tail(400)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "id": "4d2c77b1",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(array([154.,   0.,   0.,   2.,   5.,  19.,  27.,  35.,  36.,   3.,  43.,\n",
       "         14.,  64.,   2.,  36.,  10.,  88.,   0.,  22.,   2.,  47.,  20.,\n",
       "         13.,   0.,   0.,  73.,   0.,   8.,  13.,   0.,  28.,   7.,   0.,\n",
       "         33.,   1.,   4.,   0.,  16.,   0.,   0.,   9.,   4.,   3.,   2.,\n",
       "          0.,   1.,   0.,   0.,   0.,   0.,  26.,   0.,   0.,   0.,   0.,\n",
       "          0.,   0.,   0.,   1.,   0.,   3.,   0.,   1.,   0.,   0.,   0.,\n",
       "          1.,   0.,   0.,   0.,   0.,   0.,   0.,   0.,   0.,   2.,   0.,\n",
       "          0.,   0.,   0.,   0.,   0.,   0.,   1.,   0.,   0.,   0.,   0.,\n",
       "          0.,   0.,   0.,   0.,   0.,   0.,   0.,   0.,   0.,   0.,   0.,\n",
       "          1.]),\n",
       " array([0.  , 0.02, 0.04, 0.06, 0.08, 0.1 , 0.12, 0.14, 0.16, 0.18, 0.2 ,\n",
       "        0.22, 0.24, 0.26, 0.28, 0.3 , 0.32, 0.34, 0.36, 0.38, 0.4 , 0.42,\n",
       "        0.44, 0.46, 0.48, 0.5 , 0.52, 0.54, 0.56, 0.58, 0.6 , 0.62, 0.64,\n",
       "        0.66, 0.68, 0.7 , 0.72, 0.74, 0.76, 0.78, 0.8 , 0.82, 0.84, 0.86,\n",
       "        0.88, 0.9 , 0.92, 0.94, 0.96, 0.98, 1.  , 1.02, 1.04, 1.06, 1.08,\n",
       "        1.1 , 1.12, 1.14, 1.16, 1.18, 1.2 , 1.22, 1.24, 1.26, 1.28, 1.3 ,\n",
       "        1.32, 1.34, 1.36, 1.38, 1.4 , 1.42, 1.44, 1.46, 1.48, 1.5 , 1.52,\n",
       "        1.54, 1.56, 1.58, 1.6 , 1.62, 1.64, 1.66, 1.68, 1.7 , 1.72, 1.74,\n",
       "        1.76, 1.78, 1.8 , 1.82, 1.84, 1.86, 1.88, 1.9 , 1.92, 1.94, 1.96,\n",
       "        1.98, 2.  ]),\n",
       " <BarContainer object of 100 artists>)"
      ]
     },
     "execution_count": 36,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAigAAAGeCAYAAAC+dvpwAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjguNCwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8fJSN1AAAACXBIWXMAAA9hAAAPYQGoP6dpAAApUElEQVR4nO3df3RU1b3//9eEkAmlZGLAZJLbBKIXAREBQWKQVijR8ENKLrQaV6SpRei1xBbiVclaAkVtA5QrFBpJdSFoLz8qt4IV2igGA1cNAQPcK4gRbIQonWS1NBkSJEayv3/043w7JPyYMCF7wvOx1ll69tnnzHvPmTgv95wz4zDGGAEAAFgkrKMLAAAAOBcBBQAAWIeAAgAArENAAQAA1iGgAAAA6xBQAACAdQgoAADAOgQUAABgHQIKAACwTnhHF9AWzc3NOnHihHr06CGHw9HR5QAAgEtgjNGpU6eUkJCgsLCLzJGYAO3cudPcfffdJj4+3kgymzdvbtHngw8+MJMmTTJRUVHma1/7mhk+fLg5duyYb/vnn39ufvzjH5uYmBjTvXt3M2XKFOPxeC65hqqqKiOJhYWFhYWFJQSXqqqqi77XBzyD0tDQoMGDB+uHP/yhpkyZ0mL7xx9/rFGjRmn69OlauHChoqKidOjQIUVGRvr6zJkzR9u2bdOmTZvkcrmUk5OjKVOm6J133rmkGnr06CFJqqqqUlRUVKBDAAAAHcDr9SoxMdH3Pn4hDmPa/mOBDodDmzdvVkZGhq8tMzNTXbt21W9/+9tW96mrq9O1116r9evX67vf/a4k6cMPP9SAAQNUWlqq22677aKP6/V65XK5VFdXR0ABACBEBPL+HdSLZJubm7Vt2zbdcMMNSk9PV2xsrFJSUrRlyxZfn/LycjU1NSktLc3X1r9/fyUlJam0tLTV4zY2Nsrr9fotAACg8wpqQKmpqVF9fb0WLVqkcePG6Y033tC//du/acqUKdq5c6ckyePxKCIiQtHR0X77xsXFyePxtHrc/Px8uVwu35KYmBjMsgEAgGWCPoMiSZMnT9acOXM0ZMgQzZ07V3fffbcKCwvbfNy8vDzV1dX5lqqqqmCVDAAALBTU24x79eql8PBw3XjjjX7tAwYM0Ntvvy1Jcrvd+uKLL1RbW+s3i1JdXS23293qcZ1Op5xOZzBLBQAAFgvqDEpERIRuvfVWVVRU+LV/9NFH6t27tyRp2LBh6tq1q4qLi33bKyoqdPz4caWmpgazHAAAEKICnkGpr6/X0aNHfeuVlZU6cOCAYmJilJSUpEcffVT33nuvvvWtb2nMmDEqKirSa6+9ppKSEkmSy+XS9OnTlZubq5iYGEVFRenhhx9WamrqJd3BAwAAOr+AbzMuKSnRmDFjWrRnZ2dr7dq1kqQXXnhB+fn5+vTTT9WvXz8tXLhQkydP9vU9c+aMHnnkEW3YsEGNjY1KT0/Xs88+e96PeM7FbcYAAISeQN6/L+t7UDoKAQUAgNDTYd+DAgAAEAwEFAAAYB0CCgAAsA4BBQAAWIeAAgAArENAAQAA1gnqV913Fn3mbvNb/2TRxA6qBACAqxMzKAAAwDoEFAAAYB0CCgAAsA4BBQAAWIeAAgAArENAAQAA1iGgAAAA6xBQAACAdQgoAADAOgQUAABgHQIKAACwDgEFAABYh4ACAACsQ0ABAADWIaAAAADrEFAAAIB1CCgAAMA6BBQAAGAdAgoAALAOAQUAAFiHgAIAAKxDQAEAANYhoAAAAOsQUAAAgHUIKAAAwDoEFAAAYB0CCgAAsA4BBQAAWCfggLJr1y5NmjRJCQkJcjgc2rJly3n7/vu//7scDoeWL1/u137y5EllZWUpKipK0dHRmj59uurr6wMtBQAAdFIBB5SGhgYNHjxYBQUFF+y3efNm7d69WwkJCS22ZWVl6dChQ9q+fbu2bt2qXbt2aebMmYGWAgAAOqnwQHcYP368xo8ff8E+n332mR5++GG9/vrrmjhxot+2w4cPq6ioSHv37tXw4cMlSStXrtSECRO0dOnSVgNNY2OjGhsbfeterzfQsgEAQAgJ+jUozc3NmjZtmh599FENHDiwxfbS0lJFR0f7wokkpaWlKSwsTGVlZa0eMz8/Xy6Xy7ckJiYGu2wAAGCRoAeUxYsXKzw8XD/5yU9a3e7xeBQbG+vXFh4erpiYGHk8nlb3ycvLU11dnW+pqqoKdtkAAMAiAX/EcyHl5eX61a9+pX379snhcATtuE6nU06nM2jHAwAAdgvqDMr//M//qKamRklJSQoPD1d4eLiOHTumRx55RH369JEkud1u1dTU+O335Zdf6uTJk3K73cEsBwAAhKigzqBMmzZNaWlpfm3p6emaNm2aHnjgAUlSamqqamtrVV5ermHDhkmSduzYoebmZqWkpASzHAAAEKICDij19fU6evSob72yslIHDhxQTEyMkpKS1LNnT7/+Xbt2ldvtVr9+/SRJAwYM0Lhx4zRjxgwVFhaqqalJOTk5yszMbPUOHgAAcPUJ+COe9957T0OHDtXQoUMlSbm5uRo6dKjmz59/ycdYt26d+vfvr7Fjx2rChAkaNWqUnnvuuUBLAQAAnVTAMyijR4+WMeaS+3/yySct2mJiYrR+/fpAHxoAAFwl+C0eAABgHQIKAACwDgEFAABYh4ACAACsQ0ABAADWIaAAAADrEFAAAIB1CCgAAMA6BBQAAGAdAgoAALAOAQUAAFiHgAIAAKxDQAEAANYhoAAAAOsQUAAAgHUIKAAAwDoEFAAAYB0CCgAAsA4BBQAAWIeAAgAArENAAQAA1iGgAAAA6xBQAACAdQgoAADAOgQUAABgHQIKAACwDgEFAABYh4ACAACsQ0ABAADWIaAAAADrEFAAAIB1CCgAAMA6BBQAAGAdAgoAALBOwAFl165dmjRpkhISEuRwOLRlyxbftqamJj3++OMaNGiQunfvroSEBH3/+9/XiRMn/I5x8uRJZWVlKSoqStHR0Zo+fbrq6+svezAAAKBzCDigNDQ0aPDgwSooKGix7fTp09q3b5/mzZunffv26ZVXXlFFRYW+853v+PXLysrSoUOHtH37dm3dulW7du3SzJkz2z4KAADQqTiMMabNOzsc2rx5szIyMs7bZ+/evRoxYoSOHTumpKQkHT58WDfeeKP27t2r4cOHS5KKioo0YcIEffrpp0pISLjo43q9XrlcLtXV1SkqKqqt5Z9Xn7nb/NY/WTQx6I8BAMDVJpD373a/BqWurk4Oh0PR0dGSpNLSUkVHR/vCiSSlpaUpLCxMZWVlrR6jsbFRXq/XbwEAAJ1XuwaUM2fO6PHHH9d9993nS0oej0exsbF+/cLDwxUTEyOPx9PqcfLz8+VyuXxLYmJie5YNAAA6WLsFlKamJt1zzz0yxmjVqlWXday8vDzV1dX5lqqqqiBVCQAAbBTeHgf9KpwcO3ZMO3bs8Pucye12q6amxq//l19+qZMnT8rtdrd6PKfTKafT2R6lAgAACwV9BuWrcHLkyBG9+eab6tmzp9/21NRU1dbWqry83Ne2Y8cONTc3KyUlJdjlAACAEBTwDEp9fb2OHj3qW6+srNSBAwcUExOj+Ph4ffe739W+ffu0detWnT171nddSUxMjCIiIjRgwACNGzdOM2bMUGFhoZqampSTk6PMzMxLuoMHAAB0fgEHlPfee09jxozxrefm5kqSsrOz9bOf/Ux/+MMfJElDhgzx2++tt97S6NGjJUnr1q1TTk6Oxo4dq7CwME2dOlUrVqxo4xAAAEBnE3BAGT16tC701SmX8rUqMTExWr9+faAPDQAArhL8Fg8AALAOAQUAAFiHgAIAAKxDQAEAANYhoAAAAOsQUAAAgHUIKAAAwDoEFAAAYB0CCgAAsA4BBQAAWIeAAgAArENAAQAA1iGgAAAA6xBQAACAdQgoAADAOgQUAABgHQIKAACwDgEFAABYh4ACAACsQ0ABAADWIaAAAADrEFAAAIB1CCgAAMA6BBQAAGAdAgoAALAOAQUAAFiHgAIAAKxDQAEAANYhoAAAAOsQUAAAgHUIKAAAwDoEFAAAYB0CCgAAsA4BBQAAWIeAAgAArBNwQNm1a5cmTZqkhIQEORwObdmyxW+7MUbz589XfHy8unXrprS0NB05csSvz8mTJ5WVlaWoqChFR0dr+vTpqq+vv6yBAACAziPggNLQ0KDBgweroKCg1e1LlizRihUrVFhYqLKyMnXv3l3p6ek6c+aMr09WVpYOHTqk7du3a+vWrdq1a5dmzpzZ9lEAAIBOJTzQHcaPH6/x48e3us0Yo+XLl+uJJ57Q5MmTJUkvvfSS4uLitGXLFmVmZurw4cMqKirS3r17NXz4cEnSypUrNWHCBC1dulQJCQmXMRwAANAZBPUalMrKSnk8HqWlpfnaXC6XUlJSVFpaKkkqLS1VdHS0L5xIUlpamsLCwlRWVtbqcRsbG+X1ev0WAADQeQU1oHg8HklSXFycX3tcXJxvm8fjUWxsrN/28PBwxcTE+PqcKz8/Xy6Xy7ckJiYGs2wAAGCZkLiLJy8vT3V1db6lqqqqo0sCAADtKKgBxe12S5Kqq6v92qurq33b3G63ampq/LZ/+eWXOnnypK/PuZxOp6KiovwWAADQeQU1oCQnJ8vtdqu4uNjX5vV6VVZWptTUVElSamqqamtrVV5e7uuzY8cONTc3KyUlJZjlAACAEBXwXTz19fU6evSob72yslIHDhxQTEyMkpKSNHv2bD399NPq27evkpOTNW/ePCUkJCgjI0OSNGDAAI0bN04zZsxQYWGhmpqalJOTo8zMTO7gAQAAktoQUN577z2NGTPGt56bmytJys7O1tq1a/XYY4+poaFBM2fOVG1trUaNGqWioiJFRkb69lm3bp1ycnI0duxYhYWFaerUqVqxYkUQhgMAADoDhzHGdHQRgfJ6vXK5XKqrq2uX61H6zN3mt/7JoolBfwwAAK42gbx/h8RdPAAA4OpCQAEAANYhoAAAAOsQUAAAgHUIKAAAwDoEFAAAYB0CCgAAsA4BBQAAWIeAAgAArENAAQAA1iGgAAAA6xBQAACAdQgoAADAOgQUAABgHQIKAACwDgEFAABYh4ACAACsQ0ABAADWIaAAAADrEFAAAIB1wju6AISePnO3+a1/smhiB1UCAOismEEBAADWIaAAAADrEFAAAIB1CCgAAMA6BBQAAGAdAgoAALAOAQUAAFiHgAIAAKxDQAEAANYhoAAAAOsQUAAAgHUIKAAAwDoEFAAAYB0CCgAAsE7QA8rZs2c1b948JScnq1u3brr++uv11FNPyRjj62OM0fz58xUfH69u3bopLS1NR44cCXYpAAAgRAU9oCxevFirVq3Sr3/9ax0+fFiLFy/WkiVLtHLlSl+fJUuWaMWKFSosLFRZWZm6d++u9PR0nTlzJtjlAACAEBQe7AO+++67mjx5siZOnChJ6tOnjzZs2KA9e/ZI+sfsyfLly/XEE09o8uTJkqSXXnpJcXFx2rJlizIzM1scs7GxUY2Njb51r9cb7LIBAIBFgj6DMnLkSBUXF+ujjz6SJP3v//6v3n77bY0fP16SVFlZKY/Ho7S0NN8+LpdLKSkpKi0tbfWY+fn5crlcviUxMTHYZQMAAIsEfQZl7ty58nq96t+/v7p06aKzZ8/q5z//ubKysiRJHo9HkhQXF+e3X1xcnG/bufLy8pSbm+tb93q9hBQAADqxoAeUl19+WevWrdP69es1cOBAHThwQLNnz1ZCQoKys7PbdEyn0ymn0xnkSgEAgK2CHlAeffRRzZ0713ctyaBBg3Ts2DHl5+crOztbbrdbklRdXa34+HjfftXV1RoyZEiwywEAACEo6NegnD59WmFh/oft0qWLmpubJUnJyclyu90qLi72bfd6vSorK1NqamqwywEAACEo6DMokyZN0s9//nMlJSVp4MCB2r9/v5555hn98Ic/lCQ5HA7Nnj1bTz/9tPr27avk5GTNmzdPCQkJysjICHY5AAAgBAU9oKxcuVLz5s3Tj3/8Y9XU1CghIUE/+tGPNH/+fF+fxx57TA0NDZo5c6Zqa2s1atQoFRUVKTIyMtjlAACAEOQw//wVryHC6/XK5XKprq5OUVFRQT9+n7nb/NY/WTQx6I8Rynh+AABtEcj7N7/FAwAArENAAQAA1iGgAAAA6xBQAACAdQgoAADAOgQUAABgHQIKAACwDgEFAABYJ+jfJAt0tHO/SE7iy+QAINQwgwIAAKxDQAEAANYhoAAAAOsQUAAAgHUIKAAAwDoEFAAAYB0CCgAAsA4BBQAAWIeAAgAArENAAQAA1iGgAAAA6xBQAACAdQgoAADAOgQUAABgHQIKAACwDgEFAABYh4ACAACsQ0ABAADWIaAAAADrEFAAAIB1wju6AFw5feZu81v/ZNHEDqoEAIALYwYFAABYh4ACAACsQ0ABAADWIaAAAADrEFAAAIB12iWgfPbZZ7r//vvVs2dPdevWTYMGDdJ7773n226M0fz58xUfH69u3bopLS1NR44caY9SAABACAp6QPn73/+u22+/XV27dtWf/vQnffDBB/rP//xPXXPNNb4+S5Ys0YoVK1RYWKiysjJ1795d6enpOnPmTLDLAQAAISjo34OyePFiJSYmas2aNb625ORk378bY7R8+XI98cQTmjx5siTppZdeUlxcnLZs2aLMzMwWx2xsbFRjY6Nv3ev1BrtsAABgkaDPoPzhD3/Q8OHD9b3vfU+xsbEaOnSonn/+ed/2yspKeTwepaWl+dpcLpdSUlJUWlra6jHz8/Plcrl8S2JiYrDLBgAAFgl6QPnzn/+sVatWqW/fvnr99df10EMP6Sc/+YlefPFFSZLH45EkxcXF+e0XFxfn23auvLw81dXV+Zaqqqpglw0AACwS9I94mpubNXz4cP3iF7+QJA0dOlQHDx5UYWGhsrOz23RMp9Mpp9MZzDIBAIDFgj6DEh8frxtvvNGvbcCAATp+/Lgkye12S5Kqq6v9+lRXV/u2AQCAq1vQA8rtt9+uiooKv7aPPvpIvXv3lvSPC2bdbreKi4t9271er8rKypSamhrscgAAQAgK+kc8c+bM0ciRI/WLX/xC99xzj/bs2aPnnntOzz33nCTJ4XBo9uzZevrpp9W3b18lJydr3rx5SkhIUEZGRrDLAQAAISjoAeXWW2/V5s2blZeXpyeffFLJyclavny5srKyfH0ee+wxNTQ0aObMmaqtrdWoUaNUVFSkyMjIYJcDAABCUNADiiTdfffduvvuu8+73eFw6Mknn9STTz7ZHg8PAABCHL/FAwAArENAAQAA1iGgAAAA6xBQAACAdQgoAADAOgQUAABgHQIKAACwDgEFAABYh4ACAACsQ0ABAADWIaAAAADrEFAAAIB1CCgAAMA6BBQAAGAdAgoAALAOAQUAAFiHgAIAAKxDQAEAANYhoAAAAOsQUAAAgHUIKAAAwDoEFAAAYJ3wji4AV68+c7f5rX+yaGIHVQIAsA0zKAAAwDoEFAAAYB0CCgAAsA4BBQAAWIeAAgAArENAAQAA1iGgAAAA6xBQAACAdfiitk6CLz0DAHQmzKAAAADrEFAAAIB12j2gLFq0SA6HQ7Nnz/a1nTlzRrNmzVLPnj319a9/XVOnTlV1dXV7lwIAAEJEuwaUvXv36je/+Y1uvvlmv/Y5c+botdde06ZNm7Rz506dOHFCU6ZMac9SAABACGm3gFJfX6+srCw9//zzuuaaa3ztdXV1Wr16tZ555hl9+9vf1rBhw7RmzRq9++672r17d3uVAwAAQki7BZRZs2Zp4sSJSktL82svLy9XU1OTX3v//v2VlJSk0tLSVo/V2Ngor9frtwAAgM6rXW4z3rhxo/bt26e9e/e22ObxeBQREaHo6Gi/9ri4OHk8nlaPl5+fr4ULF7ZHqQAAwEJBn0GpqqrST3/6U61bt06RkZFBOWZeXp7q6up8S1VVVVCOCwAA7BT0gFJeXq6amhrdcsstCg8PV3h4uHbu3KkVK1YoPDxccXFx+uKLL1RbW+u3X3V1tdxud6vHdDqdioqK8lsAAEDnFfSPeMaOHav333/fr+2BBx5Q//799fjjjysxMVFdu3ZVcXGxpk6dKkmqqKjQ8ePHlZqaGuxyAABACAp6QOnRo4duuukmv7bu3burZ8+evvbp06crNzdXMTExioqK0sMPP6zU1FTddtttwS4HAACEoA75LZ5ly5YpLCxMU6dOVWNjo9LT0/Xss892RCkAAMBCVySglJSU+K1HRkaqoKBABQUFV+LhAQBAiOG3eAAAgHUIKAAAwDodcg0KAtNn7ja/9U8WTewUjwUAwPkwgwIAAKzDDIplzp3BAADgasQMCgAAsA4BBQAAWIeAAgAArENAAQAA1uEiWeAK4PZtAAgMMygAAMA6BBQAAGAdAgoAALAOAQUAAFiHgAIAAKxDQAEAANYhoAAAAOsQUAAAgHUIKAAAwDoEFAAAYB2+6h4IwLlfWS/xtfUA0B6YQQEAANYhoAAAAOvwEU8Ha+0jAwAArnbMoAAAAOswgwLAOlyMDIAZFAAAYB0CCgAAsA4BBQAAWIeAAgAArENAAQAA1iGgAAAA6xBQAACAdQgoAADAOnxRG9rFuV+0xZdsAQACEfQZlPz8fN16663q0aOHYmNjlZGRoYqKCr8+Z86c0axZs9SzZ099/etf19SpU1VdXR3sUgAAQIgKekDZuXOnZs2apd27d2v79u1qamrSXXfdpYaGBl+fOXPm6LXXXtOmTZu0c+dOnThxQlOmTAl2KQAAIEQF/SOeoqIiv/W1a9cqNjZW5eXl+ta3vqW6ujqtXr1a69ev17e//W1J0po1azRgwADt3r1bt912W7BLAgAAIabdL5Ktq6uTJMXExEiSysvL1dTUpLS0NF+f/v37KykpSaWlpa0eo7GxUV6v128BAACdV7teJNvc3KzZs2fr9ttv10033SRJ8ng8ioiIUHR0tF/fuLg4eTyeVo+Tn5+vhQsXtmepsAC/YAsA+Eq7zqDMmjVLBw8e1MaNGy/rOHl5eaqrq/MtVVVVQaoQAADYqN1mUHJycrR161bt2rVL3/jGN3ztbrdbX3zxhWpra/1mUaqrq+V2u1s9ltPplNPpbK9Sr5jWZggAAEBLQZ9BMcYoJydHmzdv1o4dO5ScnOy3fdiwYeratauKi4t9bRUVFTp+/LhSU1ODXQ4AAAhBQZ9BmTVrltavX69XX31VPXr08F1X4nK51K1bN7lcLk2fPl25ubmKiYlRVFSUHn74YaWmpnIHDwAAkNQOAWXVqlWSpNGjR/u1r1mzRj/4wQ8kScuWLVNYWJimTp2qxsZGpaen69lnnw12KQAAIEQFPaAYYy7aJzIyUgUFBSooKAj2wwMAgE6AHwsEAADWIaAAAADr8GvGQAjhV6IBXC2YQQEAANYhoAAAAOsQUAAAgHW4BqWT4mv1AQChjBkUAABgHQIKAACwDh/xwGpX8rba1j4W4zZeAOgYzKAAAADrEFAAAIB1CCgAAMA6BBQAAGAdAgoAALAOd/HggvjCNwBAR2AGBQAAWIeAAgAArMNHPEAnxxfQAQhFzKAAAADrMIOCqxYXAAOAvZhBAQAA1mEGBbhMV/IHDQHgasEMCgAAsA4BBQAAWIeAAgAArENAAQAA1uEi2XbEbawAALQNMygAAMA6zKAAlriStytzazQA2zGDAgAArMMMSgji2hYEGz8oePl4DoHgYgYFAABYh4ACAACsw0c8QRKKH7tcyZpD8fm52nEhLS4Hrx9crg6dQSkoKFCfPn0UGRmplJQU7dmzpyPLAQAAluiwGZTf/e53ys3NVWFhoVJSUrR8+XKlp6eroqJCsbGxHVUWcEV0lhmlq+X/koN1Aaxtx7ma8JxdmI3PT4cFlGeeeUYzZszQAw88IEkqLCzUtm3b9MILL2ju3Ll+fRsbG9XY2Ohbr6urkyR5vd52qa258bTf+qU8zrn7XE1ae37a6/lo67loa43n7teWfS51v7Yc50q+NoNVz6W41HN4pVxKPcHqE6x6Olp7vTbaKhSes450pZ6fr45pjLl4Z9MBGhsbTZcuXczmzZv92r///e+b73znOy36L1iwwEhiYWFhYWFh6QRLVVXVRbNCh8yg/PWvf9XZs2cVFxfn1x4XF6cPP/ywRf+8vDzl5ub61pubm3Xy5En17NlTDocjqLV5vV4lJiaqqqpKUVFRQT22DRhf6OvsY+zs45M6/xgZX+hrrzEaY3Tq1CklJCRctG9I3MXjdDrldDr92qKjo9v1MaOiojrtC09ifJ1BZx9jZx+f1PnHyPhCX3uM0eVyXVK/DrmLp1evXurSpYuqq6v92qurq+V2uzuiJAAAYJEOCSgREREaNmyYiouLfW3Nzc0qLi5WampqR5QEAAAs0mEf8eTm5io7O1vDhw/XiBEjtHz5cjU0NPju6ukoTqdTCxYsaPGRUmfB+EJfZx9jZx+f1PnHyPhCnw1jdBhzKff6tI9f//rX+uUvfymPx6MhQ4ZoxYoVSklJ6ahyAACAJTo0oAAAALSGHwsEAADWIaAAAADrEFAAAIB1CCgAAMA6nT6gFBQUqE+fPoqMjFRKSor27Nlzwf6bNm1S//79FRkZqUGDBumPf/yj33ZjjObPn6/4+Hh169ZNaWlpOnLkSHsO4aICGePzzz+vb37zm7rmmmt0zTXXKC0trUX/H/zgB3I4HH7LuHHj2nsY5xXI+NauXdui9sjISL8+tp3DQMY3evToFuNzOByaOPH//9VRm87frl27NGnSJCUkJMjhcGjLli0X3aekpES33HKLnE6n/vVf/1Vr165t0SfQv+v2FOgYX3nlFd1555269tprFRUVpdTUVL3++ut+fX72s5+1OIf9+/dvx1GcX6DjKykpafU16vF4/PqF8jls7W/M4XBo4MCBvj62nMP8/Hzdeuut6tGjh2JjY5WRkaGKioqL7mfDe2GnDii/+93vlJubqwULFmjfvn0aPHiw0tPTVVNT02r/d999V/fdd5+mT5+u/fv3KyMjQxkZGTp48KCvz5IlS7RixQoVFhaqrKxM3bt3V3p6us6cOXOlhuUn0DGWlJTovvvu01tvvaXS0lIlJibqrrvu0meffebXb9y4cfrLX/7iWzZs2HAlhtNCoOOT/vHVzP9c+7Fjx/y223QOAx3fK6+84je2gwcPqkuXLvre977n18+W89fQ0KDBgweroKDgkvpXVlZq4sSJGjNmjA4cOKDZs2frwQcf9HsDb8troj0FOsZdu3bpzjvv1B//+EeVl5drzJgxmjRpkvbv3+/Xb+DAgX7n8O23326P8i8q0PF9paKiwq/+2NhY37ZQP4e/+tWv/MZWVVWlmJiYFn+HNpzDnTt3atasWdq9e7e2b9+upqYm3XXXXWpoaDjvPta8F17uLxPbbMSIEWbWrFm+9bNnz5qEhASTn5/fav977rnHTJw40a8tJSXF/OhHPzLGGNPc3Gzcbrf55S9/6dteW1trnE6n2bBhQzuM4OICHeO5vvzyS9OjRw/z4osv+tqys7PN5MmTg11qmwQ6vjVr1hiXy3Xe49l2Di/3/C1btsz06NHD1NfX+9psOn//TFKLXzA/12OPPWYGDhzo13bvvfea9PR03/rlPmft6VLG2Jobb7zRLFy40Le+YMECM3jw4OAVFiSXMr633nrLSDJ///vfz9uns53DzZs3G4fDYT755BNfm63nsKamxkgyO3fuPG8fW94LO+0MyhdffKHy8nKlpaX52sLCwpSWlqbS0tJW9yktLfXrL0np6em+/pWVlfJ4PH59XC6XUlJSznvM9tSWMZ7r9OnTampqUkxMjF97SUmJYmNj1a9fPz300EP629/+FtTaL0Vbx1dfX6/evXsrMTFRkydP1qFDh3zbbDqHwTh/q1evVmZmprp37+7XbsP5a4uL/Q0G4zmzTXNzs06dOtXib/DIkSNKSEjQddddp6ysLB0/fryDKmybIUOGKD4+XnfeeafeeecdX3tnPIerV69WWlqaevfu7ddu4zmsq6uTpBavt39my3thpw0of/3rX3X27FnFxcX5tcfFxbX4LPQrHo/ngv2/+mcgx2xPbRnjuR5//HElJCT4vdDGjRunl156ScXFxVq8eLF27typ8ePH6+zZs0Gt/2LaMr5+/frphRde0Kuvvqr/+q//UnNzs0aOHKlPP/1Ukl3n8HLP3549e3Tw4EE9+OCDfu22nL+2ON/foNfr1eeffx6U17xtli5dqvr6et1zzz2+tpSUFK1du1ZFRUVatWqVKisr9c1vflOnTp3qwEovTXx8vAoLC/X73/9ev//975WYmKjRo0dr3759koLz3y2bnDhxQn/6059a/B3aeA6bm5s1e/Zs3X777brpppvO28+W98IO+y0edLxFixZp48aNKikp8buQNDMz0/fvgwYN0s0336zrr79eJSUlGjt2bEeUeslSU1P9fnBy5MiRGjBggH7zm9/oqaee6sDKgm/16tUaNGiQRowY4dceyufvarN+/XotXLhQr776qt81GuPHj/f9+80336yUlBT17t1bL7/8sqZPn94RpV6yfv36qV+/fr71kSNH6uOPP9ayZcv029/+tgMrax8vvviioqOjlZGR4ddu4zmcNWuWDh482GHXMwWq086g9OrVS126dFF1dbVfe3V1tdxud6v7uN3uC/b/6p+BHLM9tWWMX1m6dKkWLVqkN954QzfffPMF+1533XXq1auXjh49etk1B+JyxveVrl27aujQob7abTqHlzO+hoYGbdy48ZL+Q9dR568tzvc3GBUVpW7dugXlNWGLjRs36sEHH9TLL7/cYjr9XNHR0brhhhtC4hy2ZsSIEb7aO9M5NMbohRde0LRp0xQREXHBvh19DnNycrR161a99dZb+sY3vnHBvra8F3bagBIREaFhw4apuLjY19bc3Kzi4mK//8P+Z6mpqX79JWn79u2+/snJyXK73X59vF6vysrKznvM9tSWMUr/uPr6qaeeUlFRkYYPH37Rx/n000/1t7/9TfHx8UGp+1K1dXz/7OzZs3r//fd9tdt0Di9nfJs2bVJjY6Puv//+iz5OR52/trjY32AwXhM22LBhgx544AFt2LDB7xbx86mvr9fHH38cEuewNQcOHPDV3lnOofSPO2SOHj16Sf+j0FHn0BijnJwcbd68WTt27FBycvJF97HmvTBol9taaOPGjcbpdJq1a9eaDz74wMycOdNER0cbj8djjDFm2rRpZu7cub7+77zzjgkPDzdLly41hw8fNgsWLDBdu3Y177//vq/PokWLTHR0tHn11VfN//3f/5nJkyeb5ORk8/nnn1/x8RkT+BgXLVpkIiIizH//93+bv/zlL77l1KlTxhhjTp06Zf7jP/7DlJaWmsrKSvPmm2+aW265xfTt29ecOXPG+vEtXLjQvP766+bjjz825eXlJjMz00RGRppDhw75+th0DgMd31dGjRpl7r333hbttp2/U6dOmf3795v9+/cbSeaZZ54x+/fvN8eOHTPGGDN37lwzbdo0X/8///nP5mtf+5p59NFHzeHDh01BQYHp0qWLKSoq8vW52HN2pQU6xnXr1pnw8HBTUFDg9zdYW1vr6/PII4+YkpISU1lZad555x2TlpZmevXqZWpqaqwf37Jly8yWLVvMkSNHzPvvv29++tOfmrCwMPPmm2/6+oT6OfzK/fffb1JSUlo9pi3n8KGHHjIul8uUlJT4vd5Onz7t62Pre2GnDijGGLNy5UqTlJRkIiIizIgRI8zu3bt92+644w6TnZ3t1//ll182N9xwg4mIiDADBw4027Zt89ve3Nxs5s2bZ+Li4ozT6TRjx441FRUVV2Io5xXIGHv37m0ktVgWLFhgjDHm9OnT5q677jLXXnut6dq1q+ndu7eZMWNGh/2Hw5jAxjd79mxf37i4ODNhwgSzb98+v+PZdg4DfY1++OGHRpJ54403WhzLtvP31S2n5y5fjSk7O9vccccdLfYZMmSIiYiIMNddd51Zs2ZNi+Ne6Dm70gId4x133HHB/sb849bq+Ph4ExERYf7lX/7F3Hvvvebo0aNXdmD/T6DjW7x4sbn++utNZGSkiYmJMaNHjzY7duxocdxQPofG/OO22m7dupnnnnuu1WPacg5bG5ckv78rW98LHf9vAAAAANbotNegAACA0EVAAQAA1iGgAAAA6xBQAACAdQgoAADAOgQUAABgHQIKAACwDgEFAABYh4ACAACsQ0ABAADWIaAAAADr/H+5D692aSfKOAAAAABJRU5ErkJggg==",
      "text/plain": [
       "<Figure size 640x480 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "plt.hist(results_df[\"WER_scores\"], bins=100)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "id": "5fb0d414",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.2928571428571428"
      ]
     },
     "execution_count": 40,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.percentile(results_df[\"WER_scores\"], 50)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "evo",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.18"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
