{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "f1013317",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "[nltk_data] Downloading package cmudict to /home/XXXXXX/nltk_data...\n",
      "[nltk_data]   Package cmudict is already up-to-date!\n"
     ]
    }
   ],
   "source": [
    "import pickle\n",
    "from torch.nn.utils.rnn import pad_sequence\n",
    "from torch.utils.data import DataLoader\n",
    "import torch\n",
    "from dataset import SpeechSentenceDataset, idsToPhonemes, getDatasetLoaders, PHONE_DEF, PHONE_DEF_SIL\n",
    "import re \n",
    "from g2p_en import G2p\n",
    "import numpy as np\n",
    "from model.ctc_modelling import LightningGRUDecoder\n",
    "import time\n",
    "import numpy as np\n",
    "from edit_distance import SequenceMatcher\n",
    "import tqdm\n",
    "import pytorch_lightning as pl\n",
    "import jiwer\n",
    "import nltk\n",
    "from nltk.corpus import cmudict\n",
    "from pytorch_lightning.loggers import WandbLogger\n",
    "import wandb\n",
    "from pytorch_lightning.callbacks import ModelCheckpoint, EarlyStopping\n",
    "import copy\n",
    "from difflib import get_close_matches\n",
    "from transformers import GPT2LMHeadModel, GPT2Config, GPT2Tokenizer\n",
    "import pandas as pd\n",
    "from torchaudio.models.decoder import ctc_decoder\n",
    "import string\n",
    "from config import DATASET_SM_ROBUST, DATASET_SM_ZSCORE\n",
    "import os\n",
    "# from model.ctc_modelling import Light\n",
    "\n",
    "# Download CMU Pronouncing Dictionary (First-time use)\n",
    "nltk.download(\"cmudict\")\n",
    "\n",
    "# Load CMUdict\n",
    "cmu_dict = cmudict.dict()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "c9719402",
   "metadata": {},
   "outputs": [],
   "source": [
    "train_loader, test_loader,_, loadedData = getDatasetLoaders(DATASET_SM_ZSCORE, 64)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "a2dc1e06",
   "metadata": {},
   "outputs": [],
   "source": [
    "nInputFeatures = 256 #channels \n",
    "nClasses = 40 \n",
    "dropout = 0.4 \n",
    "hidden_dim = 1024\n",
    "nlayers = 5\n",
    "stride_len = 4\n",
    "kernel_len =32\n",
    "gaussian_smooth_width = 2\n",
    "bidirectional = True\n",
    "\n",
    "white_noise_SD = 0.8\n",
    "constant_offset_SD = 0.2\n",
    "seq_len = 150\n",
    "max_time_series_len = 12000\n",
    "\n",
    "lr_start = 1e-4\n",
    "lr_end = 1e-5\n",
    "l2_decay = 1e-5\n",
    "\n",
    "\n",
    "warmup_epoch = 5\n",
    "steps_per_epoch = len(train_loader)\n",
    "warmup_steps = warmup_epoch * steps_per_epoch\n",
    "\n",
    "target_epoch = 60\n",
    "total_steps = target_epoch * steps_per_epoch\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "fb37744b",
   "metadata": {},
   "outputs": [],
   "source": [
    "output_name = \"gru_ctc\"\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "b83a12fe",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/XXXXXX/anaconda3/envs/evo/lib/python3.9/site-packages/torch/functional.py:534: UserWarning: torch.meshgrid: in an upcoming release, it will be required to pass the indexing argument. (Triggered internally at ../aten/src/ATen/native/TensorShape.cpp:3595.)\n",
      "  return _VF.meshgrid(tensors, **kwargs)  # type: ignore[attr-defined]\n",
      "GPU available: True (cuda), used: True\n",
      "TPU available: False, using: 0 TPU cores\n",
      "HPU available: False, using: 0 HPUs\n",
      "You are using a CUDA device ('NVIDIA H100 80GB HBM3') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision\n",
      "\u001b[34m\u001b[1mwandb\u001b[0m: Currently logged in as: \u001b[33mXXXXXXXXXXXXXX\u001b[0m. Use \u001b[1m`wandb login --relogin`\u001b[0m to force relogin\n",
      "\u001b[34m\u001b[1mwandb\u001b[0m: Using wandb-core as the SDK backend.  Please refer to https://wandb.me/wandb-core for more information.\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "Tracking run with wandb version 0.19.4"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/html": [
       "Run data is saved locally in <code>./wandb/run-20250515_085136-5ml9qn9j</code>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/html": [
       "Syncing run <strong><a href='https://wandb.ai/XXXXXXXXXXXXXX/ECOG_Sentence_dataset/runs/5ml9qn9j' target=\"_blank\">GRU_CTC</a></strong> to <a href='https://wandb.ai/XXXXXXXXXXXXXX/ECOG_Sentence_dataset' target=\"_blank\">Weights & Biases</a> (<a href='https://wandb.me/developer-guide' target=\"_blank\">docs</a>)<br>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/html": [
       " View project at <a href='https://wandb.ai/XXXXXXXXXXXXXX/ECOG_Sentence_dataset' target=\"_blank\">https://wandb.ai/XXXXXXXXXXXXXX/ECOG_Sentence_dataset</a>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/html": [
       " View run at <a href='https://wandb.ai/XXXXXXXXXXXXXX/ECOG_Sentence_dataset/runs/5ml9qn9j' target=\"_blank\">https://wandb.ai/XXXXXXXXXXXXXX/ECOG_Sentence_dataset/runs/5ml9qn9j</a>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1,2]\n",
      "\n",
      "  | Name                   | Type              | Params | Mode \n",
      "---------------------------------------------------------------------\n",
      "0 | inputLayerNonlinearity | Softsign          | 0      | train\n",
      "1 | unfolder               | Unfold            | 0      | train\n",
      "2 | gaussianSmoother       | GaussianSmoothing | 0      | train\n",
      "3 | gru_decoder            | GRU               | 132 M  | train\n",
      "4 | fc_decoder_out         | Linear            | 84.0 K | train\n",
      "5 | ctc_loss               | CTCLoss           | 0      | train\n",
      "  | other params           | n/a               | 1.6 M  | n/a  \n",
      "---------------------------------------------------------------------\n",
      "133 M     Trainable params\n",
      "0         Non-trainable params\n",
      "133 M     Total params\n",
      "535.380   Total estimated model params size (MB)\n",
      "6         Modules in train mode\n",
      "0         Modules in eval mode\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "c32a2e4625d740e0abe950771fbfc46a",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Sanity Checking: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/XXXXXX/anaconda3/envs/evo/lib/python3.9/site-packages/pytorch_lightning/trainer/connectors/data_connector.py:425: The 'val_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=63` in the `DataLoader` to improve performance.\n",
      "/data/XXXXXX/speech_decoding_BCI/augmentations.py:91: UserWarning: Using padding='same' with even kernel lengths and odd dilation may require a zero-padded copy of the input be created (Triggered internally at ../aten/src/ATen/native/Convolution.cpp:1036.)\n",
      "  return self.conv(input, weight=self.weight, groups=self.groups, padding=\"same\")\n",
      "/home/XXXXXX/anaconda3/envs/evo/lib/python3.9/site-packages/pytorch_lightning/utilities/data.py:79: Trying to infer the `batch_size` from an ambiguous collection. The batch size we found is 64. To avoid any miscalculations, use `self.log(..., batch_size=batch_size)`.\n",
      "/home/XXXXXX/anaconda3/envs/evo/lib/python3.9/site-packages/pytorch_lightning/trainer/connectors/data_connector.py:425: The 'train_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=63` in the `DataLoader` to improve performance.\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "81a56f45b120419983fd82fc128eb0a5",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Training: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/XXXXXX/anaconda3/envs/evo/lib/python3.9/site-packages/pytorch_lightning/utilities/data.py:79: Trying to infer the `batch_size` from an ambiguous collection. The batch size we found is 32. To avoid any miscalculations, use `self.log(..., batch_size=batch_size)`.\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "e89b127185c64c9581ecfe74903aa59a",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/XXXXXX/anaconda3/envs/evo/lib/python3.9/site-packages/pytorch_lightning/utilities/data.py:79: Trying to infer the `batch_size` from an ambiguous collection. The batch size we found is 48. To avoid any miscalculations, use `self.log(..., batch_size=batch_size)`.\n",
      "Metric val_loss improved. New best score: 2.010\n",
      "Epoch 0, global step 138: 'val_loss' reached 2.01020 (best 2.01020), saving model to '/data/XXXXXX/speech_decoding_BCI/.checkpoints/gru_ctc/best_model.ckpt' as top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "cd6e80c2337a47da9209bc2bf1e83db8",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Metric val_loss improved by 0.482 >= min_delta = 0.0. New best score: 1.528\n",
      "Epoch 1, global step 276: 'val_loss' reached 1.52797 (best 1.52797), saving model to '/data/XXXXXX/speech_decoding_BCI/.checkpoints/gru_ctc/best_model.ckpt' as top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "e5473ae6de7f4406873b8c235209ca04",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Metric val_loss improved by 0.237 >= min_delta = 0.0. New best score: 1.291\n",
      "Epoch 2, global step 414: 'val_loss' reached 1.29128 (best 1.29128), saving model to '/data/XXXXXX/speech_decoding_BCI/.checkpoints/gru_ctc/best_model.ckpt' as top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "9ab07273db644a2597a0b792d0cc49d9",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Metric val_loss improved by 0.135 >= min_delta = 0.0. New best score: 1.156\n",
      "Epoch 3, global step 552: 'val_loss' reached 1.15638 (best 1.15638), saving model to '/data/XXXXXX/speech_decoding_BCI/.checkpoints/gru_ctc/best_model.ckpt' as top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "6a8edbed6cf24c839e5b81a48a5b13a4",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Metric val_loss improved by 0.091 >= min_delta = 0.0. New best score: 1.066\n",
      "Epoch 4, global step 690: 'val_loss' reached 1.06576 (best 1.06576), saving model to '/data/XXXXXX/speech_decoding_BCI/.checkpoints/gru_ctc/best_model.ckpt' as top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "3c0c354d09cf40f897ab6f005492bca2",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Metric val_loss improved by 0.081 >= min_delta = 0.0. New best score: 0.984\n",
      "Epoch 5, global step 828: 'val_loss' reached 0.98430 (best 0.98430), saving model to '/data/XXXXXX/speech_decoding_BCI/.checkpoints/gru_ctc/best_model.ckpt' as top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "e15be2a55b144602b23e9642de524433",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Metric val_loss improved by 0.046 >= min_delta = 0.0. New best score: 0.938\n",
      "Epoch 6, global step 966: 'val_loss' reached 0.93836 (best 0.93836), saving model to '/data/XXXXXX/speech_decoding_BCI/.checkpoints/gru_ctc/best_model.ckpt' as top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "88a7a3477fe14c0b8cda93328d890563",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Metric val_loss improved by 0.050 >= min_delta = 0.0. New best score: 0.888\n",
      "Epoch 7, global step 1104: 'val_loss' reached 0.88809 (best 0.88809), saving model to '/data/XXXXXX/speech_decoding_BCI/.checkpoints/gru_ctc/best_model.ckpt' as top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "abdb49c14845416c9ccbcd0f2dd713c9",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Metric val_loss improved by 0.030 >= min_delta = 0.0. New best score: 0.858\n",
      "Epoch 8, global step 1242: 'val_loss' reached 0.85797 (best 0.85797), saving model to '/data/XXXXXX/speech_decoding_BCI/.checkpoints/gru_ctc/best_model.ckpt' as top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "a74a61624c3d4bde9c6155e542108fa0",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Metric val_loss improved by 0.016 >= min_delta = 0.0. New best score: 0.842\n",
      "Epoch 9, global step 1380: 'val_loss' reached 0.84230 (best 0.84230), saving model to '/data/XXXXXX/speech_decoding_BCI/.checkpoints/gru_ctc/best_model.ckpt' as top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "76b70bcda39b44a98b9564ce442a4615",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Metric val_loss improved by 0.023 >= min_delta = 0.0. New best score: 0.820\n",
      "Epoch 10, global step 1518: 'val_loss' reached 0.81950 (best 0.81950), saving model to '/data/XXXXXX/speech_decoding_BCI/.checkpoints/gru_ctc/best_model.ckpt' as top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "37846c1e69f74dc4b52cb08efe1ddca3",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Metric val_loss improved by 0.008 >= min_delta = 0.0. New best score: 0.812\n",
      "Epoch 11, global step 1656: 'val_loss' reached 0.81186 (best 0.81186), saving model to '/data/XXXXXX/speech_decoding_BCI/.checkpoints/gru_ctc/best_model.ckpt' as top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "2e958287b34b4b198ed4fbbb488e4e08",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Metric val_loss improved by 0.029 >= min_delta = 0.0. New best score: 0.782\n",
      "Epoch 12, global step 1794: 'val_loss' reached 0.78248 (best 0.78248), saving model to '/data/XXXXXX/speech_decoding_BCI/.checkpoints/gru_ctc/best_model.ckpt' as top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "4e4dfe55d5d4440f8a131310ad378a19",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Metric val_loss improved by 0.007 >= min_delta = 0.0. New best score: 0.775\n",
      "Epoch 13, global step 1932: 'val_loss' reached 0.77506 (best 0.77506), saving model to '/data/XXXXXX/speech_decoding_BCI/.checkpoints/gru_ctc/best_model.ckpt' as top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "3b2de83c6b09427fb74dd0bb8690aee2",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Epoch 14, global step 2070: 'val_loss' was not in top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "e7e9d5c842f04cb2ac9d686982347175",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Metric val_loss improved by 0.015 >= min_delta = 0.0. New best score: 0.760\n",
      "Epoch 15, global step 2208: 'val_loss' reached 0.75980 (best 0.75980), saving model to '/data/XXXXXX/speech_decoding_BCI/.checkpoints/gru_ctc/best_model.ckpt' as top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "4b820bc6bec143529515019d6e4f7f18",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Epoch 16, global step 2346: 'val_loss' was not in top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "048939d79a0a4caab45ac270fc263f35",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Epoch 17, global step 2484: 'val_loss' was not in top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "64eb67de55f5430abc2fefb0b16c5bbd",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Metric val_loss improved by 0.012 >= min_delta = 0.0. New best score: 0.748\n",
      "Epoch 18, global step 2622: 'val_loss' reached 0.74766 (best 0.74766), saving model to '/data/XXXXXX/speech_decoding_BCI/.checkpoints/gru_ctc/best_model.ckpt' as top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "a3305e914f564dbfb35db24c8cdeb8eb",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Epoch 19, global step 2760: 'val_loss' was not in top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "c330d548eb6e4b7797d91af55377ed53",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Epoch 20, global step 2898: 'val_loss' was not in top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "46f7fd75f6fa4347bfcc53209dc8a921",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Epoch 21, global step 3036: 'val_loss' was not in top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "1081c93fbc094f5482cc8e12e0aa54c0",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Epoch 22, global step 3174: 'val_loss' was not in top 1\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "280558ae16d04d389983d3694827cf5b",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Validation: |          | 0/? [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Monitored metric val_loss did not improve in the last 5 records. Best score: 0.748. Signaling Trainer to stop.\n",
      "Epoch 23, global step 3312: 'val_loss' was not in top 1\n"
     ]
    },
    {
     "data": {
      "text/html": [],
      "text/plain": [
       "<IPython.core.display.HTML object>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/html": [
       "<br>    <style><br>        .wandb-row {<br>            display: flex;<br>            flex-direction: row;<br>            flex-wrap: wrap;<br>            justify-content: flex-start;<br>            width: 100%;<br>        }<br>        .wandb-col {<br>            display: flex;<br>            flex-direction: column;<br>            flex-basis: 100%;<br>            flex: 1;<br>            padding: 10px;<br>        }<br>    </style><br><div class=\"wandb-row\"><div class=\"wandb-col\"><h3>Run history:</h3><br/><table class=\"wandb\"><tr><td>epoch</td><td>▁▁▁▁▁▁▂▂▂▂▃▃▃▃▃▃▃▃▄▄▄▄▄▄▄▅▅▆▆▆▆▆▆▆▆▇▇▇██</td></tr><tr><td>train_loss_epoch</td><td>█▅▄▄▃▃▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁</td></tr><tr><td>train_loss_step</td><td>█▇▅▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁</td></tr><tr><td>trainer/global_step</td><td>▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███</td></tr><tr><td>val_CER</td><td>█▅▄▃▃▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁</td></tr><tr><td>val_loss</td><td>█▅▄▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁</td></tr></table><br/></div><div class=\"wandb-col\"><h3>Run summary:</h3><br/><table class=\"wandb\"><tr><td>epoch</td><td>23</td></tr><tr><td>train_loss_epoch</td><td>0.25766</td></tr><tr><td>train_loss_step</td><td>0.27079</td></tr><tr><td>trainer/global_step</td><td>3311</td></tr><tr><td>val_CER</td><td>0.18522</td></tr><tr><td>val_loss</td><td>0.75747</td></tr></table><br/></div></div>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/html": [
       " View run <strong style=\"color:#cdcd00\">GRU_CTC</strong> at: <a href='https://wandb.ai/XXXXXXXXXXXXXX/ECOG_Sentence_dataset/runs/5ml9qn9j' target=\"_blank\">https://wandb.ai/XXXXXXXXXXXXXX/ECOG_Sentence_dataset/runs/5ml9qn9j</a><br> View project at: <a href='https://wandb.ai/XXXXXXXXXXXXXX/ECOG_Sentence_dataset' target=\"_blank\">https://wandb.ai/XXXXXXXXXXXXXX/ECOG_Sentence_dataset</a><br>Synced 8 W&B file(s), 0 media file(s), 3 artifact file(s) and 0 other file(s)"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/html": [
       "Find logs at: <code>./wandb/run-20250515_085136-5ml9qn9j/logs</code>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "model = LightningGRUDecoder(\n",
    "            neural_dim=nInputFeatures,\n",
    "            n_classes=nClasses,\n",
    "            hidden_dim=hidden_dim,\n",
    "            layer_dim=nlayers,\n",
    "            strideLen=stride_len,\n",
    "            kernelLen=kernel_len,\n",
    "            gaussianSmoothWidth=gaussian_smooth_width,\n",
    "            bidirectional=bidirectional,\n",
    "            dropout=dropout,\n",
    "            white_noise_SD=white_noise_SD,\n",
    "            constant_offset_SD=constant_offset_SD,\n",
    "            weight_decay=l2_decay,\n",
    "            learning_rate=lr_start)\n",
    "\n",
    "wandb_logger = WandbLogger(project=\"ECOG_Sentence_dataset\", name=f\"GRU_CTC\",\n",
    "                            reinit=True)\n",
    "\n",
    "# Define ModelCheckpoint to save the best model based on validation loss\n",
    "checkpoint_callback = ModelCheckpoint(\n",
    "    monitor=\"val_loss\",  # Ensure your validation step logs \"val_loss\"\n",
    "    mode=\"min\",          # Save the model with the lowest validation loss\n",
    "    save_top_k=1,        # Keep only the best model\n",
    "    dirpath=f\".checkpoints/{output_name}/\",  # Directory to save checkpoints\n",
    "    filename=f\"best_model\",  # Model filename\n",
    "    verbose=True\n",
    ")\n",
    "\n",
    "# Define EarlyStopping callback with patience of 3 epochs\n",
    "early_stopping_callback = EarlyStopping(\n",
    "    monitor=\"val_loss\",\n",
    "    patience=5,   # Stop training if no improvement in 3 epochs\n",
    "    mode=\"min\",\n",
    "    verbose=True\n",
    ")\n",
    "\n",
    "\n",
    "# Train model\n",
    "trainer = pl.Trainer(max_epochs=60,devices =[0], callbacks=[checkpoint_callback, early_stopping_callback], logger=wandb_logger)\n",
    "\n",
    "trainer.fit(model, train_loader, test_loader)\n",
    "\n",
    "#reload state_dict of best model\n",
    "# model.load_state_dict(torch.load(f\".checkpoints/robust_sm_gru_ctc/best_model.ckpt\")[\"state_dict\"])\n",
    "\n",
    "\n",
    "# close wandb logger\n",
    "wandb.finish()\n"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "6ddd9bd0",
   "metadata": {},
   "source": [
    "## Evaluation"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "a43de8ab",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "LightningGRUDecoder(\n",
       "  (inputLayerNonlinearity): Softsign()\n",
       "  (unfolder): Unfold(kernel_size=(32, 1), dilation=1, padding=0, stride=4)\n",
       "  (gaussianSmoother): GaussianSmoothing()\n",
       "  (gru_decoder): GRU(8192, 1024, num_layers=5, batch_first=True, dropout=0.4, bidirectional=True)\n",
       "  (fc_decoder_out): Linear(in_features=2048, out_features=41, bias=True)\n",
       "  (ctc_loss): CTCLoss()\n",
       ")"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "device = \"cuda:1\"\n",
    "model.to(device)\n",
    "model.train()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "15e3dd71",
   "metadata": {},
   "outputs": [],
   "source": [
    "tokens = [\"<blank>\"] + PHONE_DEF + [\" \"]\n",
    "decoder = ctc_decoder(tokens= tokens,   \n",
    "                      lexicon=None,  \n",
    "                      blank_token = '<blank>', \n",
    "                      sil_token = ' ',\n",
    "                      )"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "55953441",
   "metadata": {},
   "outputs": [],
   "source": [
    "def decode_ctc_output(logits):\n",
    "    \"\"\"\n",
    "    Converts model logits to predicted phoneme sequences.\n",
    "    - Removes repeated phonemes.\n",
    "    - Removes blank tokens (0).\n",
    "    \"\"\"\n",
    "\n",
    "    predictions = torch.argmax(logits, dim=-1)  # Get most probable phoneme indices\n",
    "    predictions = [torch.unique_consecutive(seq[seq != 0]).cpu().numpy() for seq in predictions]  # Remove blanks\n",
    "    return predictions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "13f45c26",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 14/14 [00:27<00:00,  1.94s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Character Error Rate (CER): 19.32%\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n"
     ]
    }
   ],
   "source": [
    "best_models =[model]\n",
    "\n",
    "# Run inference on test set\n",
    "all_pred_phonemes = []\n",
    "all_true_phonemes = []\n",
    "all_decoded_phonemes_ensemble = []\n",
    "all_true_texts = []\n",
    "cer_list = []\n",
    "day_indices =[]\n",
    "\n",
    "with torch.no_grad():\n",
    "    for X, y, X_len, y_len,days, transcriptions in tqdm.tqdm(test_loader):\n",
    "\n",
    "        # Move data to device\n",
    "        X = X.to(device)\n",
    "        y = y.to(device)\n",
    "\n",
    "        day_indices.append(days)\n",
    "        days = days.to(device)\n",
    "        X_len = X_len.to(device)\n",
    "        y_len = y_len.to(device)\n",
    "\n",
    "        all_decoded_phonemes_ensemble_tmp = []\n",
    "        logits_ensemble = []\n",
    "        for model in best_models:\n",
    "            model.eval()\n",
    "\n",
    "            logits = model(X,days)\n",
    "            decoded = decoder(torch.nn.functional.log_softmax(logits, dim=-1).cpu())\n",
    "            all_decoded_phonemes_ensemble_tmp.append(decoded)\n",
    "            logits_ensemble.append(logits)\n",
    "        \n",
    "        all_decoded_phonemes_ensemble.append(all_decoded_phonemes_ensemble_tmp)\n",
    "\n",
    "        # Get model predictions\n",
    "        # pred = torch.median(torch.stack(logits_ensemble),0).values\n",
    "        pred = torch.mean(torch.stack(logits_ensemble),0)\n",
    "        # Compute CER (Phoneme Error Rate)\n",
    "        total_edit_distance, total_seq_length = 0, 0\n",
    "        for i in range(pred.shape[0]):\n",
    "            decodedSeq = torch.argmax(pred[i, : int(X_len[i] / model.strideLen), :], dim=-1)\n",
    "            decodedSeq = torch.unique_consecutive(decodedSeq, dim=-1)\n",
    "            decodedSeq = decodedSeq[decodedSeq != 0].cpu().numpy()\n",
    "\n",
    "            trueSeq = y[i][:y_len[i]].cpu().numpy()\n",
    "            matcher = SequenceMatcher(a=trueSeq.tolist(), b=decodedSeq.tolist())\n",
    "            total_edit_distance += matcher.distance()\n",
    "            total_seq_length += len(trueSeq)\n",
    "\n",
    "            cer = total_edit_distance / total_seq_length if total_seq_length > 0 else 1.0\n",
    "            cer_list.append(cer)\n",
    "        log_probs = torch.nn.functional.log_softmax(logits, dim=-1)  # Convert to log probabilities\n",
    "\n",
    "        # Decode predicted phonemes\n",
    "        pred_phonemes = decode_ctc_output(log_probs)\n",
    "        all_pred_phonemes.extend(pred_phonemes)\n",
    "        all_true_phonemes.extend([y[i][:y_len[i]].cpu().numpy() for i in range(len(y))])\n",
    "\n",
    "        # Store transcriptions\n",
    "        all_true_texts.extend(transcriptions)\n",
    "        # Convert predicted phonemes to words (Placeholder: Replace with actual phoneme-to-text conversion)\n",
    "\n",
    "# Compute CER & WER\n",
    "cer = np.mean(cer_list)\n",
    "\n",
    "# Print final results\n",
    "print(f\"Character Error Rate (CER): {cer * 100:.2f}%\") \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "68244d09",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 14/14 [00:30<00:00,  2.19s/it]\n"
     ]
    }
   ],
   "source": [
    "## predit all teh test set \n",
    "pred_phonemes = []\n",
    "pred_logits = []\n",
    "true_phonemes = []\n",
    "true_sentences = []\n",
    "day_indices = []\n",
    "cer_list = []\n",
    "\n",
    "with torch.no_grad():\n",
    "    for X, y, X_len, y_len,days, transcriptions in tqdm.tqdm(test_loader):\n",
    "        # Move data to device\n",
    "        X = X.to(device)\n",
    "        y = y.to(device)\n",
    "\n",
    "        day_indices.append(days)\n",
    "        days = days.to(device)\n",
    "        X_len = X_len.to(device)\n",
    "        y_len = y_len.to(device)\n",
    "\n",
    "        logits = model(X,days)\n",
    "        pred = torch.nn.functional.log_softmax(logits, dim=-1).cpu()\n",
    "        decoded = decoder(pred)\n",
    "        pred_logits.append(pred)\n",
    "\n",
    "        total_edit_distance, total_seq_length = 0, 0\n",
    "\n",
    "        for i in range(pred.shape[0]):\n",
    "            decodedSeq = torch.argmax(pred[i, : int(X_len[i] / model.strideLen), :], dim=-1)\n",
    "            decodedSeq = torch.unique_consecutive(decodedSeq, dim=-1)\n",
    "            decodedSeq = decodedSeq[decodedSeq != 0].cpu().numpy()\n",
    "\n",
    "            trueSeq = y[i][:y_len[i]].cpu().numpy()\n",
    "            matcher = SequenceMatcher(a=trueSeq.tolist(), b=decodedSeq.tolist())\n",
    "            total_edit_distance += matcher.distance()\n",
    "            total_seq_length += len(trueSeq)\n",
    "\n",
    "            cer = total_edit_distance / total_seq_length if total_seq_length > 0 else 1.0\n",
    "            cer_list.append(cer)\n",
    "        \n",
    "        \n",
    "        true_phonemes.extend([y[i][:y_len[i]].cpu().numpy() for i in range(len(y))])\n",
    "\n",
    "        pp = decode_ctc_output(pred)\n",
    "\n",
    "        pred_phonemes.extend(pp)\n",
    "        true_sentences.extend(transcriptions)\n",
    "\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "80bd7295",
   "metadata": {},
   "outputs": [],
   "source": [
    "def compute_accuracy(preds, targets):\n",
    "    \n",
    "\n",
    "    accs= []\n",
    "    for pred, target in zip(preds, targets):\n",
    "        \n",
    "        #truncate to the length of the shortest sequence\n",
    "        min_len = min(len(pred), len(target))\n",
    "\n",
    "\n",
    "        pred = pred[:min_len]\n",
    "        target = target[:min_len]\n",
    "\n",
    "        equal_inference = (pred == target)\n",
    "        acc = np.sum(equal_inference)/ len(pred)\n",
    "        accs.append(acc)\n",
    "\n",
    "    return np.mean(accs)\n",
    "   \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "a796af7a",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "overall_acc 0.5155072171243137\n"
     ]
    }
   ],
   "source": [
    "overall_acc = compute_accuracy(pred_phonemes, true_phonemes)\n",
    "print(\"overall_acc\", overall_acc)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "29053a08",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Range of Accuracy per day 0.20219025390956072 0.695663519683872\n"
     ]
    }
   ],
   "source": [
    "day_indices_flat = [item.item() for sublist in day_indices for item in sublist]\n",
    "\n",
    "\n",
    "#compute accuracy per day by selecting indices of the same day\n",
    "day_accs = []\n",
    "for day_index in set(day_indices_flat):\n",
    "    indices = [idx for idx, day in enumerate(day_indices_flat) if day == day_index]\n",
    "    acc = compute_accuracy([pred_phonemes[idx] for idx in indices], [true_phonemes[idx] for idx in indices])\n",
    "    day_accs.append(acc)\n",
    "\n",
    "day_accs\n",
    "print(\"Range of Accuracy per day\", min(day_accs), max(day_accs))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "b47ef28a",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Range of CER per day 0.13472513121077995 0.39956984205390644\n"
     ]
    }
   ],
   "source": [
    "cer_list_per_day = []\n",
    "for day_index in set(day_indices_flat):\n",
    "    indices = [idx for idx, day in enumerate(day_indices_flat) if day == day_index]\n",
    "    cer_list_per_day.append(np.array(cer_list)[indices].mean())\n",
    "\n",
    "cer_list_per_day\n",
    "\n",
    "print(\"Range of CER per day\", min(cer_list_per_day), max(cer_list_per_day))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "7b299ddc",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Average lenght diff: -10.661363636363637 +- 7.507654152114933\n"
     ]
    }
   ],
   "source": [
    "diffs = []\n",
    "for i in range(len(true_phonemes)):\n",
    "    true = true_phonemes[i]\n",
    "    pred = pred_phonemes[i]\n",
    "    diffs.append(np.array(len(true)) - np.array(len(pred)))\n",
    "\n",
    "print(f\"Average lenght diff: {np.mean(diffs)} +- {np.std(diffs)}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "ec649ac4",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Range of diff lenghts per day: -16.225 - -0.3\n"
     ]
    }
   ],
   "source": [
    "## compute diff lenghts per day\n",
    "diffs_per_day = []\n",
    "for day_index in set(day_indices_flat):\n",
    "    indices = [idx for idx, day in enumerate(day_indices_flat) if day == day_index]\n",
    "    diffs_per_day.append(np.array(diffs)[indices].mean())\n",
    "\n",
    "diffs_per_day\n",
    "print(f\"Range of diff lenghts per day: {min(diffs_per_day)} - {max(diffs_per_day)}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "b02b0ad0",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Decoded phonemes:\n",
      "['SH', 'IH', 'AA', 'K', 'AH', 'S', 'SIL', 'R', 'IH', 'K', 'AA', 'N', 'T', 'D', 'ER', 'SIL', 'D', 'IH']\n",
      "Target phonemes:\n",
      "['TH', 'IY', 'AA', 'K', 'R', 'AH', 'S', 'IY', 'SIL', 'R', 'IY', 'K', 'AH', 'N', 'S', 'IH', 'D', 'ER', 'D', 'SIL']\n",
      "Target sentence\n",
      "Theocracy reconsidered.\n",
      "\n",
      "Decoded phonemes:\n",
      "['R', 'EY', 'S', 'SIL', 'P', 'OY', 'CH', 'IH', 'T', 'SIL', 'S', 'EH', 'V', 'AH', 'L', 'SIL', 'S', 'AE', 'N', 'D', 'SIL', 'L', 'IH', 'TH', 'AH', 'F', 'SIL', 'D', 'EH']\n",
      "Target phonemes:\n",
      "['R', 'IH', 'CH', 'SIL', 'P', 'ER', 'CH', 'AH', 'S', 'T', 'SIL', 'S', 'EH', 'V', 'R', 'AH', 'L', 'SIL', 'S', 'AY', 'N', 'D', 'SIL', 'L', 'IH', 'TH', 'AH', 'G', 'R', 'AE', 'F', 'S', 'SIL']\n",
      "Target sentence\n",
      "Rich purchased several signed lithographs.\n",
      "\n",
      "Decoded phonemes:\n",
      "['S', 'OW', 'SIL', 'R', 'IH', 'L', 'SIL', 'B', 'IY', 'SIL', 'M', 'EY', 'D', 'SIL', 'IH', 'N', 'SIL', 'IH', 'N', 'D', 'AH', 'V', 'AE', 'SH', 'T', 'SIL', 'K', 'AH', 'L', 'UW', 'ZH', 'AH', 'N', 'SIL', 'D', 'IH', 'IY']\n",
      "Target phonemes:\n",
      "['S', 'OW', 'SIL', 'R', 'UW', 'L', 'Z', 'SIL', 'W', 'IY', 'SIL', 'M', 'EY', 'D', 'SIL', 'IH', 'N', 'SIL', 'AH', 'N', 'AH', 'B', 'AE', 'SH', 'T', 'SIL', 'K', 'AH', 'L', 'UW', 'ZH', 'AH', 'N', 'SIL']\n",
      "Target sentence\n",
      "So rules we made, in unabashed collusion.\n",
      "\n",
      "Decoded phonemes:\n",
      "['K', 'R', 'AO', 'R', 'IY', 'Z', 'SIL', 'K', 'AW', 'S', 'HH', 'AH', 'M', 'SIL', 'N', 'IY', 'D', 'Z', 'SIL', 'B', 'EY', 'K', 'SIL', 'L', 'AH', 'V', 'Z', 'SIL', 'UW', 'Z', 'SIL', 'B', 'IY', 'SIL', 'S', 'AH', 'M', 'P', 'IY', 'T', 'IY', 'SIL', 'AE', 'L', 'AH', 'N', 'D', 'SIL', 'D', 'AH', 'EH', 'IY']\n",
      "Target phonemes:\n",
      "['L', 'AO', 'R', 'IY', 'Z', 'SIL', 'K', 'AA', 'S', 'T', 'UW', 'M', 'SIL', 'N', 'IY', 'D', 'AH', 'D', 'SIL', 'B', 'L', 'AE', 'K', 'SIL', 'G', 'L', 'AH', 'V', 'Z', 'SIL', 'T', 'UW', 'SIL', 'B', 'IY', 'SIL', 'K', 'AH', 'M', 'P', 'L', 'IY', 'T', 'L', 'IY', 'SIL', 'EH', 'L', 'AH', 'G', 'AH', 'N', 'T', 'SIL']\n",
      "Target sentence\n",
      "Lori's costume needed black gloves to be completely elegant.\n",
      "\n",
      "Decoded phonemes:\n",
      "['DH', 'AH', 'SIL', 'S', 'UW', 'TH', 'SIL', 'V', 'EH', 'R', 'IY', 'SIL', 'R', 'IH', 'AA', 'T', 'AH', 'SIL', 'T', 'UW', 'SIL', 'K', 'AH', 'M', 'SIL', 'F', 'R', 'AE', 'N', 'SIL', 'R', 'EH', 'JH', 'ER', 'Z', 'SIL', 'TH', 'ER', 'TH', 'SIL', 'F', 'V', 'AE', 'T', 'SIL', 'AW', 'T', 'SIL', 'D', 'AH', 'IY']\n",
      "Target phonemes:\n",
      "['DH', 'AH', 'SIL', 'T', 'UW', 'TH', 'SIL', 'F', 'EH', 'R', 'IY', 'SIL', 'F', 'ER', 'G', 'AA', 'T', 'SIL', 'T', 'UW', 'SIL', 'K', 'AH', 'M', 'SIL', 'W', 'EH', 'N', 'SIL', 'R', 'AA', 'JH', 'ER', 'Z', 'SIL', 'T', 'UW', 'TH', 'SIL', 'F', 'EH', 'L', 'SIL', 'AW', 'T', 'SIL']\n",
      "Target sentence\n",
      "The tooth fairy forgot to come when Roger's tooth fell out.\n",
      "\n",
      "Decoded phonemes:\n",
      "['DH', 'AE', 'T', 'SIL', 'T', 'IH', 'NG', 'IH', 'NG', 'SIL', 'B', 'IH', 'P', 'SIL', 'P', 'ER', 'SIL', 'W', 'AA', 'Z', 'SIL', 'K', 'OW', 'Z', 'SIL', 'B', 'AH', 'SIL', 'R', 'AY', 'D', 'IH', 'D', 'SIL', 'S', 'P', 'IY', 'P', 'S', 'ER', 'SIL', 'AY', 'Z', 'SIL', 'L', 'IH', 'SH', 'AH', 'N', 'SIL', 'D']\n",
      "Target phonemes:\n",
      "['DH', 'AE', 'T', 'SIL', 'S', 'T', 'IH', 'NG', 'IH', 'NG', 'SIL', 'V', 'EY', 'P', 'ER', 'SIL', 'W', 'AA', 'Z', 'SIL', 'K', 'AA', 'Z', 'D', 'SIL', 'B', 'AY', 'SIL', 'K', 'L', 'AO', 'R', 'AY', 'D', 'SIL', 'V', 'EY', 'P', 'ER', 'AH', 'Z', 'EY', 'SH', 'AH', 'N', 'SIL']\n",
      "Target sentence\n",
      "That stinging vapor was caused by chloride vaporization.\n",
      "\n",
      "Decoded phonemes:\n",
      "['B', 'OY', 'S', 'SIL', 'S', 'F', 'AO', 'R', 'SIL', 'TH', 'ER', 'Z', 'IY', 'SIL', 'K', 'AH', 'T', 'AE', 'M', 'SIL', 'B', 'IH', 'EH', 'R', 'SIL', 'EH', 'V', 'ER', 'SIL', 'F', 'ER', 'M', 'Y', 'L', 'ER', 'SIL', 'D', 'AH', 'EH', 'IY']\n",
      "Target phonemes:\n",
      "['B', 'IH', 'F', 'AO', 'R', 'SIL', 'TH', 'ER', 'Z', 'D', 'IY', 'Z', 'SIL', 'IH', 'G', 'Z', 'AE', 'M', 'SIL', 'R', 'IY', 'V', 'Y', 'UW', 'SIL', 'EH', 'V', 'ER', 'IY', 'SIL', 'F', 'AO', 'R', 'M', 'Y', 'AH', 'L', 'AH', 'SIL']\n",
      "Target sentence\n",
      "Before Thursday's exam, review every formula.\n",
      "\n",
      "Decoded phonemes:\n",
      "['G', 'AE', 'L', 'D', 'AA', 'R', 'SIL', 'D', 'UW', 'SIL', 'T', 'AH', 'N', 'D', 'AH', 'SIL', 'HH', 'IH', 'Z', 'SIL', 'P', 'OW', 'R', 'K', 'T', 'SIL', 'D', 'EH', 'S', 'EH']\n",
      "Target phonemes:\n",
      "['W', 'AY', 'L', 'D', 'F', 'AY', 'ER', 'SIL', 'N', 'IH', 'R', 'SIL', 'S', 'AH', 'N', 'SH', 'AY', 'N', 'SIL', 'F', 'AO', 'R', 'S', 'IH', 'Z', 'SIL', 'P', 'AA', 'R', 'K', 'SIL', 'K', 'L', 'OW', 'ZH', 'ER', 'Z', 'SIL']\n",
      "Target sentence\n",
      "Wildfire near Sunshine forces park closures.\n",
      "\n",
      "Decoded phonemes:\n",
      "['DH', 'AH', 'SIL', 'W', 'UH', 'AH', 'N', 'D', 'SIL', 'M', 'EY', 'N', 'SIL', 'IH', 'T', 'SIL', 'W', 'ER', 'N', 'T', 'SIL', 'B', 'IH', 'L', 'SIL', 'AH', 'W', 'EY', 'SIL', 'Y', 'IH', 'Z', 'AH', 'L', 'IY', 'SIL', 'N', 'AY', 'IH', 'NG', 'SIL', 'D', 'EH', 'S', 'SIL', 'D', 'EH', 'IY']\n",
      "Target phonemes:\n",
      "['DH', 'AH', 'SIL', 'W', 'ER', 'D', 'SIL', 'M', 'IY', 'N', 'Z', 'SIL', 'IH', 'T', 'SIL', 'W', 'OW', 'N', 'T', 'SIL', 'B', 'OY', 'L', 'SIL', 'AH', 'W', 'EY', 'SIL', 'IY', 'Z', 'AH', 'L', 'IY', 'SIL', 'N', 'AH', 'TH', 'IH', 'NG', 'SIL', 'EH', 'L', 'S', 'SIL']\n",
      "Target sentence\n",
      "The word means it won't boil away easily, nothing else.\n",
      "\n",
      "Decoded phonemes:\n",
      "['W', 'UH', 'T', 'SIL', 'AH', 'SIL', 'B', 'OW', 'L', 'TH', 'SIL', 'S', 'IH', 'Z', 'IY', 'ER', 'SIL', 'IH', 'N', 'SIL', 'AH', 'SIL', 'M', 'AE', 'N', 'Z', 'SIL', 'HH', 'EY', 'D', 'SIL', 'B', 'IH', 'K', 'SIL', 'HH', 'IH', 'M', 'SIL', 'AH', 'P', 'AH', 'T', 'SIL', 'OW', 'L', 'SIL', 'D', 'IY', 'SIL', 'D', 'IH', 'IY']\n",
      "Target phonemes:\n",
      "['W', 'UH', 'D', 'SIL', 'AH', 'SIL', 'B', 'L', 'UW', 'SIL', 'F', 'EH', 'DH', 'ER', 'SIL', 'IH', 'N', 'SIL', 'AH', 'SIL', 'M', 'AE', 'N', 'Z', 'SIL', 'HH', 'AE', 'T', 'SIL', 'M', 'EY', 'K', 'SIL', 'HH', 'IH', 'M', 'SIL', 'HH', 'AE', 'P', 'IY', 'SIL', 'AO', 'L', 'SIL', 'D', 'EY', 'SIL']\n",
      "Target sentence\n",
      "Would a blue feather in a man's hat make him happy all day?\n",
      "\n",
      "Decoded phonemes:\n",
      "['HH', 'IY', 'SIL', 'CH', 'AH', 'K', 'SIL', 'AH', 'B', 'AW', 'T', 'SIL', 'IH', 'N', 'SIL', 'AH', 'TH', 'AE', 'D', 'IH', 'K', 'SIL', 'T', 'R', 'OY', 'L', 'AY', 'N', 'SIL', 'Y', 'ER', 'SIL', 'D', 'AH', 'IH']\n",
      "Target phonemes:\n",
      "['HH', 'IY', 'SIL', 'T', 'AO', 'K', 'T', 'SIL', 'AH', 'B', 'AW', 'T', 'SIL', 'AH', 'N', 'AO', 'TH', 'EH', 'N', 'T', 'IH', 'K', 'SIL', 'S', 'T', 'AO', 'R', 'IY', 'L', 'AY', 'N', 'Z', 'SIL', 'T', 'UW', 'SIL']\n",
      "Target sentence\n",
      "He talked about unauthentic storylines too.\n",
      "\n",
      "Decoded phonemes:\n",
      "['P', 'R', 'AA', 'S', 'T', 'SIL', 'JH', 'AH', 'NG', 'SIL', 'W', 'AE', 'Z', 'SIL', 'ER', 'L', 'IY', 'SIL', 'EH', 'V', 'ER', 'IY', 'SIL', 'M', 'AO', 'N', 'IH', 'NG', 'SIL', 'D', 'EH', 'IY']\n",
      "Target phonemes:\n",
      "['M', 'OW', 'S', 'T', 'SIL', 'Y', 'AH', 'NG', 'SIL', 'R', 'AY', 'Z', 'SIL', 'ER', 'L', 'IY', 'SIL', 'EH', 'V', 'ER', 'IY', 'SIL', 'M', 'AO', 'R', 'N', 'IH', 'NG', 'SIL']\n",
      "Target sentence\n",
      "Most young rise early every morning.\n",
      "\n",
      "Decoded phonemes:\n",
      "['W', 'IH', 'DH', 'TH', 'SIL', 'IH', 'S', 'SIL', 'N', 'AA', 'SIL', 'TH', 'OW', 'AH', 'L', 'SIL', 'K', 'IH', 'L', 'D', 'AH', 'D', 'SIL', 'K', 'AE', 'N', 'SIL', 'S', 'K', 'UW', 'AH', 'L', 'SIL', 'D', 'EH']\n",
      "Target phonemes:\n",
      "['W', 'IH', 'DH', 'SIL', 'DH', 'IH', 'S', 'SIL', 'N', 'OW', 'SIL', 'L', 'OY', 'AH', 'L', 'SIL', 'S', 'IH', 'T', 'AH', 'Z', 'AH', 'N', 'SIL', 'K', 'AE', 'N', 'SIL', 'K', 'W', 'AO', 'R', 'AH', 'L', 'SIL']\n",
      "Target sentence\n",
      "With this no loyal citizen can quarrel.\n",
      "\n",
      "Decoded phonemes:\n",
      "['P', 'M', 'EY', 'D', 'ER', 'SIL', 'T', 'AA', 'M', 'B', 'Z', 'SIL', 'HH', 'AE', 'V', 'SIL', 'AE', 'N', 'SIL', 'AH', 'P', 'B', 'IH', 'T', 'SIL', 'AE', 'D', 'AH', 'T', 'D', 'SIL', 'D', 'IH']\n",
      "Target phonemes:\n",
      "['P', 'R', 'IH', 'M', 'AH', 'T', 'IH', 'V', 'SIL', 'T', 'R', 'AY', 'B', 'Z', 'SIL', 'HH', 'AE', 'V', 'SIL', 'AE', 'N', 'SIL', 'AH', 'P', 'B', 'IY', 'T', 'SIL', 'AE', 'T', 'AH', 'T', 'UW', 'D', 'SIL']\n",
      "Target sentence\n",
      "Primitive tribes have an upbeat attitude.\n",
      "\n",
      "Decoded phonemes:\n",
      "['AH', 'N', 'D', 'SIL', 'W', 'IH', 'DH', 'SIL', 'N', 'AA', 'SIL', 'AH', 'SIL', 'JH', 'EY', 'JH', 'SIL', 'B', 'AH', 'T', 'SIL', 'AH', 'SIL', 'CH', 'EH', 'S', 'AH', 'Z', 'SIL', 'AH', 'V', 'SIL', 'DH', 'AH', 'SIL', 'P', 'OY', 'S', 'SIL', 'HH', 'ER', 'D', 'SIL', 'B', 'IH', 'D', 'SIL', 'DH', 'AH', 'SIL', 'D', 'IH', 'S', 'AH', 'N', 'SIL', 'D', 'AH', 'IY']\n",
      "Target phonemes:\n",
      "['AH', 'N', 'D', 'SIL', 'IH', 'T', 'SIL', 'W', 'AA', 'Z', 'SIL', 'N', 'AA', 'T', 'SIL', 'AH', 'SIL', 'JH', 'AH', 'JH', 'SIL', 'B', 'AH', 'T', 'SIL', 'AH', 'SIL', 'JH', 'AH', 'S', 'T', 'AH', 'S', 'SIL', 'AH', 'V', 'SIL', 'DH', 'AH', 'SIL', 'P', 'IY', 'S', 'SIL', 'HH', 'UW', 'SIL', 'M', 'EY', 'D', 'SIL', 'DH', 'AH', 'SIL', 'D', 'IH', 'S', 'IH', 'ZH', 'AH', 'N', 'SIL']\n",
      "Target sentence\n",
      "And it was not a judge, but a justice of the peace who made the decision.\n",
      "\n",
      "Decoded phonemes:\n",
      "['W', 'IY', 'SIL', 'S', 'IY', 'M', 'D', 'SIL', 'T', 'OW', 'SIL', 'B', 'IY', 'SIL', 'ER', 'N', 'AH', 'N', 'S', 'IH', 'NG', 'SIL', 'DH', 'AH', 'SIL', 'P', 'R', 'AH', 'CH', 'ER', 'L', 'EH', 'JH', 'EY', 'SH', 'AH', 'N', 'SIL', 'IH', 'M', 'S', 'P', 'L', 'OW', 'ER', 'Z', 'SIL', 'R', 'AY', 'T', 'SIL', 'IH', 'N', 'SIL', 'AA', 'R', 'SIL', 'HH', 'OW', 'N', 'SIL', 'B', 'AE', 'K', 'Z', 'SIL', 'D', 'AH']\n",
      "Target phonemes:\n",
      "['W', 'IY', 'SIL', 'S', 'IY', 'M', 'D', 'SIL', 'T', 'UW', 'SIL', 'B', 'IY', 'SIL', 'W', 'IH', 'T', 'N', 'AH', 'S', 'IH', 'NG', 'SIL', 'DH', 'AH', 'SIL', 'P', 'AA', 'P', 'Y', 'AH', 'L', 'EY', 'SH', 'AH', 'N', 'SIL', 'IH', 'K', 'S', 'P', 'L', 'OW', 'ZH', 'AH', 'N', 'SIL', 'R', 'AY', 'T', 'SIL', 'IH', 'N', 'SIL', 'AW', 'ER', 'SIL', 'OW', 'N', 'SIL', 'B', 'AE', 'K', 'Y', 'AA', 'R', 'D', 'Z', 'SIL']\n",
      "Target sentence\n",
      "We seemed to be witnessing the population explosion right in our own backyards.\n",
      "\n",
      "Decoded phonemes:\n",
      "['D', 'AH', 'M', 'B', 'R', 'AY', 'N', 'Z', 'SIL', 'D', 'IH', 'P', 'ER', 'OY', 'T', 'SIL', 'M', 'EH', 'ZH', 'ER', 'Z', 'SIL', 'K', 'AE', 'N', 'D', 'SIL', 'AO', 'L', 'S', 'SIL', 'Y', 'UW', 'SIL', 'IH', 'N', 'T', 'UW', 'HH', 'AH', 'L', 'T', 'AH', 'D', 'SIL', 'M', 'OW', 'V', 'SIL', 'F', 'IH', 'R', 'SIL', 'DH', 'S', 'SIL', 'F', 'ER', 'CH', 'ER', 'SIL', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['S', 'AH', 'M', 'T', 'AY', 'M', 'Z', 'SIL', 'D', 'EH', 'S', 'P', 'R', 'IH', 'T', 'SIL', 'M', 'EH', 'ZH', 'ER', 'Z', 'SIL', 'K', 'AE', 'N', 'SIL', 'AO', 'L', 'S', 'OW', 'SIL', 'T', 'ER', 'N', 'SIL', 'IH', 'N', 'T', 'UW', 'SIL', 'S', 'AA', 'L', 'AH', 'D', 'SIL', 'M', 'UW', 'V', 'Z', 'SIL', 'F', 'AO', 'R', 'SIL', 'DH', 'AH', 'SIL', 'F', 'Y', 'UW', 'CH', 'ER', 'SIL']\n",
      "Target sentence\n",
      "Sometimes, desperate measures can also turn into solid moves for the future.\n",
      "\n",
      "Decoded phonemes:\n",
      "['S', 'ER', 'Z', 'SIL', 'AE', 'N', 'CH', 'AH', 'Z', 'SIL', 'W', 'IH', 'L', 'SIL', 'B', 'IY', 'SIL', 'T', 'EY', 'T', 'SIL', 'V', 'AW', 'D', 'ER', 'D', 'SIL', 'IH', 'F', 'SIL', 'IH', 'F', 'SIL', 'ER', 'R', 'SIL', 'DH', 'IY', 'NG', 'K', 'SIL', 'AH', 'M', 'SIL', 'DH', 'UW', 'SIL', 'K', 'AE', 'F', 'AH', 'L', 'IY', 'SIL', 'V', 'AH', 'P', 'ER', 'S', 'SIL', 'F', 'ER', 'S', 'SIL']\n",
      "Target phonemes:\n",
      "['DH', 'OW', 'Z', 'SIL', 'AE', 'N', 'S', 'ER', 'Z', 'SIL', 'W', 'IH', 'L', 'SIL', 'B', 'IY', 'SIL', 'S', 'T', 'R', 'EY', 'T', 'F', 'AO', 'R', 'W', 'ER', 'D', 'SIL', 'IH', 'F', 'SIL', 'Y', 'UW', 'SIL', 'TH', 'IH', 'NG', 'K', 'SIL', 'DH', 'EH', 'M', 'SIL', 'TH', 'R', 'UW', 'SIL', 'K', 'EH', 'R', 'F', 'AH', 'L', 'IY', 'SIL', 'F', 'ER', 'S', 'T', 'SIL']\n",
      "Target sentence\n",
      "Those answers will be straightforward if you think them through carefully first.\n",
      "\n",
      "Decoded phonemes:\n",
      "['DH', 'IY', 'SIL', 'K', 'IY', 'SIL', 'G', 'EH', 'S', 'SIL', 'G', 'R', 'AE', 'S', 'T', 'SIL', 'F', 'EY', 'SH', 'ER', 'Z', 'SIL', 'AH', 'N', 'D', 'SIL', 'P', 'EH', 'N', 'Z', 'SIL', 'L', 'EH', 'S', 'SIL', 'EH', 'N', 'ER', 'IY', 'SIL', 'M', 'EY', 'NG', 'SIL', 'K', 'OW', 'L', 'IH', 'NG', 'SIL', 'D', 'IH', 'S', 'IH', 'ZH', 'AH', 'N', 'SIL', 'D', 'IH']\n",
      "Target phonemes:\n",
      "['SH', 'IY', 'SIL', 'G', 'EH', 'T', 'S', 'SIL', 'D', 'R', 'EH', 'S', 'T', 'SIL', 'F', 'AE', 'S', 'T', 'ER', 'SIL', 'AH', 'N', 'D', 'SIL', 'S', 'P', 'EH', 'N', 'D', 'Z', 'SIL', 'L', 'EH', 'S', 'SIL', 'EH', 'N', 'ER', 'JH', 'IY', 'SIL', 'M', 'EY', 'K', 'IH', 'NG', 'SIL', 'K', 'L', 'OW', 'DH', 'IH', 'NG', 'SIL', 'D', 'IH', 'S', 'IH', 'ZH', 'AH', 'N', 'Z', 'SIL']\n",
      "Target sentence\n",
      "She gets dressed faster and spends less energy making clothing decisions.\n",
      "\n",
      "Decoded phonemes:\n",
      "['AE', 'G', 'R', 'AA', 'AH', 'M', 'AH', 'N', 'SIL', 'AE', 'K', 'S', 'T', 'UW', 'T', 'AH', 'N', 'SIL', 'D', 'IH', 'N', 'T', 'ER', 'R', 'T', 'IY', 'Z', 'SIL', 'Y', 'AO', 'R', 'SIL', 'D', 'IH', 'P', 'L', 'M', 'ER', 'SIL', 'D', 'IH', 'IY']\n",
      "Target phonemes:\n",
      "['AE', 'K', 'AH', 'D', 'EH', 'M', 'IH', 'K', 'SIL', 'AE', 'P', 'T', 'AH', 'T', 'UW', 'D', 'SIL', 'G', 'EH', 'R', 'AH', 'N', 'T', 'IY', 'Z', 'SIL', 'Y', 'AO', 'R', 'SIL', 'D', 'IH', 'P', 'L', 'OW', 'M', 'AH', 'SIL']\n",
      "Target sentence\n",
      "Academic aptitude guarantees your diploma.\n",
      "\n",
      "Decoded phonemes:\n",
      "['T', 'UW', 'SIL', 'S', 'AH', 'SIL', 'T', 'EH', 'K', 'S', 'IH', 'NG', 'SIL', 'P', 'R', 'IY', 'D', 'EH', 'S', 'T', 'IH', 'P', 'AH', 'EY', 'SH', 'T', 'AH', 'NG', 'SIL', 'AA', 'R', 'SIL', 'K', 'IY', 'P', 'SIL', 'B', 'AY', 'SIL', 'IH', 'K', 'S', 'P', 'EH', 'SH', 'AH', 'Z', 'SIL', 'T', 'UW', 'SIL', 'G', 'R', 'OW', 'P', 'SIL', 'IH', 'N', 'V', 'AY', 'AH', 'N', 'S', 'SIL', 'D', 'AH', 'SIL', 'D', 'IY', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['T', 'UW', 'SIL', 'S', 'AH', 'M', 'SIL', 'IH', 'K', 'S', 'T', 'EH', 'N', 'T', 'SIL', 'P', 'R', 'IY', 'D', 'IH', 'S', 'P', 'AH', 'Z', 'IH', 'SH', 'AH', 'N', 'Z', 'SIL', 'AA', 'R', 'SIL', 'SH', 'EY', 'P', 'T', 'SIL', 'B', 'AY', 'SIL', 'IH', 'K', 'S', 'P', 'OW', 'ZH', 'ER', 'SIL', 'T', 'UW', 'SIL', 'G', 'R', 'UW', 'P', 'SIL', 'IH', 'N', 'V', 'AY', 'R', 'AH', 'N', 'M', 'AH', 'N', 'T', 'S', 'SIL']\n",
      "Target sentence\n",
      "To some extent predispositions are shaped by exposure to group environments.\n",
      "\n",
      "Decoded phonemes:\n",
      "['AE', 'N', 'SIL', 'IH', 'D', 'AH', 'OW', 'L', 'D', 'SIL', 'B', 'IH', 'L', 'SIL', 'R', 'IH', 'B', 'ER', 'OW', 'N', 'Z', 'SIL', 'S', 'IH', 'TH', 'SIL', 'AW', 'R', 'SIL', 'N', 'AA', 'T', 'SIL', 'T', 'UW', 'B', 'AH', 'L', 'SIL', 'F', 'AO', 'R', 'SIL', 'EY', 'T', 'IH', 'NG', 'SIL', 'D', 'EH', 'F', 'R', 'EH', 'SH', 'SIL', 'D', 'AH', 'Z', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['AE', 'N', 'SIL', 'AH', 'D', 'AH', 'L', 'T', 'SIL', 'M', 'EY', 'L', 'SIL', 'B', 'AE', 'B', 'UW', 'N', 'Z', 'SIL', 'T', 'IY', 'TH', 'SIL', 'AA', 'R', 'SIL', 'N', 'AA', 'T', 'SIL', 'S', 'UW', 'T', 'AH', 'B', 'AH', 'L', 'SIL', 'F', 'AO', 'R', 'SIL', 'IY', 'T', 'IH', 'NG', 'SIL', 'SH', 'EH', 'L', 'F', 'IH', 'SH', 'SIL']\n",
      "Target sentence\n",
      "An adult male baboon's teeth are not suitable for eating shellfish.\n",
      "\n",
      "Decoded phonemes:\n",
      "['IH', 'N', 'SIL', 'DH', 'IH', 'AH', 'SIL', 'K', 'AH', 'NG', 'G', 'L', 'EY', 'T', 'SIL', 'IY', 'T', 'SIL', 'W', 'OW', 'T', 'SIL', 'D', 'UW', 'SIL', 'W', 'EH', 'L', 'SIL', 'W', 'AO', 'R', 'SIL', 'AH', 'S', 'SIL', 'T', 'UW', 'SIL', 'P', 'IH', 'T', 'ER', 'SIL', 'IH', 'N', 'SIL', 'M', 'AY', 'N', 'SIL', 'DH', 'AH', 'SIL', 'V', 'IH', 'ZH', 'AH', 'N', 'SIL', 'AH', 'V', 'SIL', 'P', 'IY', 'S', 'SIL', 'D', 'Z', 'D', 'IH', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['IH', 'N', 'SIL', 'DH', 'IH', 'S', 'SIL', 'K', 'AA', 'N', 'T', 'EH', 'K', 'S', 'T', 'SIL', 'IH', 'T', 'SIL', 'W', 'UH', 'D', 'SIL', 'D', 'UW', 'SIL', 'W', 'EH', 'L', 'SIL', 'F', 'AO', 'R', 'SIL', 'AH', 'S', 'SIL', 'T', 'UW', 'SIL', 'B', 'EH', 'R', 'SIL', 'IH', 'N', 'SIL', 'M', 'AY', 'N', 'D', 'SIL', 'DH', 'AH', 'SIL', 'V', 'IH', 'ZH', 'AH', 'N', 'SIL', 'AH', 'V', 'SIL', 'P', 'IY', 'S', 'SIL']\n",
      "Target sentence\n",
      "In this context, it would do well for us to bear in mind the vision of peace.\n",
      "\n",
      "Decoded phonemes:\n",
      "['Y', 'UH', 'R', 'SIL', 'B', 'OY', 'L', 'IH', 'NG', 'SIL', 'M', 'IH', 'K', 'SIL', 'AE', 'N', 'D', 'UW', 'SIL', 'Y', 'UW', 'SIL', 'D', 'AH', 'S', 'Z', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['Y', 'UH', 'R', 'SIL', 'B', 'OY', 'L', 'IH', 'NG', 'SIL', 'M', 'IH', 'L', 'K', 'SIL', 'EY', 'N', 'T', 'SIL', 'Y', 'UW', 'SIL']\n",
      "Target sentence\n",
      "You're boiling milk, ain't you?\n",
      "\n",
      "Decoded phonemes:\n",
      "['W', 'IY', 'K', 'SIL', 'L', 'UH', 'K', 'SIL', 'F', 'AO', 'R', 'SIL', 'S', 'P', 'AA', 'N', 'T', 'AH', 'D', 'SIL', 'AY', 'AH', 'N', 'AH', 'Z', 'SIL', 'AH', 'N', 'D', 'SIL', 'R', 'AE', 'G', 'R', 'ER', 'Z', 'SIL', 'AA', 'N', 'SIL', 'DH', 'AH', 'SIL', 'D', 'IH', 'P', 'R', 'AA', 'R', 'IY', 'SIL', 'D', 'IH', 'S', 'SIL', 'R', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['R', 'IH', 'CH', 'SIL', 'L', 'UH', 'K', 'T', 'SIL', 'F', 'AO', 'R', 'SIL', 'S', 'P', 'AA', 'T', 'AH', 'D', 'SIL', 'HH', 'AY', 'IY', 'N', 'AH', 'Z', 'SIL', 'AH', 'N', 'D', 'SIL', 'JH', 'AE', 'G', 'W', 'AA', 'R', 'Z', 'SIL', 'AA', 'N', 'SIL', 'DH', 'AH', 'SIL', 'S', 'AH', 'F', 'AA', 'R', 'IY', 'SIL']\n",
      "Target sentence\n",
      "Rich looked for spotted hyenas and jaguars on the safari.\n",
      "\n",
      "Decoded phonemes:\n",
      "['T', 'R', 'AE', 'F', 'IH', 'AH', 'K', 'S', 'SIL', 'F', 'AH', 'R', 'AH', 'K', 'AH', 'T', 'L', 'IY', 'SIL', 'AE', 'Z', 'SIL', 'P', 'IY', 'OW', 'L', 'D', 'SIL', 'T', 'UW', 'SIL', 'M', 'EH', 'S', 'SIL', 'AA', 'B', 'SIL', 'T', 'UW', 'SIL', 'EH', 'N', 'JH', 'ER', 'IY', 'SIL', 'W', 'AO', 'T', 'ER', 'IY', 'SIL', 'EH', 'Z', 'AH', 'M', 'AH', 'N', 'T', 'S', 'SIL', 'D', 'AH', 'S', 'SIL', 'D', 'IY', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['T', 'R', 'AE', 'F', 'IH', 'K', 'SIL', 'F', 'R', 'IY', 'K', 'W', 'AH', 'N', 'T', 'L', 'IY', 'SIL', 'HH', 'AE', 'Z', 'SIL', 'F', 'EY', 'L', 'D', 'SIL', 'T', 'UW', 'SIL', 'M', 'EH', 'ZH', 'ER', 'SIL', 'AH', 'P', 'SIL', 'T', 'UW', 'SIL', 'EH', 'N', 'JH', 'AH', 'N', 'IH', 'R', 'Z', 'SIL', 'SIL', 'R', 'OW', 'Z', 'IY', 'SIL', 'EH', 'S', 'T', 'AH', 'M', 'AH', 'T', 'S', 'SIL']\n",
      "Target sentence\n",
      "Traffic frequently has failed to measure up to engineers' rosy estimates.\n",
      "\n",
      "Decoded phonemes:\n",
      "['W', 'AA', 'L', 'F', 'SIL', 'P', 'IY', 'P', 'EH', 'R', 'D', 'SIL', 'R', 'EH', 'D', 'SIL', 'T', 'EY', 'M', 'SIL', 'W', 'IH', 'DH', 'SIL', 'F', 'R', 'IH', 'SH', 'SIL', 'L', 'IY', 'M', 'AH', 'N', 'SIL', 'K', 'AY', 'Z', 'SIL', 'F', 'AO', 'R', 'SIL', 'D', 'EH', 'N', 'ER', 'SIL', 'D', 'IH', 'S', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['R', 'AE', 'L', 'F', 'SIL', 'P', 'R', 'IY', 'P', 'EH', 'R', 'D', 'SIL', 'R', 'EH', 'D', 'SIL', 'S', 'N', 'AE', 'P', 'ER', 'SIL', 'W', 'IH', 'DH', 'SIL', 'F', 'R', 'EH', 'SH', 'SIL', 'L', 'EH', 'M', 'AH', 'N', 'SIL', 'S', 'AO', 'S', 'SIL', 'F', 'AO', 'R', 'SIL', 'D', 'IH', 'N', 'ER', 'SIL']\n",
      "Target sentence\n",
      "Ralph prepared red snapper with fresh lemon sauce for dinner.\n",
      "\n",
      "Decoded phonemes:\n",
      "['IH', 'D', 'SIL', 'Y', 'UW', 'SIL', 'B', 'AY', 'SIL', 'AE', 'N', 'SIL', 'K', 'AO', 'R', 'N', 'JH', 'OY', 'SIL', 'OW', 'V', 'ER', 'OY', 'L', 'Z', 'SIL', 'D', 'IH', 'S', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['D', 'IH', 'D', 'SIL', 'Y', 'UW', 'SIL', 'B', 'AY', 'SIL', 'EH', 'N', 'IY', 'SIL', 'K', 'AO', 'R', 'D', 'ER', 'OY', 'SIL', 'OW', 'V', 'ER', 'AO', 'L', 'Z', 'SIL']\n",
      "Target sentence\n",
      "Did you buy any corduroy overalls?\n",
      "\n",
      "Decoded phonemes:\n",
      "['DH', 'EH', 'R', 'SIL', 'P', 'AH', 'N', 'SH', 'SIL', 'IH', 'Z', 'SIL', 'AH', 'P', 'IY', 'T', 'AH', 'D', 'SIL', 'D', 'IH', 'S', 'SIL', 'D', 'IY', 'SIL', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['K', 'L', 'IH', 'R', 'SIL', 'P', 'R', 'OW', 'N', 'AH', 'N', 'S', 'IY', 'EY', 'SH', 'AH', 'N', 'SIL', 'IH', 'Z', 'SIL', 'AH', 'P', 'R', 'IY', 'SH', 'IY', 'EY', 'T', 'IH', 'D', 'SIL']\n",
      "Target sentence\n",
      "Clear pronunciation is appreciated.\n",
      "\n",
      "Decoded phonemes:\n",
      "['P', 'R', 'EY', 'SIL', 'T', 'UW', 'IH', 'NG', 'SIL', 'DH', 'IH', 'S', 'SIL', 'K', 'ER', 'T', 'SIL', 'F', 'AO', 'R', 'SIL', 'CH', 'OY', 'S', 'SIL', 'D', 'AH', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['P', 'L', 'IY', 'Z', 'SIL', 'SH', 'AO', 'R', 'T', 'AH', 'N', 'SIL', 'DH', 'IH', 'S', 'SIL', 'S', 'K', 'ER', 'T', 'SIL', 'F', 'AO', 'R', 'SIL', 'JH', 'OY', 'S', 'SIL']\n",
      "Target sentence\n",
      "Please shorten this skirt for Joyce.\n",
      "\n",
      "Decoded phonemes:\n",
      "['HH', 'UW', 'SIL', 'AH', 'DH', 'TH', 'ER', 'Z', 'SIL', 'DH', 'AH', 'SIL', 'AH', 'N', 'AH', 'M', 'AA', 'D', 'SIL', 'IH', 'K', 'S', 'P', 'EH', 'N', 'T', 'S', 'SIL', 'AH', 'K', 'AW', 'N', 'T', 'SIL', 'D', 'AH', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['HH', 'UW', 'SIL', 'AO', 'TH', 'ER', 'AY', 'Z', 'D', 'SIL', 'DH', 'AH', 'SIL', 'AH', 'N', 'L', 'IH', 'M', 'AH', 'T', 'AH', 'D', 'SIL', 'IH', 'K', 'S', 'P', 'EH', 'N', 'S', 'SIL', 'AH', 'K', 'AW', 'N', 'T', 'SIL']\n",
      "Target sentence\n",
      "Who authorized the unlimited expense account?\n",
      "\n",
      "Decoded phonemes:\n",
      "['DH', 'AH', 'SIL', 'F', 'AA', 'M', 'AH', 'L', 'IY', 'SIL', 'R', 'ER', 'Z', 'SH', 'AH', 'N', 'Z', 'SIL', 'DH', 'AE', 'T', 'SIL', 'K', 'AW', 'B', 'ER', 'Z', 'SIL', 'B', 'IY', 'SIL', 'AH', 'M', 'AH', 'N', 'AH', 'T', 'SIL', 'D', 'IH', 'Z', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['DH', 'AH', 'SIL', 'F', 'AE', 'M', 'AH', 'L', 'IY', 'SIL', 'R', 'IH', 'K', 'W', 'EH', 'S', 'T', 'S', 'SIL', 'DH', 'AE', 'T', 'SIL', 'F', 'L', 'AW', 'ER', 'Z', 'SIL', 'B', 'IY', 'SIL', 'OW', 'M', 'IH', 'T', 'AH', 'D', 'SIL']\n",
      "Target sentence\n",
      "The family requests that flowers be omitted.\n",
      "\n",
      "Decoded phonemes:\n",
      "['DH', 'AH', 'SIL', 'M', 'AH', 'S', 'ZH', 'IY', 'M', 'SIL', 'HH', 'AY', 'ER', 'Z', 'SIL', 'P', 'AH', 'SH', 'AH', 'N', 'SIL', 'EH', 'V', 'ER', 'IY', 'SIL', 'IY', 'V', 'N', 'IH', 'N', 'T', 'SIL', 'D', 'IH', 'Z', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['DH', 'AH', 'SIL', 'M', 'Y', 'UW', 'Z', 'IY', 'AH', 'M', 'SIL', 'HH', 'AY', 'ER', 'Z', 'SIL', 'M', 'Y', 'UW', 'Z', 'IH', 'SH', 'AH', 'N', 'Z', 'SIL', 'EH', 'V', 'ER', 'IY', 'SIL', 'IY', 'V', 'N', 'IH', 'NG', 'SIL']\n",
      "Target sentence\n",
      "The museum hires musicians every evening.\n",
      "\n",
      "Decoded phonemes:\n",
      "['W', 'EH', 'L', 'SIL', 'S', 'T', 'OW', 'V', 'SIL', 'V', 'ER', 'R', 'AA', 'B', 'SIL', 'P', 'AY', 'SIL', 'AE', 'F', 'T', 'ER', 'R', 'K', 'SH', 'AH', 'W', 'AH', 'L', 'SIL', 'L', 'AY', 'K', 'SIL', 'D', 'EH', 'Z', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['W', 'IY', 'L', 'SIL', 'S', 'ER', 'V', 'SIL', 'R', 'UW', 'B', 'AA', 'R', 'B', 'SIL', 'P', 'AY', 'SIL', 'AE', 'F', 'T', 'ER', 'SIL', 'R', 'EY', 'CH', 'AH', 'L', 'Z', 'SIL', 'T', 'AO', 'K', 'SIL']\n",
      "Target sentence\n",
      "We'll serve rhubarb pie after Rachel's talk.\n",
      "\n",
      "Decoded phonemes:\n",
      "['DH', 'EY', 'SIL', 'AH', 'N', 'JH', 'OY', 'D', 'SIL', 'IH', 'T', 'SIL', 'W', 'EH', 'N', 'SIL', 'AY', 'SIL', 'AH', 'D', 'IH', 'SH', 'AH', 'N', 'SIL', 'D', 'AH', 'SIL', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['DH', 'EY', 'SIL', 'EH', 'N', 'JH', 'OY', 'SIL', 'IH', 'T', 'SIL', 'W', 'EH', 'N', 'SIL', 'AY', 'SIL', 'AA', 'D', 'IH', 'SH', 'AH', 'N', 'SIL']\n",
      "Target sentence\n",
      "They enjoy it when I audition.\n",
      "\n",
      "Decoded phonemes:\n",
      "['DH', 'AH', 'SIL', 'AO', 'F', 'AH', 'K', 'OW', 'SIL', 'T', 'R', 'UW', 'D', 'SIL', 'HH', 'AE', 'F', 'SIL', 'AH', 'SIL', 'G', 'IH', 'F', 'SIL', 'SH', 'UW', 'T', 'SIL', 'AE', 'Z', 'SIL', 'Y', 'UW', 'SIL', 'K', 'OY', 'L', 'T', 'AH', 'T', 'SIL', 'W', 'EH', 'N', 'T', 'SIL', 'IH', 'T', 'SIL', 'IH', 'Z', 'SIL', 'T', 'R', 'AY', 'P', 'SIL', 'D', 'AH', 'SIL', 'D', 'IY', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['DH', 'AH', 'SIL', 'AE', 'V', 'AH', 'K', 'AA', 'D', 'OW', 'SIL', 'SH', 'UH', 'D', 'SIL', 'HH', 'AE', 'V', 'SIL', 'AH', 'SIL', 'G', 'IH', 'V', 'SIL', 'T', 'UW', 'SIL', 'IH', 'T', 'SIL', 'AE', 'Z', 'SIL', 'Y', 'UW', 'SIL', 'HH', 'OW', 'L', 'D', 'SIL', 'IH', 'T', 'SIL', 'W', 'EH', 'N', 'SIL', 'IH', 'T', 'SIL', 'IH', 'Z', 'SIL', 'R', 'AY', 'P', 'SIL']\n",
      "Target sentence\n",
      "The avocado should have a give to it, as you hold it, when it is ripe.\n",
      "\n",
      "Decoded phonemes:\n",
      "['EH', 'N', 'IY', 'SIL', 'P', 'AY', 'ER', 'Z', 'SIL', 'Y', 'UW', 'ZH', 'AH', 'W', 'AH', 'L', 'IY', 'SIL', 'L', 'IY', 'L', 'SIL', 'W', 'IH', 'L', 'SIL', 'Y', 'IY', 'Z', 'SIL', 'B', 'AY', 'SIL', 'K', 'AH', 'N', 'D', 'AH', 'K', 'IH', 'NG', 'SIL', 'V', 'EH', 'G', 'Y', 'AH', 'L', 'IY', 'SIL', 'IH', 'S', 'P', 'EH', 'K', 'SH', 'AH', 'N', 'SIL', 'AH', 'N', 'D', 'SIL', 'T', 'R', 'IY', 'M', 'AH', 'NG', 'SIL', 'D', 'EH', 'S', 'IY', 'D', 'IY', 'IH']\n",
      "Target phonemes:\n",
      "['EH', 'N', 'ER', 'JH', 'IY', 'SIL', 'S', 'AH', 'P', 'L', 'AY', 'ER', 'Z', 'SIL', 'Y', 'UW', 'ZH', 'AH', 'W', 'AH', 'L', 'IY', 'SIL', 'D', 'IY', 'L', 'SIL', 'W', 'IH', 'DH', 'SIL', 'DH', 'IH', 'S', 'SIL', 'B', 'AY', 'SIL', 'K', 'AH', 'N', 'D', 'AH', 'K', 'T', 'IH', 'NG', 'SIL', 'R', 'EH', 'G', 'Y', 'AH', 'L', 'ER', 'SIL', 'IH', 'N', 'S', 'P', 'EH', 'K', 'SH', 'AH', 'N', 'Z', 'SIL', 'AH', 'N', 'D', 'SIL', 'T', 'R', 'IH', 'M', 'IH', 'NG', 'SIL']\n",
      "Target sentence\n",
      "Energy suppliers usually deal with this by conducting regular inspections and trimming.\n",
      "\n",
      "Decoded phonemes:\n",
      "['DH', 'AH', 'SIL', 'S', 'AO', 'SIL', 'IH', 'Z', 'SIL', 'B', 'ER', 'K', 'IH', 'NG', 'SIL', 'S', 'OW', 'SIL', 'T', 'AA', 'P', 'SIL', 'DH', 'AH', 'SIL', 'F', 'UH', 'D', 'SIL', 'IH', 'N', 'S', 'T', 'EH', 'D', 'SIL', 'D', 'AH', 'Z', 'SIL', 'D', 'AH', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['DH', 'AH', 'SIL', 'S', 'AO', 'SIL', 'IH', 'Z', 'SIL', 'B', 'R', 'OW', 'K', 'AH', 'N', 'SIL', 'S', 'OW', 'SIL', 'CH', 'AA', 'P', 'SIL', 'DH', 'AH', 'SIL', 'W', 'UH', 'D', 'SIL', 'IH', 'N', 'S', 'T', 'EH', 'D', 'SIL']\n",
      "Target sentence\n",
      "The saw is broken, so chop the wood instead.\n",
      "\n",
      "Decoded phonemes:\n",
      "['DH', 'AH', 'SIL', 'K', 'L', 'EY', 'N', 'D', 'SIL', 'V', 'ER', 'ZH', 'AH', 'N', 'SIL', 'IH', 'Z', 'SIL', 'S', 'IY', 'V', 'AH', 'N', 'NG', 'SIL', 'B', 'L', 'SIL', 'D', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['DH', 'AH', 'SIL', 'K', 'L', 'IY', 'N', 'D', 'SIL', 'V', 'ER', 'ZH', 'AH', 'N', 'SIL', 'IH', 'Z', 'SIL', 'G', 'IH', 'V', 'AH', 'N', 'SIL', 'B', 'IH', 'L', 'OW', 'SIL']\n",
      "Target sentence\n",
      "The cleaned version is given below.\n",
      "\n",
      "Decoded phonemes:\n",
      "['DH', 'EY', 'SIL', 'S', 'IY', 'M', 'SIL', 'G', 'AA', 'N', 'T', 'SIL', 'P', 'N', 'D', 'ER', 'SIL', 'AH', 'V', 'SIL', 'IH', 'T', 'SIL', 'D', 'AH', 'S', 'SIL', 'D', 'IY', 'SIL', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['DH', 'EY', 'SIL', 'S', 'IY', 'M', 'SIL', 'D', 'AA', 'R', 'N', 'D', 'SIL', 'P', 'R', 'AW', 'D', 'SIL', 'AH', 'V', 'SIL', 'IH', 'T', 'SIL']\n",
      "Target sentence\n",
      "They seem darned proud of it.\n",
      "\n",
      "Decoded phonemes:\n",
      "['AH', 'SIL', 'SH', 'JH', 'AA', 'B', 'P', 'SIL', 'K', 'L', 'EH', 'M', 'ER', 'SIL', 'W', 'AA', 'Z', 'SIL', 'F', 'AH', 'L', 'AH', 'D', 'SIL', 'B', 'AY', 'SIL', 'AH', 'SIL', 'JH', 'ER', 'K', 'SIL', 'W', 'OW', 'L', 'SIL', 'D', 'AH', 'S', 'T', 'SIL', 'D', 'IY', 'SIL', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['AH', 'SIL', 'SH', 'AA', 'R', 'P', 'SIL', 'T', 'R', 'EH', 'M', 'ER', 'SIL', 'W', 'AA', 'Z', 'SIL', 'F', 'AA', 'L', 'OW', 'D', 'SIL', 'B', 'AY', 'SIL', 'AH', 'SIL', 'JH', 'ER', 'K', 'IY', 'SIL', 'R', 'OW', 'L', 'SIL']\n",
      "Target sentence\n",
      "A sharp tremor was followed by a jerky roll.\n",
      "\n",
      "Decoded phonemes:\n",
      "['B', 'OY', 'SIL', 'Y', 'UW', 'SIL', 'AE', 'N', 'T', 'SIL', 'W', 'UH', 'L', 'AH', 'N', 'IH', 'NG', 'SIL', 'N', 'EH', 'R', 'AH', 'B', 'AA', 'D', 'IY', 'SIL', 'B', 'IH', 'T', 'SIL', 'Y', 'ER', 'S', 'EH', 'L', 'F', 'SIL', 'D', 'AH', 'S', 'SIL', 'D', 'AH', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['B', 'OY', 'SIL', 'Y', 'UW', 'SIL', 'EY', 'N', 'T', 'SIL', 'F', 'UW', 'L', 'IH', 'NG', 'SIL', 'N', 'OW', 'B', 'AA', 'D', 'IY', 'SIL', 'B', 'AH', 'T', 'SIL', 'Y', 'ER', 'S', 'EH', 'L', 'F', 'SIL']\n",
      "Target sentence\n",
      "Boy, you ain't fooling nobody but yourself.\n",
      "\n",
      "Decoded phonemes:\n",
      "['T', 'EY', 'K', 'IY', 'SIL', 'D', 'AY', 'D', 'SIL', 'AA', 'R', 'SIL', 'IH', 'N', 'K', 'L', 'AH', 'T', 'AH', 'N', 'SIL', 'W', 'IH', 'DH', 'SIL', 'IH', 'CH', 'S', 'SIL', 'K', 'R', 'EH', 'K', 'ER', 'D', 'SIL', 'D', 'AH', 'T', 'SIL', 'D', 'AH', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['T', 'IY', 'CH', 'IH', 'NG', 'SIL', 'G', 'AY', 'D', 'Z', 'SIL', 'AA', 'R', 'SIL', 'IH', 'N', 'K', 'L', 'UW', 'D', 'AH', 'D', 'SIL', 'W', 'IH', 'DH', 'SIL', 'IY', 'CH', 'SIL', 'R', 'EH', 'K', 'ER', 'D', 'SIL']\n",
      "Target sentence\n",
      "Teaching guides are included with each record.\n",
      "\n",
      "Decoded phonemes:\n",
      "['DH', 'AH', 'SIL', 'M', 'EY', 'N', 'Z', 'SIL', 'AY', 'L', 'IY', 'S', 'SIL', 'F', 'L', 'AH', 'T', 'ER', 'D', 'SIL', 'D', 'AH', 'SIL', 'D', 'AH', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['DH', 'AH', 'SIL', 'M', 'AE', 'N', 'Z', 'SIL', 'AY', 'L', 'IH', 'D', 'Z', 'SIL', 'F', 'L', 'AH', 'T', 'ER', 'D', 'SIL']\n",
      "Target sentence\n",
      "The man's eyelids fluttered.\n",
      "\n",
      "Decoded phonemes:\n",
      "['DH', 'IH', 'S', 'SIL', 'K', 'IH', 'D', 'Z', 'SIL', 'F', 'OW', 'Z', 'SIL', 'B', 'AE', 'D', 'SIL', 'D', 'AH', 'SIL', 'D', 'AH', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['DH', 'IH', 'S', 'SIL', 'K', 'IH', 'D', 'Z', 'SIL', 'F', 'R', 'OW', 'Z', 'SIL', 'B', 'AE', 'D', 'SIL']\n",
      "Target sentence\n",
      "This kid's froze bad.\n",
      "\n",
      "Decoded phonemes:\n",
      "['SH', 'IY', 'SIL', 'R', 'AY', 'AH', 'T', 'IY', 'SIL', 'M', 'OW', 'M', 'TH', 'SIL', 'AH', 'N', 'D', 'SIL', 'G', 'UH', 'D', 'T', 'SIL', 'F', 'AE', 'L', 'SH', 'IH', 'P', 'SIL', 'D', 'AH', 'S', 'T', 'SIL', 'D', 'IY', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['SH', 'IY', 'SIL', 'R', 'EY', 'D', 'IY', 'EY', 'T', 'AH', 'D', 'SIL', 'W', 'AO', 'R', 'M', 'TH', 'SIL', 'AH', 'N', 'D', 'SIL', 'G', 'UH', 'D', 'SIL', 'F', 'EH', 'L', 'OW', 'SH', 'IH', 'P', 'SIL']\n",
      "Target sentence\n",
      "She radiated warmth and good fellowship.\n",
      "\n",
      "Decoded phonemes:\n",
      "['D', 'UW', 'SIL', 'Y', 'UW', 'SIL', 'N', 'OW', 'SIL', 'W', 'EH', 'R', 'SIL', 'IH', 'T', 'SIL', 'M', 'AY', 'T', 'SIL', 'HH', 'AE', 'V', 'SIL', 'G', 'AO', 'N', 'SIL', 'D', 'AH', 'S', 'T', 'D', 'AH', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['D', 'UW', 'SIL', 'Y', 'UW', 'SIL', 'N', 'OW', 'SIL', 'W', 'EH', 'R', 'SIL', 'IH', 'T', 'SIL', 'M', 'AY', 'T', 'SIL', 'HH', 'AE', 'V', 'SIL', 'G', 'AO', 'N', 'SIL']\n",
      "Target sentence\n",
      "Do you know where it might have gone?\n",
      "\n",
      "Decoded phonemes:\n",
      "['IH', 'N', 'SIL', 'DH', 'AH', 'SIL', 'P', 'L', 'EY', 'S', 'SIL', 'F', 'AO', 'R', 'SIL', 'DH', 'EH', 'M', 'SIL', 'HH', 'IH', 'Z', 'SIL', 'K', 'AH', 'N', 'T', 'AH', 'L', 'IY', 'S', 'SIL', 'W', 'ER', 'SIL', 'G', 'AO', 'N', 'SIL', 'D', 'AH', 'S', 'T', 'SIL', 'D', 'AH', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['IH', 'N', 'SIL', 'DH', 'AH', 'SIL', 'P', 'IH', 'T', 'IY', 'SIL', 'F', 'AO', 'R', 'SIL', 'DH', 'EH', 'M', 'SIL', 'HH', 'IH', 'Z', 'SIL', 'L', 'OW', 'N', 'L', 'IY', 'N', 'AH', 'S', 'SIL', 'W', 'AA', 'Z', 'SIL', 'G', 'AO', 'N', 'SIL']\n",
      "Target sentence\n",
      "In the pity for them his loneliness was gone.\n",
      "\n",
      "Decoded phonemes:\n",
      "['JH', 'OY', 'N', 'SIL', 'AH', 'S', 'SIL', 'AA', 'N', 'SIL', 'S', 'T', 'R', 'EH', 'T', 'ER', 'SIL', 'AH', 'N', 'D', 'SIL', 'F', 'EY', 'S', 'B', 'UH', 'K', 'SIL', 'D', 'AH', 'D', 'AH', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['JH', 'OY', 'N', 'SIL', 'AH', 'S', 'SIL', 'AA', 'N', 'SIL', 'T', 'W', 'IH', 'T', 'ER', 'SIL', 'AH', 'N', 'D', 'SIL', 'F', 'EY', 'S', 'B', 'UH', 'K', 'SIL']\n",
      "Target sentence\n",
      "Join us on Twitter and Facebook\n",
      "\n",
      "Decoded phonemes:\n",
      "['HH', 'IY', 'SIL', 'S', 'EH', 'D', 'SIL', 'EY', 'L', 'SIL', 'B', 'IY', 'SIL', 'W', 'ER', 'K', 'IH', 'K', 'NG', 'SIL', 'S', 'T', 'AO', 'T', 'AH', 'D', 'SIL', 'AH', 'SIL', 'D', 'IH', 'S', 'IH', 'ZH', 'AH', 'N', 'SIL', 'B', 'AH', 'T', 'SIL', 'D', 'AH', 'SIL', 'D', 'IY', 'D', 'IY']\n",
      "Target phonemes:\n",
      "['HH', 'IY', 'SIL', 'S', 'EH', 'D', 'SIL', 'DH', 'EY', 'L', 'SIL', 'B', 'IY', 'SIL', 'W', 'ER', 'K', 'IH', 'NG', 'SIL', 'T', 'AH', 'W', 'AO', 'R', 'D', 'SIL', 'AH', 'SIL', 'D', 'IH', 'S', 'IH', 'ZH', 'AH', 'N', 'SIL']\n",
      "Target sentence\n",
      "He said they'll be working toward a decision.\n",
      "\n"
     ]
    }
   ],
   "source": [
    "idx = 0\n",
    "\n",
    "for idx in range(50):\n",
    "\n",
    "    print(\"Decoded phonemes:\")\n",
    "    print(idsToPhonemes(pred_phonemes[idx]))\n",
    "\n",
    "    #print the true phonemes\n",
    "    print(\"Target phonemes:\")\n",
    "    print(idsToPhonemes(all_true_phonemes[idx]))\n",
    "\n",
    "    print(\"Target sentence\")\n",
    "    #print the true sentence\n",
    "    print(all_true_texts[idx])\n",
    "    print()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "f68ecedf",
   "metadata": {},
   "outputs": [],
   "source": [
    "results_dir = f\"results/{output_name}/\"\n",
    "os.makedirs(results_dir, exist_ok=True)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "1bdec729",
   "metadata": {},
   "outputs": [],
   "source": [
    "#create a dataframe with the results\n",
    "df = pd.DataFrame({\n",
    "    'True Phonemes': [idsToPhonemes(p) for p in true_phonemes],\n",
    "    'Predicted Phonemes': [idsToPhonemes(p) for p in pred_phonemes],\n",
    "    'True Sentence': all_true_texts,\n",
    "    'Day Index': day_indices_flat,\n",
    "    'CER': cer_list\n",
    "})\n",
    "\n",
    "#save it \n",
    "df.to_csv(os.path.join(results_dir, \"results.csv\"), index=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "3ffba35f",
   "metadata": {},
   "outputs": [],
   "source": [
    "#create a dataframe with all the metrics\n",
    "df_metrics = pd.DataFrame({\n",
    "    'Overall Accuracy': [overall_acc],\n",
    "    'Range of Accuracy per day': f\"{[min(day_accs), max(day_accs)]}\",\n",
    "    'Range of CER per day': f\"{[min(cer_list_per_day), max(cer_list_per_day)]}\",\n",
    "    'Average length diff': f\"{[np.mean(diffs), np.std(diffs)]}\",\n",
    "    'Range of length diff per day': f\"{[min(diffs_per_day), max(diffs_per_day)]}\"\n",
    "})\n",
    "df_metrics.to_csv(os.path.join(results_dir,\"metrics.csv\"), index=False)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "evo",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.18"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
