{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "29f140a5",
   "metadata": {},
   "outputs": [],
   "source": [
    "import hapi\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "import os\n",
    "\n",
    "hapi_data_dir_path = \"../data\"\n",
    "hapi.config.data_dir = hapi_data_dir_path\n",
    "pd.set_option(\"display.max_columns\", 50)\n",
    "pd.options.mode.chained_assignment = None  # default='warn'\n",
    "if not os.path.exists(os.path.join(hapi_data_dir_path, \"tasks\")):\n",
    "    hapi.download()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "96733f81",
   "metadata": {},
   "source": [
    "## Missing Face++ predictions on AFNET dataset for 2022\n",
    "We've noticed that there don't seem to be Face++ predictions on AFNET for 2022, even though these are included in the HAPI paper. As a result, we use 2021 data for analyses that only examine a single year."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "0edda664",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'fer', 'ner', 'mic', 'sa', 'str', 'scr'}\n",
      "Datasets: {'ferplus', 'rafdb', 'afnet', 'expw'} \n",
      "\n",
      "APIs: {'microsoft_fer', 'google_fer', 'facepp_fer', 'vgg19_fer'} \n",
      "\n"
     ]
    }
   ],
   "source": [
    "df = hapi.summary()\n",
    "\n",
    "print(set(df[\"task\"]))\n",
    "\n",
    "TASK = \"fer\"\n",
    "df = df[df[\"task\"] == TASK]\n",
    "\n",
    "print(\"Datasets:\", set(df[\"dataset\"]), \"\\n\")\n",
    "print(\"APIs:\", set(df[\"api\"]), \"\\n\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "e4c02645",
   "metadata": {},
   "outputs": [],
   "source": [
    "DATASET = \"afnet\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "6bd07071",
   "metadata": {},
   "outputs": [],
   "source": [
    "def generate_prediction_df(task, dataset):\n",
    "    hapi_labels = hapi.get_labels(task=task, dataset=dataset)\n",
    "    hapi_label_dict = {\n",
    "        k[\"example_id\"]: k[\"true_label\"]\n",
    "        for k in hapi_labels[list(hapi_labels.keys())[0]]\n",
    "    }\n",
    "\n",
    "    df_preds = []\n",
    "\n",
    "    res = hapi.get_predictions(task=TASK, dataset=DATASET)\n",
    "    print(res.keys())\n",
    "    for k in res:  # k encodes api provider, date of queries, and dataset queried on\n",
    "        curr_df = pd.DataFrame(res[k])\n",
    "        curr_df[\"api\"] = k\n",
    "        df_preds.append(curr_df)\n",
    "\n",
    "    df_preds = pd.concat(df_preds)\n",
    "    df_preds[\"gt_label\"] = df_preds.apply(\n",
    "        lambda x: hapi_label_dict[x[\"example_id\"]], axis=1\n",
    "    )\n",
    "    df_preds[\"is_correct\"] = df_preds.apply(\n",
    "        lambda x: x[\"predicted_label\"] == x[\"gt_label\"], axis=1\n",
    "    )\n",
    "    df_preds[\"date\"] = df_preds.apply(lambda x: x[\"api\"].split(\"/\")[-1], axis=1)\n",
    "    df_preds[\"year\"] = df_preds.apply(lambda x: x[\"date\"].split(\"-\")[0], axis=1)\n",
    "    df_preds[\"api\"] = df_preds.apply(lambda x: x[\"api\"].split(\"/\")[-2], axis=1)\n",
    "    return df_preds"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "cfa9098b",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "10336d1dc3ff48d6bbb827f76e2b5845",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "  0%|          | 0/1 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "08937bb44d4a477c95a57450f3b4e4c1",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "  0%|          | 0/9 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "dict_keys(['fer/afnet/microsoft_fer/22-05-23', 'fer/afnet/google_fer/22-05-23', 'fer/afnet/facepp_fer/20-03-05', 'fer/afnet/google_fer/20-03-05', 'fer/afnet/vgg19_fer/20-03-05', 'fer/afnet/microsoft_fer/20-03-05', 'fer/afnet/facepp_fer/21-02-17', 'fer/afnet/microsoft_fer/21-02-17', 'fer/afnet/google_fer/21-02-17'])\n"
     ]
    }
   ],
   "source": [
    "df_preds = generate_prediction_df(TASK, DATASET)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "8cceeb3e",
   "metadata": {},
   "source": [
    "### Lack of instances for (faceapp_fer, 22)\n",
    "Note below that we don't see any rows for faceapp_fer in 2022."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "id": "3d53ed53",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>api</th>\n",
       "      <th>year</th>\n",
       "      <th>is_correct</th>\n",
       "      <th>is_wrong</th>\n",
       "      <th>num_rows</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>facepp_fer</td>\n",
       "      <td>20</td>\n",
       "      <td>0.640662</td>\n",
       "      <td>0.359338</td>\n",
       "      <td>287401</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>facepp_fer</td>\n",
       "      <td>21</td>\n",
       "      <td>0.640690</td>\n",
       "      <td>0.359310</td>\n",
       "      <td>287401</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>google_fer</td>\n",
       "      <td>20</td>\n",
       "      <td>0.682565</td>\n",
       "      <td>0.317435</td>\n",
       "      <td>287401</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>google_fer</td>\n",
       "      <td>21</td>\n",
       "      <td>0.682625</td>\n",
       "      <td>0.317375</td>\n",
       "      <td>287401</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>google_fer</td>\n",
       "      <td>22</td>\n",
       "      <td>0.682635</td>\n",
       "      <td>0.317365</td>\n",
       "      <td>287401</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>microsoft_fer</td>\n",
       "      <td>20</td>\n",
       "      <td>0.722997</td>\n",
       "      <td>0.277003</td>\n",
       "      <td>287401</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>microsoft_fer</td>\n",
       "      <td>21</td>\n",
       "      <td>0.723108</td>\n",
       "      <td>0.276892</td>\n",
       "      <td>287401</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>microsoft_fer</td>\n",
       "      <td>22</td>\n",
       "      <td>0.723108</td>\n",
       "      <td>0.276892</td>\n",
       "      <td>287401</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>vgg19_fer</td>\n",
       "      <td>20</td>\n",
       "      <td>0.638613</td>\n",
       "      <td>0.361387</td>\n",
       "      <td>287401</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "             api year  is_correct  is_wrong  num_rows\n",
       "0     facepp_fer   20    0.640662  0.359338    287401\n",
       "1     facepp_fer   21    0.640690  0.359310    287401\n",
       "2     google_fer   20    0.682565  0.317435    287401\n",
       "3     google_fer   21    0.682625  0.317375    287401\n",
       "4     google_fer   22    0.682635  0.317365    287401\n",
       "5  microsoft_fer   20    0.722997  0.277003    287401\n",
       "6  microsoft_fer   21    0.723108  0.276892    287401\n",
       "7  microsoft_fer   22    0.723108  0.276892    287401\n",
       "8      vgg19_fer   20    0.638613  0.361387    287401"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "df_preds_api_acc = (\n",
    "    df_preds.groupby([\"api\", \"year\"], as_index=False)\n",
    "    .agg({\"is_correct\": np.mean})\n",
    "    .sort_values(by=[\"api\", \"year\"])\n",
    ")\n",
    "df_preds_api_acc[\"is_wrong\"] = 1 - df_preds_api_acc[\"is_correct\"]\n",
    "\n",
    "df_preds_api_count = df_preds.groupby([\"api\", \"year\"], as_index=False).count()\n",
    "\n",
    "df_preds_api_acc[\"num_rows\"] = df_preds_api_count[\"example_id\"]\n",
    "display(df_preds_api_acc)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "c6a581e5",
   "metadata": {},
   "source": [
    "## Non unique IDs on CMD dataset\n",
    "On the command dataset, we've noticed that many example_ids have multiple predictions in the same year from the same API. For example, \"COMMAND_00176480_nohash_0.wav\" has 6 predictions from google in the year 2020. Each row has a different prediction from the google api. We didn't know how to calculate ecosystem-level outcomes in this case since it would appear that the same input has different outcomes. As such, we exclude this dataset from our analysis."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "id": "5eb16e73",
   "metadata": {},
   "outputs": [],
   "source": [
    "TASK = \"scr\"\n",
    "DATASET = \"command\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "id": "f2c1f1b8",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "14cd58be34d84974ac9054c18fab5812",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "  0%|          | 0/1 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "aa3994dd39be4be78fb5150bb671e358",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "  0%|          | 0/10 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "dict_keys(['scr/command/google_scr/20-03-29', 'scr/command/microsoft_scr/20-03-29', 'scr/command/ibm_scr/20-03-29', 'scr/command/deepspeech_lib_scr/20-03-29', 'scr/command/microsoft_scr/22-05-23', 'scr/command/google_scr/22-05-23', 'scr/command/ibm_scr/22-05-23', 'scr/command/microsoft_scr/21-04-14', 'scr/command/google_scr/21-04-14', 'scr/command/ibm_scr/21-04-14'])\n"
     ]
    }
   ],
   "source": [
    "df_preds = generate_prediction_df(TASK, DATASET)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "id": "f011b628",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>confidence</th>\n",
       "      <th>predicted_label</th>\n",
       "      <th>gt_label</th>\n",
       "      <th>is_correct</th>\n",
       "      <th>date</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>example_id</th>\n",
       "      <th>year</th>\n",
       "      <th>api</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">COMMAND_00176480_nohash_0.wav</th>\n",
       "      <th rowspan=\"4\" valign=\"top\">20</th>\n",
       "      <th>deepspeech_lib_scr</th>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>google_scr</th>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ibm_scr</th>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>microsoft_scr</th>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <th>google_scr</th>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <th>...</th>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">COMMAND_fffcabd1_nohash_2.wav</th>\n",
       "      <th rowspan=\"2\" valign=\"top\">21</th>\n",
       "      <th>ibm_scr</th>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>microsoft_scr</th>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"3\" valign=\"top\">22</th>\n",
       "      <th>google_scr</th>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ibm_scr</th>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>microsoft_scr</th>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>53080 rows × 5 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                       confidence  \\\n",
       "example_id                    year api                              \n",
       "COMMAND_00176480_nohash_0.wav 20   deepspeech_lib_scr           6   \n",
       "                                   google_scr                   6   \n",
       "                                   ibm_scr                      6   \n",
       "                                   microsoft_scr                6   \n",
       "                              21   google_scr                   6   \n",
       "...                                                           ...   \n",
       "COMMAND_fffcabd1_nohash_2.wav 21   ibm_scr                      2   \n",
       "                                   microsoft_scr                2   \n",
       "                              22   google_scr                   2   \n",
       "                                   ibm_scr                      2   \n",
       "                                   microsoft_scr                2   \n",
       "\n",
       "                                                       predicted_label  \\\n",
       "example_id                    year api                                   \n",
       "COMMAND_00176480_nohash_0.wav 20   deepspeech_lib_scr                6   \n",
       "                                   google_scr                        6   \n",
       "                                   ibm_scr                           6   \n",
       "                                   microsoft_scr                     6   \n",
       "                              21   google_scr                        6   \n",
       "...                                                                ...   \n",
       "COMMAND_fffcabd1_nohash_2.wav 21   ibm_scr                           2   \n",
       "                                   microsoft_scr                     2   \n",
       "                              22   google_scr                        2   \n",
       "                                   ibm_scr                           2   \n",
       "                                   microsoft_scr                     2   \n",
       "\n",
       "                                                       gt_label  is_correct  \\\n",
       "example_id                    year api                                        \n",
       "COMMAND_00176480_nohash_0.wav 20   deepspeech_lib_scr         6           6   \n",
       "                                   google_scr                 6           6   \n",
       "                                   ibm_scr                    6           6   \n",
       "                                   microsoft_scr              6           6   \n",
       "                              21   google_scr                 6           6   \n",
       "...                                                         ...         ...   \n",
       "COMMAND_fffcabd1_nohash_2.wav 21   ibm_scr                    2           2   \n",
       "                                   microsoft_scr              2           2   \n",
       "                              22   google_scr                 2           2   \n",
       "                                   ibm_scr                    2           2   \n",
       "                                   microsoft_scr              2           2   \n",
       "\n",
       "                                                       date  \n",
       "example_id                    year api                       \n",
       "COMMAND_00176480_nohash_0.wav 20   deepspeech_lib_scr     6  \n",
       "                                   google_scr             6  \n",
       "                                   ibm_scr                6  \n",
       "                                   microsoft_scr          6  \n",
       "                              21   google_scr             6  \n",
       "...                                                     ...  \n",
       "COMMAND_fffcabd1_nohash_2.wav 21   ibm_scr                2  \n",
       "                                   microsoft_scr          2  \n",
       "                              22   google_scr             2  \n",
       "                                   ibm_scr                2  \n",
       "                                   microsoft_scr          2  \n",
       "\n",
       "[53080 rows x 5 columns]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "count_unique = df_preds.groupby([\"example_id\", \"year\", \"api\"]).count()\n",
    "display(count_unique[count_unique[\"predicted_label\"] > 1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "id": "339490f1",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>confidence</th>\n",
       "      <th>predicted_label</th>\n",
       "      <th>example_id</th>\n",
       "      <th>api</th>\n",
       "      <th>gt_label</th>\n",
       "      <th>is_correct</th>\n",
       "      <th>date</th>\n",
       "      <th>year</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>2376</th>\n",
       "      <td>0.824559</td>\n",
       "      <td>1</td>\n",
       "      <td>COMMAND_00176480_nohash_0.wav</td>\n",
       "      <td>google_scr</td>\n",
       "      <td>21</td>\n",
       "      <td>False</td>\n",
       "      <td>20-03-29</td>\n",
       "      <td>20</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4746</th>\n",
       "      <td>0.773346</td>\n",
       "      <td>10</td>\n",
       "      <td>COMMAND_00176480_nohash_0.wav</td>\n",
       "      <td>google_scr</td>\n",
       "      <td>21</td>\n",
       "      <td>False</td>\n",
       "      <td>20-03-29</td>\n",
       "      <td>20</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11669</th>\n",
       "      <td>0.912839</td>\n",
       "      <td>14</td>\n",
       "      <td>COMMAND_00176480_nohash_0.wav</td>\n",
       "      <td>google_scr</td>\n",
       "      <td>21</td>\n",
       "      <td>False</td>\n",
       "      <td>20-03-29</td>\n",
       "      <td>20</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19892</th>\n",
       "      <td>0.749404</td>\n",
       "      <td>27</td>\n",
       "      <td>COMMAND_00176480_nohash_0.wav</td>\n",
       "      <td>google_scr</td>\n",
       "      <td>21</td>\n",
       "      <td>False</td>\n",
       "      <td>20-03-29</td>\n",
       "      <td>20</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22245</th>\n",
       "      <td>0.912839</td>\n",
       "      <td>19</td>\n",
       "      <td>COMMAND_00176480_nohash_0.wav</td>\n",
       "      <td>google_scr</td>\n",
       "      <td>21</td>\n",
       "      <td>False</td>\n",
       "      <td>20-03-29</td>\n",
       "      <td>20</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28739</th>\n",
       "      <td>0.579967</td>\n",
       "      <td>28</td>\n",
       "      <td>COMMAND_00176480_nohash_0.wav</td>\n",
       "      <td>google_scr</td>\n",
       "      <td>21</td>\n",
       "      <td>False</td>\n",
       "      <td>20-03-29</td>\n",
       "      <td>20</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "       confidence  predicted_label                     example_id         api  \\\n",
       "2376     0.824559                1  COMMAND_00176480_nohash_0.wav  google_scr   \n",
       "4746     0.773346               10  COMMAND_00176480_nohash_0.wav  google_scr   \n",
       "11669    0.912839               14  COMMAND_00176480_nohash_0.wav  google_scr   \n",
       "19892    0.749404               27  COMMAND_00176480_nohash_0.wav  google_scr   \n",
       "22245    0.912839               19  COMMAND_00176480_nohash_0.wav  google_scr   \n",
       "28739    0.579967               28  COMMAND_00176480_nohash_0.wav  google_scr   \n",
       "\n",
       "       gt_label  is_correct      date year  \n",
       "2376         21       False  20-03-29   20  \n",
       "4746         21       False  20-03-29   20  \n",
       "11669        21       False  20-03-29   20  \n",
       "19892        21       False  20-03-29   20  \n",
       "22245        21       False  20-03-29   20  \n",
       "28739        21       False  20-03-29   20  "
      ]
     },
     "execution_count": 34,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_preds[\n",
    "    (df_preds[\"example_id\"] == \"COMMAND_00176480_nohash_0.wav\")\n",
    "    & (df_preds[\"api\"] == \"google_scr\")\n",
    "    & (df_preds[\"year\"] == \"20\")\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "675cc8c4",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e79885c1",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python [conda env:homog]",
   "language": "python",
   "name": "conda-env-homog-py"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.9"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
