{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "da0e66aa-7526-4e7a-bfac-ea4d74afc962",
   "metadata": {},
   "source": [
    "Binarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N').\n",
    "\n",
    "\n",
    "This S dump contains 22 data sets from the book Visualizing Data published by Hobart Press (books@hobart.com). The dump was created by data.dump() and can be read back into S by data.restore(). The name of each S data set is the name of the data set used in the book. To find the description of the data set in the book look under the entry - data, name - in the index. For example, one data set is barley. To find the description of barley, look in the index under the entry - data, barley.\n",
    "\n",
    "File: ../data/visualizing/hamster.csv\n",
    "\n",
    "Information about the dataset CLASSTYPE: numeric CLASSINDEX: none specific"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "0235adab-7d84-459c-a813-9564d1adf220",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import openml\n",
    "import numpy as np\n",
    "import scipy\n",
    "from sklearn.model_selection import train_test_split\n",
    "from collections import defaultdict\n",
    "from prompting import Prompting, compute_error_rate\n",
    "import tqdm\n",
    "from num2words import num2words\n",
    "from sklearn.ensemble import AdaBoostClassifier\n",
    "\n",
    "from sklearn.cluster import AgglomerativeClustering\n",
    "# normalize the embeddings to unit length\n",
    "from sklearn.metrics.pairwise import cosine_similarity\n",
    "\n",
    "from pathlib import Path\n",
    "import matplotlib.pyplot as plt\n",
    "import pickle\n",
    "import pdb\n",
    "import torch\n",
    "import math\n",
    "from tenacity import *\n",
    "from itertools import permutations\n",
    "\n",
    "import seaborn as sns\n",
    "import numpy as np\n",
    "sns.set_style(\"whitegrid\")\n",
    "\n",
    "import sys\n",
    "sys.path.insert(0, '/Users/hariharan/hari_works/prompting-tabular-data')\n",
    "from summarizer_utils import train_model, batch_predict, sample, normalize\n",
    "from xgboost_utils import xgboost_benchmark\n",
    "\n",
    "import openai\n",
    "import os\n",
    "openai.api_key = os.getenv(\"OPENAI_API_KEY\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "e64c12be-5756-41b4-9a3f-b2fa47d6e63a",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>lung</th>\n",
       "      <th>heart</th>\n",
       "      <th>liver</th>\n",
       "      <th>spleen</th>\n",
       "      <th>kidney</th>\n",
       "      <th>binaryClass</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0.969500</td>\n",
       "      <td>1.352002</td>\n",
       "      <td>8.185496</td>\n",
       "      <td>0.2255</td>\n",
       "      <td>1.348003</td>\n",
       "      <td>P</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1.141003</td>\n",
       "      <td>1.499403</td>\n",
       "      <td>8.544507</td>\n",
       "      <td>0.2705</td>\n",
       "      <td>1.322103</td>\n",
       "      <td>P</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.872000</td>\n",
       "      <td>1.268503</td>\n",
       "      <td>6.823009</td>\n",
       "      <td>0.0500</td>\n",
       "      <td>0.897001</td>\n",
       "      <td>N</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.739900</td>\n",
       "      <td>1.270203</td>\n",
       "      <td>9.067509</td>\n",
       "      <td>0.1130</td>\n",
       "      <td>1.278003</td>\n",
       "      <td>P</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1.139302</td>\n",
       "      <td>1.496203</td>\n",
       "      <td>9.621993</td>\n",
       "      <td>0.1198</td>\n",
       "      <td>1.415003</td>\n",
       "      <td>N</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>68</th>\n",
       "      <td>0.723700</td>\n",
       "      <td>0.939400</td>\n",
       "      <td>2.631203</td>\n",
       "      <td>0.0421</td>\n",
       "      <td>1.030402</td>\n",
       "      <td>P</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>69</th>\n",
       "      <td>0.838500</td>\n",
       "      <td>1.301503</td>\n",
       "      <td>8.527997</td>\n",
       "      <td>0.0664</td>\n",
       "      <td>1.369103</td>\n",
       "      <td>P</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>70</th>\n",
       "      <td>1.066703</td>\n",
       "      <td>1.035703</td>\n",
       "      <td>8.859700</td>\n",
       "      <td>0.1019</td>\n",
       "      <td>1.369603</td>\n",
       "      <td>P</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>71</th>\n",
       "      <td>0.975000</td>\n",
       "      <td>1.046203</td>\n",
       "      <td>7.803905</td>\n",
       "      <td>0.0568</td>\n",
       "      <td>1.144302</td>\n",
       "      <td>P</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>72</th>\n",
       "      <td>1.005203</td>\n",
       "      <td>1.015003</td>\n",
       "      <td>5.739195</td>\n",
       "      <td>0.0950</td>\n",
       "      <td>0.896800</td>\n",
       "      <td>P</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>73 rows × 6 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "        lung     heart     liver  spleen    kidney binaryClass\n",
       "0   0.969500  1.352002  8.185496  0.2255  1.348003           P\n",
       "1   1.141003  1.499403  8.544507  0.2705  1.322103           P\n",
       "2   0.872000  1.268503  6.823009  0.0500  0.897001           N\n",
       "3   0.739900  1.270203  9.067509  0.1130  1.278003           P\n",
       "4   1.139302  1.496203  9.621993  0.1198  1.415003           N\n",
       "..       ...       ...       ...     ...       ...         ...\n",
       "68  0.723700  0.939400  2.631203  0.0421  1.030402           P\n",
       "69  0.838500  1.301503  8.527997  0.0664  1.369103           P\n",
       "70  1.066703  1.035703  8.859700  0.1019  1.369603           P\n",
       "71  0.975000  1.046203  7.803905  0.0568  1.144302           P\n",
       "72  1.005203  1.015003  5.739195  0.0950  0.896800           P\n",
       "\n",
       "[73 rows x 6 columns]"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Get dataset by name\n",
    "dataset = openml.datasets.get_dataset(893)\n",
    "# Get the data itself as a dataframe (or otherwise)\n",
    "df, y, _, _ = dataset.get_data(dataset_format=\"dataframe\")\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "9f8856f5-056c-4d16-991d-991ed2e22205",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>lung</th>\n",
       "      <th>heart</th>\n",
       "      <th>liver</th>\n",
       "      <th>spleen</th>\n",
       "      <th>kidney</th>\n",
       "      <th>result of testing the hamster</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0.969500</td>\n",
       "      <td>1.352002</td>\n",
       "      <td>8.185496</td>\n",
       "      <td>0.2255</td>\n",
       "      <td>1.348003</td>\n",
       "      <td>P</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1.141003</td>\n",
       "      <td>1.499403</td>\n",
       "      <td>8.544507</td>\n",
       "      <td>0.2705</td>\n",
       "      <td>1.322103</td>\n",
       "      <td>P</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.872000</td>\n",
       "      <td>1.268503</td>\n",
       "      <td>6.823009</td>\n",
       "      <td>0.0500</td>\n",
       "      <td>0.897001</td>\n",
       "      <td>N</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.739900</td>\n",
       "      <td>1.270203</td>\n",
       "      <td>9.067509</td>\n",
       "      <td>0.1130</td>\n",
       "      <td>1.278003</td>\n",
       "      <td>P</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1.139302</td>\n",
       "      <td>1.496203</td>\n",
       "      <td>9.621993</td>\n",
       "      <td>0.1198</td>\n",
       "      <td>1.415003</td>\n",
       "      <td>N</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>68</th>\n",
       "      <td>0.723700</td>\n",
       "      <td>0.939400</td>\n",
       "      <td>2.631203</td>\n",
       "      <td>0.0421</td>\n",
       "      <td>1.030402</td>\n",
       "      <td>P</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>69</th>\n",
       "      <td>0.838500</td>\n",
       "      <td>1.301503</td>\n",
       "      <td>8.527997</td>\n",
       "      <td>0.0664</td>\n",
       "      <td>1.369103</td>\n",
       "      <td>P</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>70</th>\n",
       "      <td>1.066703</td>\n",
       "      <td>1.035703</td>\n",
       "      <td>8.859700</td>\n",
       "      <td>0.1019</td>\n",
       "      <td>1.369603</td>\n",
       "      <td>P</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>71</th>\n",
       "      <td>0.975000</td>\n",
       "      <td>1.046203</td>\n",
       "      <td>7.803905</td>\n",
       "      <td>0.0568</td>\n",
       "      <td>1.144302</td>\n",
       "      <td>P</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>72</th>\n",
       "      <td>1.005203</td>\n",
       "      <td>1.015003</td>\n",
       "      <td>5.739195</td>\n",
       "      <td>0.0950</td>\n",
       "      <td>0.896800</td>\n",
       "      <td>P</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>73 rows × 6 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "        lung     heart     liver  spleen    kidney  \\\n",
       "0   0.969500  1.352002  8.185496  0.2255  1.348003   \n",
       "1   1.141003  1.499403  8.544507  0.2705  1.322103   \n",
       "2   0.872000  1.268503  6.823009  0.0500  0.897001   \n",
       "3   0.739900  1.270203  9.067509  0.1130  1.278003   \n",
       "4   1.139302  1.496203  9.621993  0.1198  1.415003   \n",
       "..       ...       ...       ...     ...       ...   \n",
       "68  0.723700  0.939400  2.631203  0.0421  1.030402   \n",
       "69  0.838500  1.301503  8.527997  0.0664  1.369103   \n",
       "70  1.066703  1.035703  8.859700  0.1019  1.369603   \n",
       "71  0.975000  1.046203  7.803905  0.0568  1.144302   \n",
       "72  1.005203  1.015003  5.739195  0.0950  0.896800   \n",
       "\n",
       "   result of testing the hamster  \n",
       "0                              P  \n",
       "1                              P  \n",
       "2                              N  \n",
       "3                              P  \n",
       "4                              N  \n",
       "..                           ...  \n",
       "68                             P  \n",
       "69                             P  \n",
       "70                             P  \n",
       "71                             P  \n",
       "72                             P  \n",
       "\n",
       "[73 rows x 6 columns]"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df = df.rename(columns = {\n",
    "    'binaryClass': 'result of testing the hamster'\n",
    "})\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "dc071ed7-86c5-4c1b-b843-5c9388ea0c53",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>lung</th>\n",
       "      <th>heart</th>\n",
       "      <th>liver</th>\n",
       "      <th>spleen</th>\n",
       "      <th>kidney</th>\n",
       "      <th>result of testing the hamster</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0.969500</td>\n",
       "      <td>1.352002</td>\n",
       "      <td>8.185496</td>\n",
       "      <td>0.2255</td>\n",
       "      <td>1.348003</td>\n",
       "      <td>positive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1.141003</td>\n",
       "      <td>1.499403</td>\n",
       "      <td>8.544507</td>\n",
       "      <td>0.2705</td>\n",
       "      <td>1.322103</td>\n",
       "      <td>positive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.872000</td>\n",
       "      <td>1.268503</td>\n",
       "      <td>6.823009</td>\n",
       "      <td>0.0500</td>\n",
       "      <td>0.897001</td>\n",
       "      <td>negative</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.739900</td>\n",
       "      <td>1.270203</td>\n",
       "      <td>9.067509</td>\n",
       "      <td>0.1130</td>\n",
       "      <td>1.278003</td>\n",
       "      <td>positive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1.139302</td>\n",
       "      <td>1.496203</td>\n",
       "      <td>9.621993</td>\n",
       "      <td>0.1198</td>\n",
       "      <td>1.415003</td>\n",
       "      <td>negative</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>68</th>\n",
       "      <td>0.723700</td>\n",
       "      <td>0.939400</td>\n",
       "      <td>2.631203</td>\n",
       "      <td>0.0421</td>\n",
       "      <td>1.030402</td>\n",
       "      <td>positive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>69</th>\n",
       "      <td>0.838500</td>\n",
       "      <td>1.301503</td>\n",
       "      <td>8.527997</td>\n",
       "      <td>0.0664</td>\n",
       "      <td>1.369103</td>\n",
       "      <td>positive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>70</th>\n",
       "      <td>1.066703</td>\n",
       "      <td>1.035703</td>\n",
       "      <td>8.859700</td>\n",
       "      <td>0.1019</td>\n",
       "      <td>1.369603</td>\n",
       "      <td>positive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>71</th>\n",
       "      <td>0.975000</td>\n",
       "      <td>1.046203</td>\n",
       "      <td>7.803905</td>\n",
       "      <td>0.0568</td>\n",
       "      <td>1.144302</td>\n",
       "      <td>positive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>72</th>\n",
       "      <td>1.005203</td>\n",
       "      <td>1.015003</td>\n",
       "      <td>5.739195</td>\n",
       "      <td>0.0950</td>\n",
       "      <td>0.896800</td>\n",
       "      <td>positive</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>73 rows × 6 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "        lung     heart     liver  spleen    kidney  \\\n",
       "0   0.969500  1.352002  8.185496  0.2255  1.348003   \n",
       "1   1.141003  1.499403  8.544507  0.2705  1.322103   \n",
       "2   0.872000  1.268503  6.823009  0.0500  0.897001   \n",
       "3   0.739900  1.270203  9.067509  0.1130  1.278003   \n",
       "4   1.139302  1.496203  9.621993  0.1198  1.415003   \n",
       "..       ...       ...       ...     ...       ...   \n",
       "68  0.723700  0.939400  2.631203  0.0421  1.030402   \n",
       "69  0.838500  1.301503  8.527997  0.0664  1.369103   \n",
       "70  1.066703  1.035703  8.859700  0.1019  1.369603   \n",
       "71  0.975000  1.046203  7.803905  0.0568  1.144302   \n",
       "72  1.005203  1.015003  5.739195  0.0950  0.896800   \n",
       "\n",
       "   result of testing the hamster  \n",
       "0                       positive  \n",
       "1                       positive  \n",
       "2                       negative  \n",
       "3                       positive  \n",
       "4                       negative  \n",
       "..                           ...  \n",
       "68                      positive  \n",
       "69                      positive  \n",
       "70                      positive  \n",
       "71                      positive  \n",
       "72                      positive  \n",
       "\n",
       "[73 rows x 6 columns]"
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df['result of testing the hamster'] = df['result of testing the hamster'].map({\n",
    "    'P': 'positive',\n",
    "    'N': 'negative'\n",
    "})\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "32c642fe-7232-473d-86a4-505009966ef8",
   "metadata": {},
   "outputs": [],
   "source": [
    "df.to_csv('visualizing_hamster_table.csv')"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "5421abb1-1269-4d98-bf30-07a797c1afc3",
   "metadata": {},
   "source": [
    "### xgboost"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "132c4b00-94cf-462b-b400-40a0d1883603",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "100%|█| 1500/1500 [38:50<00:00,  1.55s/trial, best l\n",
      "100%|█| 1500/1500 [25:16<00:00,  1.01s/trial, best l\n",
      "err rates: [0.405, 0.417]\n",
      "f1 scores: [0.5626477541371159, 0.5555555555555555]\n"
     ]
    }
   ],
   "source": [
    "df = pd.read_csv('visualizing_hamster_table.csv', index_col = 0)\n",
    "xgboost_benchmark(df)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a8d3f355-7cb2-420c-952c-22840880c651",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "24f0446a-e248-4adf-a55a-b029cd475be7",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "id": "b795f8e9-9dfa-4b05-a3c4-a83769b4071c",
   "metadata": {},
   "source": [
    "**LIFT**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "deaa7b96-806d-4dd2-872d-9ed4f9d7ebf1",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>lung</th>\n",
       "      <th>heart</th>\n",
       "      <th>liver</th>\n",
       "      <th>spleen</th>\n",
       "      <th>kidney</th>\n",
       "      <th>result of testing the hamster</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0.969500</td>\n",
       "      <td>1.352002</td>\n",
       "      <td>8.185496</td>\n",
       "      <td>0.2255</td>\n",
       "      <td>1.348003</td>\n",
       "      <td>positive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1.141003</td>\n",
       "      <td>1.499403</td>\n",
       "      <td>8.544507</td>\n",
       "      <td>0.2705</td>\n",
       "      <td>1.322103</td>\n",
       "      <td>positive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.872000</td>\n",
       "      <td>1.268503</td>\n",
       "      <td>6.823009</td>\n",
       "      <td>0.0500</td>\n",
       "      <td>0.897001</td>\n",
       "      <td>negative</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.739900</td>\n",
       "      <td>1.270203</td>\n",
       "      <td>9.067509</td>\n",
       "      <td>0.1130</td>\n",
       "      <td>1.278003</td>\n",
       "      <td>positive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1.139302</td>\n",
       "      <td>1.496203</td>\n",
       "      <td>9.621993</td>\n",
       "      <td>0.1198</td>\n",
       "      <td>1.415003</td>\n",
       "      <td>negative</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>68</th>\n",
       "      <td>0.723700</td>\n",
       "      <td>0.939400</td>\n",
       "      <td>2.631203</td>\n",
       "      <td>0.0421</td>\n",
       "      <td>1.030402</td>\n",
       "      <td>positive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>69</th>\n",
       "      <td>0.838500</td>\n",
       "      <td>1.301503</td>\n",
       "      <td>8.527997</td>\n",
       "      <td>0.0664</td>\n",
       "      <td>1.369103</td>\n",
       "      <td>positive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>70</th>\n",
       "      <td>1.066703</td>\n",
       "      <td>1.035703</td>\n",
       "      <td>8.859700</td>\n",
       "      <td>0.1019</td>\n",
       "      <td>1.369603</td>\n",
       "      <td>positive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>71</th>\n",
       "      <td>0.975000</td>\n",
       "      <td>1.046203</td>\n",
       "      <td>7.803905</td>\n",
       "      <td>0.0568</td>\n",
       "      <td>1.144302</td>\n",
       "      <td>positive</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>72</th>\n",
       "      <td>1.005203</td>\n",
       "      <td>1.015003</td>\n",
       "      <td>5.739195</td>\n",
       "      <td>0.0950</td>\n",
       "      <td>0.896800</td>\n",
       "      <td>positive</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>73 rows × 6 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "        lung     heart     liver  spleen    kidney  \\\n",
       "0   0.969500  1.352002  8.185496  0.2255  1.348003   \n",
       "1   1.141003  1.499403  8.544507  0.2705  1.322103   \n",
       "2   0.872000  1.268503  6.823009  0.0500  0.897001   \n",
       "3   0.739900  1.270203  9.067509  0.1130  1.278003   \n",
       "4   1.139302  1.496203  9.621993  0.1198  1.415003   \n",
       "..       ...       ...       ...     ...       ...   \n",
       "68  0.723700  0.939400  2.631203  0.0421  1.030402   \n",
       "69  0.838500  1.301503  8.527997  0.0664  1.369103   \n",
       "70  1.066703  1.035703  8.859700  0.1019  1.369603   \n",
       "71  0.975000  1.046203  7.803905  0.0568  1.144302   \n",
       "72  1.005203  1.015003  5.739195  0.0950  0.896800   \n",
       "\n",
       "   result of testing the hamster  \n",
       "0                       positive  \n",
       "1                       positive  \n",
       "2                       negative  \n",
       "3                       positive  \n",
       "4                       negative  \n",
       "..                           ...  \n",
       "68                      positive  \n",
       "69                      positive  \n",
       "70                      positive  \n",
       "71                      positive  \n",
       "72                      positive  \n",
       "\n",
       "[73 rows x 6 columns]"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df = pd.read_csv('visualizing_hamster_table.csv', index_col = 0)\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "e54f22b7-8a9a-4eb3-99c7-fc27f39e49cf",
   "metadata": {},
   "outputs": [
    {
     "ename": "ModuleNotFoundError",
     "evalue": "No module named 'lift_utils3'",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mModuleNotFoundError\u001b[0m                       Traceback (most recent call last)",
      "\u001b[0;32m/var/folders/ll/g4b6wylx35j6mmv9gvrczch40000gp/T/ipykernel_19795/1221910504.py\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0;32mfrom\u001b[0m \u001b[0mlift_utils3\u001b[0m \u001b[0;32mimport\u001b[0m \u001b[0mlift_benchmark\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
      "\u001b[0;31mModuleNotFoundError\u001b[0m: No module named 'lift_utils3'"
     ]
    }
   ],
   "source": [
    "from lift_utils3 import lift_benchmark"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 43,
   "id": "8f6ef3ab-01c3-4782-b001-f726c83a7a70",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "30    lung is 0.64, heart is 0.67, liver is 0.47, sp...\n",
      "13    lung is 0.1, heart is 0.11, liver is 0.09, spl...\n",
      "9     lung is 0.16, heart is 0.08, liver is 0.12, sp...\n",
      "8     lung is 0.13, heart is 0.0, liver is 0.07, spl...\n",
      "Name: text, dtype: object 30    1\n",
      "13    0\n",
      "9     0\n",
      "8     0\n",
      "dtype: object\n",
      "[{'prompt': 'lung is 0.64, heart is 0.67, liver is 0.47, spleen is 0.41, kidney is 0.58 -> ', 'completion': '1'}, {'prompt': 'lung is 0.1, heart is 0.11, liver is 0.09, spleen is 0.1, kidney is 0.2 -> ', 'completion': '0'}, {'prompt': 'lung is 0.16, heart is 0.08, liver is 0.12, spleen is 0.17, kidney is 0.15 -> ', 'completion': '0'}, {'prompt': 'lung is 0.13, heart is 0.0, liver is 0.07, spleen is 0.1, kidney is 0.27 -> ', 'completion': '0'}]\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Upload progress: 100%|██████████| 4.12k/4.12k [00:00<00:00, 2.45Mit/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Uploaded file from ./visualizing_hamster_rawnumbers_train.jsonl: file-hXYXh7pmP4DRhCdyTieGrNJE\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Upload progress: 100%|██████████| 4.01k/4.01k [00:00<00:00, 9.39Mit/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Uploaded file from ./visualizing_hamster_rawnumbers_test.jsonl: file-wWAbpSPH7Ztb8sfPRFnwMxgo\n",
      "\n",
      "Created fine-tune: ft-5m7cCztZQrGEAFDz8rjAo0Jc\n",
      "\n",
      "[2023-01-25 02:33:19] Created fine-tune: ft-5m7cCztZQrGEAFDz8rjAo0Jc\n"
     ]
    },
    {
     "ename": "KeyboardInterrupt",
     "evalue": "",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mKeyboardInterrupt\u001b[0m                         Traceback (most recent call last)",
      "\u001b[0;32m/var/folders/ll/g4b6wylx35j6mmv9gvrczch40000gp/T/ipykernel_4284/124679532.py\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mlift_benchmark\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdf\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdataset_name\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m'visualizing_hamster'\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mpath\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m'.'\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mn_epochs\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;36m20\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
      "\u001b[0;32m~/hari_works/prompting-tabular-data/lift_utils.py\u001b[0m in \u001b[0;36mlift_benchmark\u001b[0;34m(df, dataset_name, path, n_epochs)\u001b[0m\n",
      "\u001b[0;32m~/hari_works/prompting-tabular-data/lift_utils.py\u001b[0m in \u001b[0;36mexecute\u001b[0;34m(cmd)\u001b[0m\n",
      "\u001b[0;31mKeyboardInterrupt\u001b[0m: "
     ]
    }
   ],
   "source": [
    "lift_benchmark(df, dataset_name = 'visualizing_hamster', path = '.', n_epochs = 20)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a525361c-2e1a-4156-84e7-5ff3fba2f55f",
   "metadata": {},
   "outputs": [],
   "source": [
    "'ft-5m7cCztZQrGEAFDz8rjAo0Jc'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a101e0d3-a98f-42a0-9c04-26cee783129c",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "75db6893-342a-4d39-81ba-05887f05ebd7",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f31aeff4-d893-4175-8339-bb496291a4d0",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "id": "e8fa9b2d-1456-4749-b18a-269d83ece12b",
   "metadata": {},
   "source": [
    "This is some data about an hamster."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "796ab772-b887-4d22-b54d-0d7f826d6556",
   "metadata": {},
   "outputs": [],
   "source": [
    "def quartile(value, field, categories = None):\n",
    "    first_q = np.percentile(field, 25)\n",
    "    median = np.percentile(field, 50)\n",
    "    third_q = np.percentile(field, 75)\n",
    "    \n",
    "    if value < first_q:\n",
    "        if categories is not None: return 'is ' + categories[0]\n",
    "        return 'is below the first quartile value'\n",
    "    \n",
    "    if value < median:\n",
    "        if categories is not None: return 'is ' + categories[1]\n",
    "        return 'is between the first quartile and median values'\n",
    "    \n",
    "    if value < third_q:\n",
    "        if categories is not None: return 'is ' + categories[2]\n",
    "        return 'is between median and third quartile values'\n",
    "    \n",
    "    if categories is not None: return 'is ' + categories[3]\n",
    "    return 'is more than the third quartile value'"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "5c48e731-0803-4f66-b74d-9a1f937b4718",
   "metadata": {},
   "source": [
    "### text format"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "8f778072-fe60-4720-87c7-7ed08d9db51e",
   "metadata": {},
   "source": [
    "This is some information about an hamster."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "55591885-7094-4902-8fcb-d4d02c02d41b",
   "metadata": {},
   "outputs": [],
   "source": [
    "def quartile(value, field, categories = None):\n",
    "    first_q = np.percentile(field, 25)\n",
    "    median = np.percentile(field, 50)\n",
    "    third_q = np.percentile(field, 75)\n",
    "    \n",
    "    if value < first_q:\n",
    "        if categories is not None: return 'is ' + categories[0]\n",
    "        return 'is below the first quartile value'\n",
    "    \n",
    "    if value < median:\n",
    "        if categories is not None: return 'is ' + categories[1]\n",
    "        return 'is between the first quartile and median values'\n",
    "    \n",
    "    if value < third_q:\n",
    "        if categories is not None: return 'is ' + categories[2]\n",
    "        return 'is between median and third quartile values'\n",
    "    \n",
    "    if categories is not None: return 'is ' + categories[3]\n",
    "    return 'is more than the third quartile value'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "2fdc835b-a1d9-4e90-b39b-c1ccff4aa451",
   "metadata": {},
   "outputs": [],
   "source": [
    "import openai, os\n",
    "import tqdm\n",
    "openai.api_key = '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'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "33416b88-05ae-4a72-9b61-017bdbb84d91",
   "metadata": {},
   "outputs": [],
   "source": [
    "model = 'text-davinci-002'\n",
    "\n",
    "from tenacity import *\n",
    "\n",
    "@retry(stop=(stop_after_attempt(10)), wait=wait_fixed(5))\n",
    "def describe(prompt):\n",
    "    response = openai.Completion.create(\n",
    "        model= model,\n",
    "        prompt= prompt,\n",
    "        temperature= 0.80,\n",
    "        max_tokens=500,\n",
    "        # top_p=0.8,\n",
    "        # frequency_penalty=0.0,\n",
    "        # presence_penalty=0.0\n",
    "    )\n",
    "    result = response.choices[0].text\n",
    "    return result.strip()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "ad46b391-894b-46e5-a833-b76f9d3b3560",
   "metadata": {},
   "outputs": [],
   "source": [
    "df['text'] = ''"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "d2fe781c-a6df-41dc-bd5d-0896e8b33f78",
   "metadata": {},
   "outputs": [],
   "source": [
    "rep = quartile"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "4cd43458-a3f5-4c73-9b30-3df39a755e7c",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "10"
      ]
     },
     "execution_count": 22,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "len(\"The given data suggests that the orthopaedic patients are abnormal.\".split(' ')) # ### Hence the patient was classified as normal."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "a4a4c88b-a77b-4011-94a3-0d08ffd05fed",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>lung</th>\n",
       "      <th>heart</th>\n",
       "      <th>liver</th>\n",
       "      <th>spleen</th>\n",
       "      <th>kidney</th>\n",
       "      <th>result of testing the hamster</th>\n",
       "      <th>text</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0.969500</td>\n",
       "      <td>1.352002</td>\n",
       "      <td>8.185496</td>\n",
       "      <td>0.2255</td>\n",
       "      <td>1.348003</td>\n",
       "      <td>positive</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1.141003</td>\n",
       "      <td>1.499403</td>\n",
       "      <td>8.544507</td>\n",
       "      <td>0.2705</td>\n",
       "      <td>1.322103</td>\n",
       "      <td>positive</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.872000</td>\n",
       "      <td>1.268503</td>\n",
       "      <td>6.823009</td>\n",
       "      <td>0.0500</td>\n",
       "      <td>0.897001</td>\n",
       "      <td>negative</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.739900</td>\n",
       "      <td>1.270203</td>\n",
       "      <td>9.067509</td>\n",
       "      <td>0.1130</td>\n",
       "      <td>1.278003</td>\n",
       "      <td>positive</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1.139302</td>\n",
       "      <td>1.496203</td>\n",
       "      <td>9.621993</td>\n",
       "      <td>0.1198</td>\n",
       "      <td>1.415003</td>\n",
       "      <td>negative</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>68</th>\n",
       "      <td>0.723700</td>\n",
       "      <td>0.939400</td>\n",
       "      <td>2.631203</td>\n",
       "      <td>0.0421</td>\n",
       "      <td>1.030402</td>\n",
       "      <td>positive</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>69</th>\n",
       "      <td>0.838500</td>\n",
       "      <td>1.301503</td>\n",
       "      <td>8.527997</td>\n",
       "      <td>0.0664</td>\n",
       "      <td>1.369103</td>\n",
       "      <td>positive</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>70</th>\n",
       "      <td>1.066703</td>\n",
       "      <td>1.035703</td>\n",
       "      <td>8.859700</td>\n",
       "      <td>0.1019</td>\n",
       "      <td>1.369603</td>\n",
       "      <td>positive</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>71</th>\n",
       "      <td>0.975000</td>\n",
       "      <td>1.046203</td>\n",
       "      <td>7.803905</td>\n",
       "      <td>0.0568</td>\n",
       "      <td>1.144302</td>\n",
       "      <td>positive</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>72</th>\n",
       "      <td>1.005203</td>\n",
       "      <td>1.015003</td>\n",
       "      <td>5.739195</td>\n",
       "      <td>0.0950</td>\n",
       "      <td>0.896800</td>\n",
       "      <td>positive</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>73 rows × 7 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "        lung     heart     liver  spleen    kidney  \\\n",
       "0   0.969500  1.352002  8.185496  0.2255  1.348003   \n",
       "1   1.141003  1.499403  8.544507  0.2705  1.322103   \n",
       "2   0.872000  1.268503  6.823009  0.0500  0.897001   \n",
       "3   0.739900  1.270203  9.067509  0.1130  1.278003   \n",
       "4   1.139302  1.496203  9.621993  0.1198  1.415003   \n",
       "..       ...       ...       ...     ...       ...   \n",
       "68  0.723700  0.939400  2.631203  0.0421  1.030402   \n",
       "69  0.838500  1.301503  8.527997  0.0664  1.369103   \n",
       "70  1.066703  1.035703  8.859700  0.1019  1.369603   \n",
       "71  0.975000  1.046203  7.803905  0.0568  1.144302   \n",
       "72  1.005203  1.015003  5.739195  0.0950  0.896800   \n",
       "\n",
       "   result of testing the hamster text  \n",
       "0                       positive       \n",
       "1                       positive       \n",
       "2                       negative       \n",
       "3                       positive       \n",
       "4                       negative       \n",
       "..                           ...  ...  \n",
       "68                      positive       \n",
       "69                      positive       \n",
       "70                      positive       \n",
       "71                      positive       \n",
       "72                      positive       \n",
       "\n",
       "[73 rows x 7 columns]"
      ]
     },
     "execution_count": 23,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "id": "34e67b1e-8648-4d99-a773-e777aa32484e",
   "metadata": {},
   "outputs": [],
   "source": [
    "categories = ['very small', 'small', 'big', 'very big']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "id": "55b9aab1-8907-46bd-ac57-752573750e1b",
   "metadata": {
    "collapsed": true,
    "jupyter": {
     "outputs_hidden": true
    },
    "tags": []
   },
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "  0%|                        | 0/73 [00:00<?, ?it/s]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is very big\n",
      "    - liver : is big\n",
      "    - spleen : is very big\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "  1%|▏               | 1/73 [00:01<01:39,  1.39s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is big, heart is very big, liver is big, spleen is very big, and kidney is big. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is very big\n",
      "    - liver : is very big\n",
      "    - spleen : is very big\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "  3%|▍               | 2/73 [00:07<04:50,  4.10s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are all significantly larger than average, with the exception of the kidney which is only slightly larger. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is big\n",
      "    - liver : is big\n",
      "    - spleen : is very small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "  4%|▋               | 3/73 [00:08<03:06,  2.66s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is big, heart is big, liver is big, spleen is very small, and kidney is very small. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is big\n",
      "    - liver : is very big\n",
      "    - spleen : is big\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "  5%|▉               | 4/73 [00:15<04:56,  4.29s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster has a small lung, a big heart, a very big liver, a big spleen, and a big kidney. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is very big\n",
      "    - liver : is very big\n",
      "    - spleen : is big\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "  7%|█               | 5/73 [00:15<03:19,  2.94s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster has large organs, including a big lung, heart, and liver, as well as a large spleen and kidney. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is big\n",
      "    - liver : is very big\n",
      "    - spleen : is very big\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "  8%|█▎              | 6/73 [00:17<02:48,  2.52s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is very big, heart is big, liver is very big, spleen is very big, and kidney is big. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is very small\n",
      "    - liver : is very small\n",
      "    - spleen : is very small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 10%|█▌              | 7/73 [00:42<10:51,  9.86s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are all very small in comparison to other animals. The lungs, heart, liver, spleen, and kidney are all much smaller than average. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is very small\n",
      "    - liver : is very small\n",
      "    - spleen : is very small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 11%|█▊              | 8/73 [00:43<07:44,  7.15s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are very small in comparison to other animals. The lungs, heart, liver, spleen, and kidney are all diminutive in size. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is very small\n",
      "    - liver : is very small\n",
      "    - spleen : is very small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 12%|█▉              | 9/73 [01:04<12:04, 11.32s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are small in comparison to other animals. The lungs, heart, liver, spleen, and kidney are all petite in size. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is very small\n",
      "    - liver : is small\n",
      "    - spleen : is small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 14%|██             | 10/73 [01:06<09:06,  8.68s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is very small, heart is very small, liver is small, spleen is small, and kidney is very small. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is very small\n",
      "    - liver : is small\n",
      "    - spleen : is small\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 15%|██▎            | 11/73 [01:08<06:45,  6.55s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are all small in size. The lungs and heart are very small, while the liver, spleen, and kidney are just small. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is very small\n",
      "    - liver : is very small\n",
      "    - spleen : is very small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 16%|██▍            | 12/73 [01:16<07:02,  6.92s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are very small in comparison to other animals. The lungs, heart, liver, spleen, and kidneys are all much smaller than average. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is very small\n",
      "    - liver : is very small\n",
      "    - spleen : is small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 18%|██▋            | 13/73 [01:20<06:11,  6.20s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are all very small in comparison to other animals. The lung, heart, liver, spleen, and kidney are all disproportionately small compared to the rest of the hamster's body. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is very small\n",
      "    - liver : is very small\n",
      "    - spleen : is very small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 19%|██▉            | 14/73 [01:25<05:40,  5.77s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are all very small. The lung, heart, liver, spleen, and kidney are all very small in comparison to other animals. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is very small\n",
      "    - liver : is small\n",
      "    - spleen : is very small\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 21%|███            | 15/73 [01:26<04:07,  4.27s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is small, heart is very small, liver is small, spleen is very small, and kidney is small. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is very small\n",
      "    - liver : is very small\n",
      "    - spleen : is small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 22%|███▎           | 16/73 [01:28<03:31,  3.71s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is big, heart is very small, liver is very small, spleen is small, and kidney is very small. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is very small\n",
      "    - liver : is very small\n",
      "    - spleen : is small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 23%|███▍           | 17/73 [01:31<03:04,  3.29s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster has very small lungs, heart, liver, and kidney. The spleen is small in comparison to the other organs. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is small\n",
      "    - liver : is very small\n",
      "    - spleen : is very small\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 25%|███▋           | 18/73 [01:31<02:18,  2.51s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is very small, as is their heart and liver. The hamster's spleen is also very small, and their kidney is small. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is very small\n",
      "    - liver : is very small\n",
      "    - spleen : is small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 26%|███▉           | 19/73 [01:41<04:04,  4.54s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster has very small lungs, heart, liver, and kidney. The spleen is small in comparison to the other organs. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is very small\n",
      "    - liver : is very small\n",
      "    - spleen : is small\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 27%|████           | 20/73 [01:44<03:35,  4.07s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are all small in size. The lungs, heart, liver, and spleen are particularly small, while the kidney is only slightly larger. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is very small\n",
      "    - liver : is small\n",
      "    - spleen : is very small\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 29%|████▎          | 21/73 [01:45<02:40,  3.09s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is small, heart is very small, liver is small, spleen is very small, and kidney is small. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is small\n",
      "    - liver : is very small\n",
      "    - spleen : is small\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 30%|████▌          | 22/73 [01:46<02:09,  2.53s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is very small, heart is small, liver is very small, spleen is small, and kidney is small. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is very small\n",
      "    - liver : is very small\n",
      "    - spleen : is very small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 32%|████▋          | 23/73 [01:46<01:37,  1.94s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "This data describes the organs of a hamster. The hamster's lung is very small, as is its heart, liver, spleen, and kidney. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is small\n",
      "    - liver : is very big\n",
      "    - spleen : is big\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 33%|████▉          | 24/73 [01:47<01:15,  1.53s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster has small lungs and a small heart. Its liver is very large, and its spleen and kidney are both big. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is very small\n",
      "    - liver : is small\n",
      "    - spleen : is small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 34%|█████▏         | 25/73 [01:48<01:03,  1.33s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster has small lungs, a very small heart, a small liver, and a small spleen. The hamster's kidneys are very small. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is small\n",
      "    - liver : is small\n",
      "    - spleen : is small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 36%|█████▎         | 26/73 [01:50<01:14,  1.59s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is very big, heart is small, liver is small, spleen is small, and kidney is very small. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is very big\n",
      "    - liver : is big\n",
      "    - spleen : is very big\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 37%|█████▌         | 27/73 [01:51<01:02,  1.36s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is large, and its heart is very large. Its liver is also large, as is its spleen. The hamster's kidney is also large. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is very small\n",
      "    - liver : is very small\n",
      "    - spleen : is very small\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 38%|█████▊         | 28/73 [01:52<00:55,  1.23s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is large, while the heart, liver, and spleen are all very small. The kidney is small as well. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is small\n",
      "    - liver : is very big\n",
      "    - spleen : is big\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 40%|█████▉         | 29/73 [01:53<00:55,  1.25s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is small, heart is small, liver is very big, spleen is big, and kidney is very big. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is small\n",
      "    - liver : is small\n",
      "    - spleen : is small\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 41%|██████▏        | 30/73 [02:12<04:45,  6.63s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are small in comparison to other animals. The lungs, heart, liver, spleen, and kidney are all smaller than average. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is very big\n",
      "    - liver : is big\n",
      "    - spleen : is very big\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 42%|██████▎        | 31/73 [02:13<03:23,  4.84s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are all larger than average, with the exception of the kidney. The lung and heart are especially large, while the spleen is very large. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is big\n",
      "    - liver : is big\n",
      "    - spleen : is small\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 44%|██████▌        | 32/73 [02:13<02:26,  3.58s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung, heart, and liver are all large, while its spleen is small and its kidney is very large. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is very big\n",
      "    - liver : is big\n",
      "    - spleen : is big\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 45%|██████▊        | 33/73 [02:15<01:59,  2.98s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is large, while the heart is very large in comparison. The liver and spleen are both large, and the kidney is very large. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is big\n",
      "    - liver : is small\n",
      "    - spleen : is small\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 47%|██████▉        | 34/73 [02:25<03:15,  5.02s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lungs are small, and the heart is big in comparison. The liver and spleen are both small, and the kidneys are even smaller. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is small\n",
      "    - liver : is big\n",
      "    - spleen : is big\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 48%|███████▏       | 35/73 [02:25<02:20,  3.71s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is very small, heart is small, liver is big, spleen is big, and kidney is very big. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is big\n",
      "    - liver : is small\n",
      "    - spleen : is big\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 49%|███████▍       | 36/73 [02:40<04:17,  6.96s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lungs are small, but their heart and liver are large. The hamster's spleen is also large, but their kidneys are even larger. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is small\n",
      "    - liver : is small\n",
      "    - spleen : is small\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 51%|███████▌       | 37/73 [02:42<03:11,  5.33s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "This hamster has very small lungs, a small heart, and a small liver. However, its kidney is much larger in comparison. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is small\n",
      "    - liver : is small\n",
      "    - spleen : is very big\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 52%|███████▊       | 38/73 [02:42<02:16,  3.90s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is very small, heart is small, liver is small, spleen is very big, and kidney is small. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is small\n",
      "    - liver : is big\n",
      "    - spleen : is big\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 53%|████████       | 39/73 [02:43<01:39,  2.93s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is very big, while the heart is small. The liver and spleen are both big, and the kidney is also big. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is small\n",
      "    - liver : is big\n",
      "    - spleen : is big\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 55%|████████▏      | 40/73 [02:44<01:15,  2.27s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is very big, while the heart is small. The liver is big, and so is the spleen. The kidney is very big. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is big\n",
      "    - liver : is very big\n",
      "    - spleen : is big\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 56%|████████▍      | 41/73 [02:44<00:58,  1.83s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are large compared to the size of the animal. The lungs, heart, liver, and spleen are all bigger than average, while the kidney is especially large. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is very big\n",
      "    - liver : is big\n",
      "    - spleen : is big\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 58%|████████▋      | 42/73 [02:53<02:03,  3.99s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "This hamster has very large organs compared to the average hamster. Its lung, heart, liver, spleen, and kidney are all significantly larger than normal. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is big\n",
      "    - liver : is big\n",
      "    - spleen : is very big\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 59%|████████▊      | 43/73 [02:54<01:30,  3.00s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung, heart, and liver are all larger than average, while its spleen and kidney are both very large. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very small\n",
      "    - heart : is very small\n",
      "    - liver : is very small\n",
      "    - spleen : is very small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 60%|█████████      | 44/73 [03:00<01:49,  3.79s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are all very small. The lung, heart, liver, spleen, and kidney are all tiny in comparison to other mammals. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is very big\n",
      "    - liver : is big\n",
      "    - spleen : is very big\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 62%|█████████▏     | 45/73 [03:01<01:28,  3.14s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is very big, heart is very big, liver is big, spleen is very big, and kidney is big. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is big\n",
      "    - liver : is small\n",
      "    - spleen : is small\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 63%|█████████▍     | 46/73 [03:03<01:10,  2.60s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is big and its heart is big. Its liver is small, as are its spleen and kidney. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is small\n",
      "    - liver : is very small\n",
      "    - spleen : is very small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 64%|█████████▋     | 47/73 [03:03<00:53,  2.05s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is small, heart is small, liver is very small, spleen is very small, and kidney is very small. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is big\n",
      "    - liver : is very big\n",
      "    - spleen : is big\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 66%|█████████▊     | 48/73 [03:04<00:43,  1.76s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is small, heart is big, liver is very big, spleen is big, and kidney is very big. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is small\n",
      "    - liver : is small\n",
      "    - spleen : is small\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 67%|██████████     | 49/73 [03:19<02:12,  5.52s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is big in comparison to its other organs. Its heart, liver, spleen, and kidney are all small. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is small\n",
      "    - liver : is very big\n",
      "    - spleen : is very big\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 68%|██████████▎    | 50/73 [03:21<01:43,  4.51s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is small and its heart is small. However, its liver is very big and its spleen is very big. Its kidney is also big. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is big\n",
      "    - liver : is big\n",
      "    - spleen : is very small\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 70%|██████████▍    | 51/73 [03:22<01:13,  3.35s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster has a small lung, a big heart, a big liver, a very small spleen, and a very big kidney. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is very big\n",
      "    - liver : is big\n",
      "    - spleen : is very big\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 71%|██████████▋    | 52/73 [03:22<00:53,  2.54s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is big, heart is very big, liver is big, spleen is very big, and kidney is very big. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is big\n",
      "    - liver : is very big\n",
      "    - spleen : is very big\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 73%|██████████▉    | 53/73 [03:23<00:41,  2.08s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lungs and heart are both abnormally large, while its liver, spleen, and kidneys are all much larger than average. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is very big\n",
      "    - liver : is very big\n",
      "    - spleen : is very big\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 74%|███████████    | 54/73 [03:24<00:32,  1.69s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is big, heart is very big, liver is very big, spleen is very big, and kidney is big. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is very big\n",
      "    - liver : is small\n",
      "    - spleen : is very big\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 75%|███████████▎   | 55/73 [03:25<00:24,  1.36s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung and heart are both very large, while the liver and kidney are small. The spleen is very big. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is big\n",
      "    - liver : is very big\n",
      "    - spleen : is very big\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 77%|███████████▌   | 56/73 [03:27<00:29,  1.74s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is very big, heart is big, liver is very big, spleen is very big and kidney is big. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is big\n",
      "    - liver : is big\n",
      "    - spleen : is very big\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 78%|███████████▋   | 57/73 [03:28<00:24,  1.52s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung, heart, and liver are all larger than average, while its spleen is very large. Its kidney, however, is small. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is big\n",
      "    - liver : is small\n",
      "    - spleen : is big\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 79%|███████████▉   | 58/73 [03:36<00:50,  3.38s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lungs are small, but their heart and spleen are big. Their kidney is small in comparison to the other organs. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is very big\n",
      "    - liver : is very big\n",
      "    - spleen : is very big\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 81%|████████████   | 59/73 [03:38<00:40,  2.87s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are all very big in comparison to the rest of its body. Its lung, heart, liver, spleen, and kidney are all significantly larger than average. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is very big\n",
      "    - liver : is very big\n",
      "    - spleen : is big\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 82%|████████████▎  | 60/73 [03:39<00:33,  2.55s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are all very large in comparison to the size of the animal. The lungs and heart are especially large, while the liver, spleen, and kidney are all big. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is very big\n",
      "    - liver : is very big\n",
      "    - spleen : is very big\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 84%|████████████▌  | 61/73 [03:42<00:31,  2.63s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are all very large compared to the rest of its body. Its lung, heart, liver, spleen, and kidney are all significantly bigger than what would be expected. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is big\n",
      "    - liver : is small\n",
      "    - spleen : is big\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 85%|████████████▋  | 62/73 [03:48<00:39,  3.56s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is small, but the heart is big. The liver is small, but the spleen is big. The kidney is small. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is very big\n",
      "    - liver : is very small\n",
      "    - spleen : is very small\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 86%|████████████▉  | 63/73 [03:49<00:26,  2.68s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lungs and heart are very large, while its liver and spleen are very small. Its kidney is big. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is very big\n",
      "    - liver : is big\n",
      "    - spleen : is very small\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 88%|█████████████▏ | 64/73 [03:49<00:18,  2.06s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster has very large lungs and heart, a big liver, and small spleen. The kidney is also large in size. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is very big\n",
      "    - liver : is very big\n",
      "    - spleen : is very big\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 89%|█████████████▎ | 65/73 [03:51<00:16,  2.05s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster has big lungs, a very big heart, a very big liver, a very big spleen, and very big kidneys. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is big\n",
      "    - liver : is small\n",
      "    - spleen : is small\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 90%|█████████████▌ | 66/73 [03:53<00:13,  1.96s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is very large compared to its other organs. The heart is also significantly larger than the liver, spleen, and kidneys. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is big\n",
      "    - liver : is very big\n",
      "    - spleen : is big\n",
      "    - kidney : is big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 92%|█████████████▊ | 67/73 [04:05<00:29,  4.93s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster has a small lung, a big heart, a very big liver, a big spleen, and a big kidney. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is very big\n",
      "    - liver : is big\n",
      "    - spleen : is very big\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 93%|█████████████▉ | 68/73 [04:06<00:18,  3.76s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's organs are significantly larger than average, with the lungs and heart being especially large. The liver is also larger than average, while the spleen and kidney are very large. ### Hence, this hamster tested negative.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is small\n",
      "    - liver : is very small\n",
      "    - spleen : is very small\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 95%|██████████████▏| 69/73 [04:07<00:11,  2.84s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is small, heart is small, liver is very small, spleen is very small, and kidney is very small. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is small\n",
      "    - heart : is very big\n",
      "    - liver : is very big\n",
      "    - spleen : is small\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 96%|██████████████▍| 70/73 [04:07<00:06,  2.17s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is small, heart is very big, liver is very big, spleen is small, and kidney is very big. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is very big\n",
      "    - heart : is small\n",
      "    - liver : is very big\n",
      "    - spleen : is big\n",
      "    - kidney : is very big\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 97%|██████████████▌| 71/73 [04:08<00:03,  1.72s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is very big, heart is small, liver is very big, spleen is big, and kidney is very big. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is small\n",
      "    - liver : is big\n",
      "    - spleen : is very small\n",
      "    - kidney : is small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      " 99%|██████████████▊| 72/73 [04:09<00:01,  1.52s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster has large lungs, a small heart, a large liver, and a very small spleen. The kidneys are small. ### Hence, this hamster tested positive.\n",
      "-\n",
      "data:\n",
      "    - lung : is big\n",
      "    - heart : is small\n",
      "    - liver : is small\n",
      "    - spleen : is big\n",
      "    - kidney : is very small\n",
      "\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|███████████████| 73/73 [04:10<00:00,  3.43s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The hamster's lung is large, while the heart and liver are small. The spleen is large, and the kidney is very small. ### Hence, this hamster tested positive.\n",
      "-\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n"
     ]
    }
   ],
   "source": [
    "for i, record_dict in tqdm.tqdm(enumerate(df.to_dict(orient = 'records')), total = len(df)):\n",
    "    if df.iloc[i, -1]!='': continue\n",
    "    target_class = ''\n",
    "    \n",
    "    # for j, rep in enumerate(diff_reps):\n",
    "    record = \"\"\n",
    "    # print(rep.__name__)\n",
    "    for k, v in record_dict.items():\n",
    "        if k == 'text': continue\n",
    "        # target class.\n",
    "        if k == 'result of testing the hamster':\n",
    "            target_class = v\n",
    "        # numerical attributes.\n",
    "        else:\n",
    "            string = rep(v, df[k], categories)\n",
    "            # else: string = rep(v, df[k])\n",
    "            record += f'    - {k} : {string}\\n'\n",
    "\n",
    "    prompt = f'''This is some information about an hamster.\n",
    "\n",
    "Goal: Describe the given information in words.\n",
    "\n",
    "Case:\n",
    "{record}\n",
    "\n",
    "Use your creativity to describe this data concisely. \n",
    "'''\n",
    "    print('data:')\n",
    "    print(record)\n",
    "# The result part should strictly come after the ### separator. Add your inference.\n",
    "    while True:\n",
    "        result = describe(prompt)\n",
    "        if 20 <= len(result.split(' ')) <= 90:\n",
    "            break\n",
    "    text = f\"{result} ### Hence, this hamster tested {target_class}.\"\n",
    "    print(text)\n",
    "    df.iloc[i, -1] = text\n",
    "    print('-')\n",
    "    # break"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "id": "b042f9ce-fd77-4988-acb8-f9e3dcdd8150",
   "metadata": {},
   "outputs": [],
   "source": [
    "df.to_csv('visualizing_hamster_quartile-categorical.csv')"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "f30fff40-ca9e-43ee-ae52-8b6077b7bdd2",
   "metadata": {},
   "source": [
    "**Experiments**"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "f1d5c673-5986-40d0-ab6d-bd2b57b3afb0",
   "metadata": {},
   "source": [
    "**summarizer curie**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "id": "4c5cea9b-7323-4401-b92a-73ffc0afb9ff",
   "metadata": {},
   "outputs": [],
   "source": [
    "def train_model(X_train, y_train, temperature, sorted, summarize_prompt):\n",
    "    examples = p.prepare_incontext_examples(X_train, y_train, sorted = sorted)\n",
    "    summary = p.summarize(examples, task_prefix = desc, temperature = temperature, summarize_prompt = summarize_prompt).strip()\n",
    "    return summary\n",
    "\n",
    "import random\n",
    "from tenacity import retry\n",
    "\n",
    "model = 'text-curie-001'\n",
    "\n",
    "from tenacity import *\n",
    "\n",
    "@retry(stop=(stop_after_attempt(10)), wait=wait_fixed(5))\n",
    "def describe(prompt):\n",
    "    response = openai.Completion.create(\n",
    "        model= model,\n",
    "        prompt= prompt,\n",
    "        temperature= 0.80,\n",
    "        max_tokens=500,\n",
    "        # top_p=0.8,\n",
    "        # frequency_penalty=0.0,\n",
    "        # presence_penalty=0.0\n",
    "    )\n",
    "    result = response.choices[0].text\n",
    "    return result.strip()\n",
    "    \n",
    "def normalize(arr):\n",
    "    return arr/arr.sum()\n",
    "\n",
    "def sample(X_train, y_train, w, num_examples = 20):\n",
    "    indices = list(range(len(X_train)))\n",
    "    sampled_indices = np.random.choice(indices, size = num_examples, replace = True, p = w)\n",
    "    # print('sampled indices:', sampled_indices)\n",
    "    # print('top sampled indices: ', pd.Series(sampled_indices).value_counts().index.tolist()[:5])\n",
    "    return X_train[sampled_indices], y_train[sampled_indices], sampled_indices\n",
    "\n",
    "def cluster_sample(embeddings, X_train, y_train, w = None, num_examples = 15):\n",
    "    sampled_indices = []\n",
    "    for cls, required_samples_cnt in np.round((pd.Series(y_train).value_counts() / len(y_train) * num_examples)).astype(int).items():\n",
    "        cls_samples = embeddings[y_train == cls]\n",
    "        \n",
    "        sample_indices = np.where(y_train == cls)[0].tolist()\n",
    "\n",
    "        cm = AgglomerativeClustering(n_clusters=None, affinity='cosine', linkage='average', distance_threshold=0.05)\n",
    "        cm.fit(cls_samples)\n",
    "        cluster_assignment = cm.labels_\n",
    "\n",
    "        cluster_weights = len(cls_samples) / pd.Series(cluster_assignment).value_counts()\n",
    "        sample_weights = pd.Series(cluster_assignment).map(cluster_weights).to_numpy()\n",
    "        sample_weights = normalize(sample_weights)\n",
    "        \n",
    "        if w is not None:\n",
    "            w_cls = w[y_train == cls]\n",
    "            sample_weights*= w_cls\n",
    "            sample_weights = normalize(sample_weights)\n",
    "            \n",
    "        picked_example_indices = np.random.choice(sample_indices, size= required_samples_cnt, replace=False, p= sample_weights)\n",
    "        sampled_indices.extend(picked_example_indices)\n",
    "    \n",
    "    return X_train[sampled_indices], y_train[sampled_indices], sampled_indices\n",
    "\n",
    "@retry(stop=(stop_after_attempt(10)), wait=wait_fixed(5))\n",
    "def batch_predict(summary, X, y, cot):\n",
    "    pred_texts = p.run_predictions(\n",
    "                taskname = '', #desc,\n",
    "                texts = X,\n",
    "                summary = summary,\n",
    "                temperature = 0.,\n",
    "                query_instruct_text = query_instruct_text,\n",
    "                cot_text = cot,\n",
    "                printf = False,\n",
    "                sleep = .1\n",
    "            )\n",
    "    # print('pred texts:', pred_texts)\n",
    "    y_preds = []\n",
    "    for pred in pred_texts:\n",
    "        y_pred = 'unk'\n",
    "        for cls in classes:\n",
    "            if pred and cls in pred.lower():\n",
    "                y_pred = cls\n",
    "                break\n",
    "        if y_pred == 'unk':\n",
    "            print('this couldnt be parsed : ', pred)\n",
    "        y_preds.append(y_pred)\n",
    "    y_preds = np.array(y_preds)\n",
    "    err_rate, num_errors, total, err_indices = compute_error_rate(y, y_preds, return_indices = True)\n",
    "\n",
    "    # indicator fn vector.    \n",
    "    misclassifications_vector = np.array([1. if i in err_indices else 0. for i in range(len(X))])\n",
    "    \n",
    "    return err_rate, num_errors, total, err_indices, misclassifications_vector, y_preds"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "id": "4d954eee-536f-4707-a832-1ac733e3c303",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>lung</th>\n",
       "      <th>heart</th>\n",
       "      <th>liver</th>\n",
       "      <th>spleen</th>\n",
       "      <th>kidney</th>\n",
       "      <th>result of testing the hamster</th>\n",
       "      <th>text</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0.969500</td>\n",
       "      <td>1.352002</td>\n",
       "      <td>8.185496</td>\n",
       "      <td>0.2255</td>\n",
       "      <td>1.348003</td>\n",
       "      <td>positive</td>\n",
       "      <td>The hamster's lung is big, heart is very big, ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1.141003</td>\n",
       "      <td>1.499403</td>\n",
       "      <td>8.544507</td>\n",
       "      <td>0.2705</td>\n",
       "      <td>1.322103</td>\n",
       "      <td>positive</td>\n",
       "      <td>The hamster's organs are all significantly lar...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>0.872000</td>\n",
       "      <td>1.268503</td>\n",
       "      <td>6.823009</td>\n",
       "      <td>0.0500</td>\n",
       "      <td>0.897001</td>\n",
       "      <td>negative</td>\n",
       "      <td>The hamster's lung is big, heart is big, liver...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>0.739900</td>\n",
       "      <td>1.270203</td>\n",
       "      <td>9.067509</td>\n",
       "      <td>0.1130</td>\n",
       "      <td>1.278003</td>\n",
       "      <td>positive</td>\n",
       "      <td>The hamster has a small lung, a big heart, a v...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1.139302</td>\n",
       "      <td>1.496203</td>\n",
       "      <td>9.621993</td>\n",
       "      <td>0.1198</td>\n",
       "      <td>1.415003</td>\n",
       "      <td>negative</td>\n",
       "      <td>The hamster has large organs, including a big ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>68</th>\n",
       "      <td>0.723700</td>\n",
       "      <td>0.939400</td>\n",
       "      <td>2.631203</td>\n",
       "      <td>0.0421</td>\n",
       "      <td>1.030402</td>\n",
       "      <td>positive</td>\n",
       "      <td>The hamster's lung is small, heart is small, l...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>69</th>\n",
       "      <td>0.838500</td>\n",
       "      <td>1.301503</td>\n",
       "      <td>8.527997</td>\n",
       "      <td>0.0664</td>\n",
       "      <td>1.369103</td>\n",
       "      <td>positive</td>\n",
       "      <td>The hamster's lung is small, heart is very big...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>70</th>\n",
       "      <td>1.066703</td>\n",
       "      <td>1.035703</td>\n",
       "      <td>8.859700</td>\n",
       "      <td>0.1019</td>\n",
       "      <td>1.369603</td>\n",
       "      <td>positive</td>\n",
       "      <td>The hamster's lung is very big, heart is small...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>71</th>\n",
       "      <td>0.975000</td>\n",
       "      <td>1.046203</td>\n",
       "      <td>7.803905</td>\n",
       "      <td>0.0568</td>\n",
       "      <td>1.144302</td>\n",
       "      <td>positive</td>\n",
       "      <td>The hamster has large lungs, a small heart, a ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>72</th>\n",
       "      <td>1.005203</td>\n",
       "      <td>1.015003</td>\n",
       "      <td>5.739195</td>\n",
       "      <td>0.0950</td>\n",
       "      <td>0.896800</td>\n",
       "      <td>positive</td>\n",
       "      <td>The hamster's lung is large, while the heart a...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>73 rows × 7 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "        lung     heart     liver  spleen    kidney  \\\n",
       "0   0.969500  1.352002  8.185496  0.2255  1.348003   \n",
       "1   1.141003  1.499403  8.544507  0.2705  1.322103   \n",
       "2   0.872000  1.268503  6.823009  0.0500  0.897001   \n",
       "3   0.739900  1.270203  9.067509  0.1130  1.278003   \n",
       "4   1.139302  1.496203  9.621993  0.1198  1.415003   \n",
       "..       ...       ...       ...     ...       ...   \n",
       "68  0.723700  0.939400  2.631203  0.0421  1.030402   \n",
       "69  0.838500  1.301503  8.527997  0.0664  1.369103   \n",
       "70  1.066703  1.035703  8.859700  0.1019  1.369603   \n",
       "71  0.975000  1.046203  7.803905  0.0568  1.144302   \n",
       "72  1.005203  1.015003  5.739195  0.0950  0.896800   \n",
       "\n",
       "   result of testing the hamster  \\\n",
       "0                       positive   \n",
       "1                       positive   \n",
       "2                       negative   \n",
       "3                       positive   \n",
       "4                       negative   \n",
       "..                           ...   \n",
       "68                      positive   \n",
       "69                      positive   \n",
       "70                      positive   \n",
       "71                      positive   \n",
       "72                      positive   \n",
       "\n",
       "                                                 text  \n",
       "0   The hamster's lung is big, heart is very big, ...  \n",
       "1   The hamster's organs are all significantly lar...  \n",
       "2   The hamster's lung is big, heart is big, liver...  \n",
       "3   The hamster has a small lung, a big heart, a v...  \n",
       "4   The hamster has large organs, including a big ...  \n",
       "..                                                ...  \n",
       "68  The hamster's lung is small, heart is small, l...  \n",
       "69  The hamster's lung is small, heart is very big...  \n",
       "70  The hamster's lung is very big, heart is small...  \n",
       "71  The hamster has large lungs, a small heart, a ...  \n",
       "72  The hamster's lung is large, while the heart a...  \n",
       "\n",
       "[73 rows x 7 columns]"
      ]
     },
     "execution_count": 35,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df = pd.read_csv('visualizing_hamster_quartile-categorical.csv', index_col = 0)\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "id": "204108a3-e4b0-4bef-8834-97ac039e77b9",
   "metadata": {},
   "outputs": [],
   "source": [
    "# multi-class classification\n",
    "dataset_name = 'visualizing_hamster'\n",
    "desc = '''This data gives information about hamsters that tested positive and negative for some disease.'''\n",
    "classes = ['positive', 'negative']\n",
    "simple_prompt = \"Tl;dr\"\n",
    "# detail_prompt = \"Using these examples and based on their treatments and attributes, summarize how we can tell if the person will have recurrence or non-relapse of the same breast cancer ?\"\n",
    "query_instruct_text = 'Therefore, this hamster is likely to be tested (positive or negative): '\n",
    "detail_prompt = 'Using these examples, summarize how can we differentiate hamsters that test positive and negative.' #'Summarize this text for a ML model that will predict whether heart disease is present or absent in a patient.' #'Using these examples, summarize under what conditions are the heart disease present and absent.'\n",
    "# cot_text = 'Therefore, this woman will have a (recurrence or non-relapse): '\n",
    "ycol = 'result of testing the hamster'\n",
    "model = 'text-curie-001'\n",
    "\n",
    "global_best_params = {\n",
    "    'cot': None,\n",
    "    'sorted': False,\n",
    "    'summarize_prompt': detail_prompt,\n",
    "    'temperature': 0.79\n",
    "}\n",
    "\n",
    "# dataset_name = 'tae'\n",
    "# desc = '''This data is from TA evaluations in UW Madison Statistics Department that gives details about class scores achieved when assisted by a TA. The goal is to infer based on the information about the TA and the class, whether the class scores will be low or high or medium.'''\n",
    "# classes = ['high', 'medium', 'low']\n",
    "# simple_prompt = \"Tl;dr\"\n",
    "# detail_prompt = \"Using these examples, summarize when will the class score low, medium or high.\"\n",
    "# query_instruct_text = 'Predict if this class will score low or medium or high:'\n",
    "# cot_text = 'Therefore, this class will score as (low, medium, high):'\n",
    "# model = 'text-curie-001'\n",
    "# ycol = 'Class_scores'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "f66d7726-bb9e-475f-81ea-20224cf60a55",
   "metadata": {},
   "outputs": [],
   "source": [
    "dataset_file = 'visualizing_hamster_quartile-categorical.csv' #f'datasets/{dataset_name}/'\n",
    "table = pd.read_csv(dataset_file, index_col = 0)\n",
    "\n",
    "# ycol = 'positive_or_negative'\n",
    "X = table['text']\n",
    "y = table[ycol]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "2afa2b8b-39d3-4842-816f-1a73532fa6a4",
   "metadata": {},
   "outputs": [],
   "source": [
    "from sklearn.metrics.pairwise import cosine_similarity"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "023660ae-1726-409e-aa6e-8cc15a9cb65a",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<AxesSubplot:>"
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAWAAAAD3CAYAAAAjdY4DAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/YYfK9AAAACXBIWXMAAAsTAAALEwEAmpwYAAA+iUlEQVR4nO2de1yU1fb/PwwDw100xdsRNQ0PlqZS2rG8IHktUzsdwAvmUUvREpEUFS+oIKBftItaWWaJGVB2zMy0yAteMhVT0yOUmKZgpqLCjMLAzPP7g194Oaw1D3IbpvXuNa9X8mHtZ7Pnmc3D3mt/lp2iKAoEQRCEGkdT2x0QBEH4qyITsCAIQi0hE7AgCEItIROwIAhCLSETsCAIQi2hrdbGHZuzekSznqT2xu/72NgfWzxCaif19UktVjnLtuvl4EFqK93NbOyQq9dJ7Wnn1mzs9MZ/kJrGnk5U6Zd9i213WysXUtuS24yN7YoCUhtqOMPGnhzditTCNunY2GZwJLVzSiGpTbcrZtu9XuhEau070+MPANNPNSS1fka6XQD4yoF+j4KK+LE452BPagPrXSa1IZdvsO2+pm1LauE3DrCxhSZ6nGd5PcXGPm9P9+uRM1vYWDUUX+HvyztxaPhgpa9XWap1AhYEQahRzKba7kGFUD0Bm81maDSyYiEIghWj8H+lWhvsBHz+/HnExcXhxIkT0Gq1MJvN8PHxwaxZs9C6Nf8ntSAIQo1jtqEJOCoqChEREXj00UfLvnb06FHMmjULycnJ1d45QRCEiqDY0hOw0Wi8a/IFgE6dOlVnfwRBEO4fU0lt96BCsBNwu3btMGvWLPTo0QPu7u4wGAzYvXs32rVrp6pxLssBABJz00ntpWZPsrEHbtI75QHNL5Ja3yvebLvc78/9N+gdaQB4HZ6k9hn4zYHNTEbCqAH0Dv2g3CZsuy5Ncknth0t8BkWJyZ3Uluk6srE7kunMjYcd+b2ERsxQvdyU3kW/dJHOYAGAdU50nxIb8tshixpfI7Xvf2vKxhaCnhSyHOksFQA4ozGSmmdeI1Ib4NyA7xMzxpMbdmVjtYodqe0wXWJjR7rzn6FKY0ubcNHR0UhLS0NGRgb0ej3c3Nzg7++Pvn371lT/BEEQ1GNLSxB2dnbo27evTLiCINQNbGkTThAEoS5R1zbhJLFXEATbwWxW/2KbMWPevHkICgpCSEgIzp079z/fk5eXh/79+6OoqAgAUFhYiFdffRUjRozASy+9hLy8PIvdlQlYEATbwVSs/sWQlpYGo9GIlJQUREREID4+/i59z549GDt2LC5fvn0c/JNPPoGPjw82bNiAoUOHYtWqVRa7W61LEJb8HLhMh/dy+dixjeid2vMXaC+IZOMJtt1H3VqS2mgHevcXAMLsaJ+CtkyGBAD0c6fP9ZdcKSK1pOvH2HYjzfRO+YMK72HQsZi+bhjo7AoA2NWXbnv3HrpPAKAwt+XbVxqTWmhTfge+fw6fMcLxziU69u92/H3B0aKYL0hj70Bn+zyqozNCIq/zngjLnDqR2ow83gvCxPyZH+HFZy9p7HnPjUpTgSWIlJQUpKSklP07KCgIQUFBAICMjAz06NEDQGnq7YkTd88bGo0Ga9euxT//+c+yr2VkZGD8+PEAgJ49e9b+BCwIglCjVGAT7s4J917+zPr6E3t7e5SUlECrLZ0yn3zyf3/R6PV6uLuXpm66urqioIA2s/qTCk/ARqMRjo70b2VBEIRao4o24dzc3GAwGMr+bTabyyZfNTEGgwEeHnxeOsCsAe/YsaMs53fr1q1lX//zEVsQBMHqqKJNuC5duiA9vfSg2NGjR+Hj42Px0l26dMHu3bsBAOnp6fDz87MYQ07p77zzDjZt2gSz2YywsDAUFRVh2LBhkCLKgiBYK4qZ31xTS9++fbFv3z4EBwdDURQsXrwYa9euhbe3NwICAsqNGT58OCIjIzF8+HA4ODggMTHR4nXICdjBwQH16tUDAKxatQovvvgimjZtCrtKbDgIgiBUK1V0EEOj0WDhwoV3fa1Nmzb/8307duwo+39nZ2e8+eabFbqOnUI80s6YMQP169dHWFgYXFxccPHiRYwbNw75+fnYu3evqsZPPTSI1Q/cpM+rPwIDqQHAPy4fJLVrk7qQ2rnN/BO8sZg+qz6u+Aobu3uwK6lt/sqLjU2yv0pqrxR7klprF36hf3sJHVtgx4/Fp4WnSW3vU85s7NhDtI9ErAP/Ibl+k86g6DSP9swoSD3OtvvHWXpN7kBxPTZ21AI6C+KlhXzGQUAJ7fewi6mWAQAPwIHUNjAZMN/WpyteAMBhI/3zPunB3+ca5r45dJ2uHAIAeg39APfShfVsrBoKMzap/l4nv6GVvl5lIdeAFy9ejHbt2pU98TZt2hTr1q3DwIEDa6xzgiAIFcJsUv+yAsglCK1Wi+eff/6urzVs2BBRUVHV3ilBEIT7oo4dRZY8YEEQbAcx4xEEQaglbMmQXRAEoU4hT8CCIAi1g6JYx+aaWqp1Aj6pp01xAL50EGeoA/CpZvVXHaHjXn6U1ABgy+d0es6eF/lyKuOS6d++KzucZ2OH9aRNgF5fTd9UvQfwN5zhKzplKLz372xshCudJvjaVjdSA4BPvvw3qf37udVsrKeOHufZsadI7UEtb/Kz8s0nSG3X5KNs7LPz6RS3WDM/Fm5O10ltqJ+ejT219wFSWzSFvpfNV2ijHgDYsJW+V7szJYcAIE1Pp5rdsjCjFFb3MYI69gSs2o7y6lU6T1UQBMEqUMzqX1YA+fvq119/vevfkZGRSEhIAAC0bt26enslCIJwP9SxJ2ByAv73v/8NJycneHl5QVEU/Prrr5g3bx7s7Oywbt26muyjIAiCOmwlC2Ljxo2YP38+hg8fjieffBIhISFISkqqyb4JgiBUDCtZWlALOQE/8MADeP3115GQkICffvqpJvskCIJwf9jKEgRQehw5KioKn3/++X3ZUMYqZ1m97xVvUrNUOmjrZjprgMt0qL+aL+GT0MSf1PK+43eW/c1NSW1RFl/+J7KAzpKYtpTuk8eod9l28z+i/ZuXzWRD0d9EGyI10NImMQBwMzqB1CYU8sZELRrR41xspIsBtJxB308A8MarR0ktbE13NrZ/2GZSMxYZ2dgPmCyJful8BkUx4z6Y8+k1UmufzT805fagzXo6HOZLO3m70vdFlPlvbGy/mbRJU5VgSxPwnzz//PP/4wshCIJgddjKEoQgCEKdw1Y24QRBEOoctrgEIQiCUCeQJQhBEIRaoo49AZMliaqC/i346hkd7D1JLcvMl9pZoNB+AVkmemc5V8sfRo/8fSepffJAbzZ2i66Q1E4Z+TIv0SY6g8LnAXq3O8XAl4DxN9J92uvIlxV60EjfGh875LOxH/a6SWoBaXzWQGtH2oPiKYXeRe9gIRvBrx99nP7nHXwJ8f32dLkpjYVP0BbQ1+2poX9WALhoR69pjjXR7+3XGj67QgP6c3AcvD9FgUIXvuwN3sOlrZGeIIf+voGNVcOt1IWWv+n/4xw4r9LXqyyqvSAAIC8vT6oiC4JgvSiK+pcVwC5BbNy4ERcvXoS/vz8iIiKg0+lQWFiI+fPno3t3Pm9SEAShximxoSyIDRs2ICkpCaGhoXj77bfRunVrXLp0CZMmTZIJWBAE68OWNuEcHBzg4uICV1dXtGjRAgDQuHHjskrJgiAIVkUd24RjJ+A+ffogNDQUPj4+mDBhAnr06IE9e/bgiSdoY2tBEIRaw0rWdtXCTsAvv/wyDh48iL1796JZs2a4evUqQkJC0Lt3b1WNr3Tnfxvtv0FnMox24J+yXyykswq4yhWW/By8i3uT2vCru9jYa2M7kNr7W1uwsRElP5PaG1cfJLWRTf9g2/3wGu274G7hXo0spqtPZPSkK4cAwNw99HVX2NG76ABwqYj2zegX24TUDKmH2HaLmUSUr7UubOz0RfT7t3DeOTZ2QiGdGfC1E5+5UZ/5iE40XSe1TxvRfg0AsO0PehzjGvKxHNkX+fd2tzP98wy976vegS09AQNA165d0bVr15roiyAIQuWwtQlYEAShrqCYpCinIAhC7SBPwIIgCLWELaWhCYIg1CnMNpQFUVmGXL3O6q/Dk9TC7Ohz7gCwezB9Nn9cMv1bkKtaAQDf626RGpflAAD1P6CrEOxs8A829uWX6Aof366hT4xvudqYbdevmF4Ta98wj40d70/v3jf7NJuNvbI5iNQCx25hY5to6CyWceF0ZYqJDR5j250ZRN9TTx3hd++bT/6M1Na7+LGx2Y70x2xeI/49OP4bnU0ydzjtX/HRRj5LpZAxIQjL0/F9MtDVW6a48vdjW36YK48tL0EYjUaYzWY4OfHldQRBEGoFW9qE+/XXX7F8+XI4ODggJCQEkZGRKCkpQUREBAYNGlRTfRQEQVBHFT0Bm81mREdHIysrC46OjoiJiUHLlrf/Sk1NTUVycjK0Wi1CQ0Ph7++P3NxczJgxA4qioF69ekhMTISzM+84yLqhzZ07F8HBwejXrx8mTJiAdevW4csvv8RHH31UJT+kIAhClWJW1L8Y0tLSYDQakZKSgoiICMTHx5dply9fRlJSEpKTk7FmzRosW7YMRqMRH374IQYOHIiPP/4YDz30ED77jF62+hN2Ai4pKUH37t3Rr18/eHp6onHjxnBxcYFWK3t3giBYIYpZ/YshIyMDPXr0AAB06tQJJ07crtJ+/PhxdO7cGY6OjnB3d4e3tzcyMzPh6+uL/PxSn2y9Xq9qnmS/o3nz5ggPD4fJZIKrqyuWL18ONzc3NGrUyGLDgiAINU4FsiBSUlKQkpJS9u+goCAEBZVuHuv1eri53Ta1t7e3R0lJCbRaLfR6PdzdbxcGcHV1hV6vR5MmTZCYmIgtW7bAaDTilVdesdgHdgJOSEjA7t270apVK7i6uuLDDz+Ek5MTFi9erOoHfNq5Nat/BnrBvC2TIQEAm7+id2pXdqB3aRdl8RuIXOUKS34OXKaDf973bGxikj+pjX2B3imftYWuEAEA/2pzidTiz9J+AADgsJv24/igHh97NpTOVmit4fvcVHEgtVPd6CwWp4f5Kip539FVOjp1531kf77ZjNS2nOCfdPZr6AoTP/zBZys0Z5YQ81PpLIhMRz7dYHgh/dk748T7YnRwf5jUvHhrC/i3yuG/oZIoFVgDvnPCvRc3NzcYDLc9Mcxmc9kT7b2awWCAu7s75s2bh7i4OPTo0QO7du1CZGQkVq9ezfaBvXO0Wi0CAgLK/j1z5kzLP5UgCEJtUUVZEF26dMHOnTsxaNAgHD16FD4+PmVax44d8frrr6OoqAhGoxHZ2dnw8fGBh4dH2ZOxl5dX2XIEhyzmCoJgO1TRQYy+ffti3759CA4OhqIoWLx4MdauXQtvb28EBAQgJCQEI0aMgKIoCA8Ph06nw9y5c7Fw4UKYzWYoioJ58yzXnJMJWBAE26GK0tA0Gg0WLry7wGebNm3K/j8wMBCBgYF36W3btsW6desqdB2ZgAVBsB3kKLIgCEItUcfMeOyUaqwzf6FbH1bfnEvvLPdzv8zGTi6gU5g/n0inyd34is6QAICj2fRZ9gjlDBt7mPFzeD+JP18f8ftOUsvt0ZbUjHraNwEAjp+lvQR2OPNVR7LMdFbBhkF81sCUbbRXR5QLnRUAAIWFdBZEm7jHSa1kJ59pUphN+3z8dJz3MPjH251I7etJJ0gNAHTMR2yLM79pZA/6PTpnpitXvNOczvgAgOxfHyC1h9oypUMAaBzoSS7rFH2/AcAV0O/t879vYGPVYIj6l+rvdY39tNLXqywWn4DT0tLw/fffo6CgAB4eHvDz88OAAQOkMKcgCFaHUmJDXhALFiyA2WxGz5494erqCoPBgPT0dOzduxexsbE11UdBEAR12NIa8C+//IL169ff9bWAgAAEBwdXa6cEQRDuizq2Bsx6QZjNZhw+fPiurx06dAgODvQ6jiAIQq1RRWY8NQX7BBwfH4+4uDhMmzYNiqJAo9Ggffv2WLRoUU31TxAEQTWKlUysaqnWLIjc7rS/AQC4PUw/SZdcKWJj931PZ1Ac19EP9tOWtmPbzYneR2pnrtIVIgDgph193YAXrrOxt07RO9rN9pwmtYKPxrPtPjZ1G6kdnExnVwDA9lX0reGp8FkQ3V6mtY0fOLKxucxjQQvG4uCgI9+nhNR/klqPoW+xsa8ptA/INS2/IR34GJ15k2fBm8TJnf6Bfz3XgNQee4Ov3rJsxs+kFvYvPkvl0ja6ssiVPDr7BQCi7elMlK/Pf83GqqHgFfU+5e4rtlb6epWFfQIOCQlBcXH5N0BycnK1dEgQBOG+qWNPwOwE/Nprr2HOnDlYuXIl7O35fFNBEIRax5Ym4EcffRRDhgxBVlYW+vbtW1N9EgRBuC+qcUW1WrB4EGP8eH6NURAEwWqwpSdgQRCEOoVMwLfpx5y9B4BBuXRVhaTrx9jYbxvQVRV6D6CPI3qMepdtN7ppb1Ib2fQPNnbLVdpPwFLlipmN6Z1lLtPB/cX32XYLPhhDaq9HnWNjn7an/QQ+ceC9LTpn/k5qTUr4ahqPu9BG1iZ7OtNk2Iw2pAYAK174gtTSVw9lY8+Gp5FakZH/GC36ka7i0Zf/iKA4j/55fevTlVI8QvhKDL919SG1Nu9dZGObuzQktXkK7TEBABvD+AoglUUpsaGDGHl5eYiPj8fy5ctx7dq1sq+vWLGi2jsmCIJQYcwVeFkB7AQ8Y8YMtG7dGl5eXhg1ahRyckrrOR08eLBGOicIglARFLOi+mUNsH87GY3GsqJ1vr6+mDRpEpKSkurcTqMgCH8RrGRiVQv7BGwymZCVlQWgtEjdhAkTEBoaCr2ePykjCIJQK9jSEsScOXMQExODK1dKDZoHDRqEwMBA5Obm1kjnBEEQKkJdW4K4Ly8Is9kMjYaduwFYrojh0oTOVrDkKvfhMfpsvsGO/pGmx/P+Bz9Oo6sbfOPIn9v3K6I73fXv/M5yxik6M2A6fiW1w4lPs+26j/2Q1PJefJiNfecburpB10Leq8PXl65osuX039jYk1ra06FnIX3fbXYysu2uXE3fjy1eeJ2Nfd/lMVI7qeO9ICa0v0Bqx47wGSH1HensmCyTG6kNXdKKbTdqTjapLXiO/wv3jx20P0XOFQ82NsaBrrLyzXnat0QtecN6qf7eBv/ZXenrVRbxghAEwXawkqUFtYgXhCAINkMd82MXLwhBEGwIW5qAAfGCEASh7mBTT8CCIAh1CQt1AqyOap2At+TSVSsA4IdL9EH4BxU+48DEZDqE96Z9CJbNZJuFg6MzqblbyBdp35A+mx9/lt/ttnemd9IPjqUzNyz5OXCZDg0+OsnGvtmYzoKop+MzDt7/tTmptbLwlPKyI+0F0awv/QkL0PG38+dj9pPar6N4Hwml+AqplWxpxMb2O0pn+/Rm3ncA2GLIIbVhrg+R2umos2y7I0x0dsX7mzzZ2PpM5ffzOv5Dsr6tBfOLSlLXnoAt55LdQVxcXHX1QxAEodIoZvUva4B9ZLiz/LyiKMjOzsaxY6UuZZKGJgiC1aHwf1FYG+wEPHLkSGzcuBFRUVFwdnZGREQEEhMTa6pvgiAIFcJanmzVwk7AgwcPRps2bbB06VLMnDkTOp0OzZvTa3uCIAi1iWK2oSdgAGjfvj0SEhIwZ86cuzyBBUEQrA2zycYmYACoX78+3nrrLZw8ye+a30tX0Oe+AaDERFeJ6FjMew2EKr+RWoRrA1LrbzKw7Z41uZJaZPEpNna8f31Sc9jN3xinzPRYbV9Fn6/nqlYAvJ8Dl+UAAFMu7SS13/15Tw1NJv3eeploLwEAyMz3JDXvTvR7W5j2E9vuk170dVM309VMAGD4PDrT4dC3dNYNAIw3tSK1H8Hf5+Nd/k5qnxnPk9pKO3qcAOAXhb7P/e3pLBQA0Orov/Pr3+S9ID44TXu4WEhQUoVNLUGU5wWhKArs7OxkE04QBKujqpYgzGYzoqOjkZWVBUdHR8TExKBly5ZlempqKpKTk6HVahEaGgp/f3/cvHkT0dHRuHDhAoqLizF37lx07NiRvY54QQiCYDNUVa2ItLQ0GI1GpKSk4OjRo4iPj8fbb78NALh8+TKSkpKwceNGFBUVYcSIEXjyySexZs0aPPTQQ1iyZAkyMzORmZlZuQlYvCAEQahLVNUTcEZGBnr06AEA6NSpE06cuG1Te/z4cXTu3BmOjo5wdHSEt7c3MjMzsXfvXgwcOBDjxo2Dq6sr5s+fb/E64gUhCILNUJFNuJSUFKSkpJT9OygoqKwEm16vh5vbbb9le3t7lJSUQKvVQq/Xw9399h6Hq6sr9Ho9rl27hvz8fKxZswabNm1CQkIClixZwvZBvCAEQbAZKvIEfOeEey9ubm4wGG5v2JvNZmi12nI1g8EAd3d3eHp6ok+fUtN/f39/rF692mIfqnUCHmo4w+rLdPT6SBj4skd7n6I9G17bSlcKaKB1YNvN1NA7wBk967GxzT6lqwx8UI/3gpg7hPY4OPQfWvvEQce2+9wtepfdkp8Dl+nQZOdpNrZgfQCp/fO1A2xsCw29Qx8+bw+pTXXtwLY7phddlaTjDj475pHZdAbQ/2l92dhTjD/Ca0589YmjNxxJ7dsB9L0cu5P3UmnOTFRvlvDZS2dvXCK1mR5d2FgfpmpMVaBU0Um4Ll26YOfOnRg0aBCOHj0KHx+fMq1jx454/fXXUVRUBKPRiOzsbPj4+MDPzw+7d+/GI488gkOHDqFtWz5TCLAwAZ8/fx5nzpxBt27dsHr1apw8eRJt27bFxIkT73oEFwRBsAaqKg2tb9++2LdvH4KDg6EoChYvXoy1a9fC29sbAQEBCAkJwYgRI6AoCsLDw6HT6TBhwgTMmTMHQUFB0Gq1SEhIsHgddgKOjIxEWFgYYmNj0aRJE0ydOhWHDh1CRESEqsdrQRCEmsRcRU/AGo0GCxcuvOtrbdrcdswLDAxEYGDgXbqnpydWrFhRsetwor29Pbp164YLFy5g8uTJ8PX1xejRo1FQwP+JIgiCUBsoip3qlzXATsDu7u7Ytm0bevXqhU2bNuHGjRvYvHkznJ3p9VdBEITawmyyU/2yBtgliJiYGCxduhRHjhxBTk4OPD094efnh5iYmJrqnyAIgmrqmhmPnaJU1dmR/6Vg6mBW35FMb+T17kvvtALAmN0upPbJl6GkdjOaXxi3d6N/J83d05CNTXjfn9TOhm5mY5cU039VrAihTyEaM/9g2zVepjWuagUAaEDfzFOX+pAaALiPepfU8mP7s7FwpHf+HYZHkFrxhv9jm/1pCT0YPv+gq5kAgNu7H5DawUdmsLGO9nQJid32dMYHALgwn87tdtdJba0fv0xop6XfW/sGfGaNfWPa8+TX9XxWR8t+dEaP+zvb2Fg1nHjwWdXf+8iZLZW+XmWpsBfEn4gXhCAI1oa1rO2qRbwgBEGwGarv7/nqQbwgBEGwGaoqDa2mEC8IQRBsBnMd24QTLwhBEGyGuvYEXK1ZEGNbvcDqD5vp8+o5Gnq3FADG29O7vItK6DPyEwp5L4jXNHR1gxV2dFUEAIjV0t4KrRl/AwCY4nKd1PbfoK/bpIQfp/MO9O9YJwvHNrnKFct1/C77Z6/S3hceUdvZ2F5eD5Oat5bOnGmn8Pnpr75Ea5++zYYi3aGQ1FopfNZAth0d25vJfgGA4w70+ztOQ2ccXDTw99sWZ3qi8lL4/Z5M3CK1h8D/PHo7+qZbcvYTNlYNh5oPU/29j+f8p9LXqyzyBCwIgs1Q156ALU7Au3btglarRdeuXREfH4/8/HxMmzYNzZo1q4n+CYIgqKaOJUHwE3BUVBSKiopgMBjw1ltv4bnnnkPjxo0xd+5crFmzpqb6KAiCoAqTmXVXsDrYCfjs2bP4+OOPoSgKnnnmGYwcORIA8NFHH9VI5wRBECpCHSuKzE/AJSUl2LNnD65du4arV68iOzsbbm5uKLGw8SMIglAbKMzxeWuEnYCjo6OxcuVK+Pr6Yt68eQgJCYGnpycWLVqkqvFmoM/0A0Aj+og8FAvL09eL6AwKTx29i9ui0Q223dYFDUjtEnNNAGiioa/bVOGzLwqZ7IxcZiged6EreADAtmIPUnvZkY/NzPckNa5qBQDWz4HLcgCA3X/Q1SemNutJanl2zA0FAEW0/gP/9qAR6G+4Ysc/kAww0vdNPRMf25H5HDh60LHeFt7bkwb6WbFHCe95otfRP8818O/BddCZNVWBuY4tArOznK+v710Gw88880y1d0gQBOF+MdvSE7CY8QiCUJewqSUIMeMRBKEuYbKlCVjMeARBqEvYVBYEIGY8giDUHWxuAq4M5xT6DDwAvNyUzkh4+0pjNrbTPPok3uzYU6RWbOQzM55SaK+BfrG0vwEAjAunq16c6taUjXUb34fUWoT/Qmomez7xvGchrTfry+/Ae3eiM0LC5+1hYx2Gf0a3u3wmG8tlOryem05qrzbrwbarebwrqQ1efZiNHXqd/nl/at2Bjb1upP0R2gfR/iEAkPsNnVXQIsqP1M4u+JFtd7hC+4v8bmFWOGa+RmovFtPVMgDgpqZ63Q9sag04LS0N33//PQoKCuDh4QE/Pz8MGDAAdnZ164cUBOGvQR1zo6Qn4AULFsBsNqNnz55wdXWFwWBAeno69u7di9jY2JrsoyAIgipsJg3tl19+wfr16+/6WkBAAIKDg6u9U4IgCPeDhaM4Vge5QGg2m3H48N3rYocOHYKDg4UjQ4IgCLWE2c5O9csaIJ+A4+PjERcXh4iICCiKAo1GA19fX8yZM6cm+ycIgqCaOnYSmZ6AT58+jczMTDg4OCA8PLzsGPLo0aOxbt06VY1Pt+PPfV+6SPsUhDa9xMYWpOaQ2oNaeoe35Qxvtt0OURdIzZB6iI2d2OAxUnN6mK8gUbLze1I76OhJasNmtGHbXRZPj1OAjt+RLkz7idSmuvI7/8Ub/o/ULFWu4DwduEyHt3L5zIzYLBdS2+rMf3RfcX6K1I7k84eUujeh7+VbJ/nPSD7jTVL4xT5Sazm9M9vuksW/kVpi5ytsbPv9dIbSPt4uBUVMRYyqwGbS0N555x188cUXMJlMCAsLg9FoxLBhw1CNFYwEQRAqhc1kQTg4OMDDo/QJddWqVXjxxRfRtGlTSUETBMFqqWtHkclNuObNmyMuLg43b96Em5sbVqxYgYULF+LMmTM12T9BEATVmO3Uv6wBcgJevHgx2rVrV/bE27RpU6xbtw4DBw6ssc4JgiBUBHMFXtYAuQSh1Wrx/PPP3/W1hg0bIioqqto7JQiCcD/UtR2qaj2Yfb2Q3xJd50QPV/8c3nfh70604//KN58gtTdePcq2G9rvKqkV85vDmBlEe1/kfXeTjXWuT/syJKSOI7UVL3zBtrvyfdpj4vMx+9nYJ73oHfoxvS6ysT8tqUdqr06isxEAsJUrOD8HLssBADyitpOa4fAHbKw5J4vUbq3eyMb+uJ++lx9247N9dA70fZGfTX98Pzl4mW13efc8Utuzk694/jcdfS9rmMohABD1Nv3ZrAqqamnBbDYjOjoaWVlZcHR0RExMDFq2bFmmp6amIjk5GVqtFqGhofD39y/TDh48iOnTp2P37t0Wr0MuQeTl5SE+Ph7Lly/HtWu3zTfurJAhCIJgTVTVEkRaWhqMRiNSUlIQERGB+Pj4Mu3y5ctISkpCcnIy1qxZg2XLlsFoLDVVunjxItauXau6biY5Ac+YMQOtW7eGl5cXRo0ahZyc0nzSgwcPqmpYEAShpjHZqX9xZGRkoEeP0pzzTp064cSJE2Xa8ePH0blzZzg6OsLd3R3e3t7IzMxEUVER5s+fj+joaNX9Jf+GMRqNCAoKAlBaG27SpElISkqSPGBBEKyWimyupaSkICUlpezfQUFBZXOeXq+Hm5tbmWZvb4+SkhJotVro9Xq4u9+2rXV1dYVer8fChQsxduxYNG7MW+neCTkBm0wmZGVloV27dujSpQsmTJiA0NBQ3LzJr2UKgiDUFhWZgO+ccO/Fzc0NBoPhdrtmM7RabbmawWCAg4MDDh8+jN9++w0rV67EjRs3EB4ejuXLl7N9IJcg5s6di5iYGFy9WropNWjQIAQGBiI3N1f9TygIglCDKBV4cXTp0gXp6aXm/0ePHoWPj0+Z1rFjR2RkZKCoqAgFBQXIzs5Gx44dsX37diQlJSEpKQn16tWzOPkCzBNwbm4uLly4gODgYISHh2PQoEEYMmQIUlNTLTb6J+07/8HqiQ3vPwkjdSddYWLX5KOkFramO9vuiX9/S2pfa/ld9qeO0FkDnbrzi/JHmfP1kUPfIrX01UPZdlu88Dqp/TqK95FI3Uz3qeMOA6kBgM8/6F32T9/mx/EHZiOdq1xhyc+By3RwfWwsG7u1Pu1B8Z0znzUwsyedMXJq7wNsrDOTBZGV05DUwtbx2QaTJ+witbde4b0trn9F+5r0+42v0NJ/PJ21k54zhY1VQ1VlQfTt2xf79u1DcHAwFEXB4sWLsXbtWnh7eyMgIAAhISEYMWIEFEVBeHg4dDrdfV1HtRdEUVERhg0bBo2GH2BBEITaoqoOWGg0GixcuPCur7Vpc/uBJTAwEIGBgWT8vn20UdKdiBeEIAg2g80YsosXhCAIdQ3xghAEQaglxAtCEAShlqhrpxSq1Qti+il6lxYAFjW+RmrvXOK9IKIW0Pqz84+TWv+wzWy7++3pPk9f1IKNbT75M1L7+Sa/U/6PtzuR2muTT5La2fA0tt33XegqHYoFc4vh8+jKIo/MpvsEAFnv0v4I6Y/NYGMbMX4CQ6/TVS+4qhUA7+fAZTkAwKBr9HX/24CvDvLzPrqqRYd/FbGxF7+lsyD+vrQLqZ17dSvbbu9iuk9r32VDsd2OzmJ50cxnuLxs58o3XknMdWwKVp3SEBcXV539EARBqDSmCrysAfIJ+M7y84qiIDs7G8eOHQMAJCcnV3/PBEEQKoi1rO2qhZyAR44ciY0bNyIqKgrOzs6IiIhAYmJiTfZNEAShQlhLdoNayAl48ODBaNOmDZYuXYqZM2dCp9OhefPmNdk3QRCECmFTa8Dt27fHkiVLkJiYWOYJ/KfvpSAIgrVRVV4QNYWdQvhL7tixA4sWLYJWq0VYWBi8vb3RsWNHjB49GuvWrVPV+CfNRrK6lhmFIgsn7rY50K5sr9CWDHBz4n+B7Cz2JLVce36FqcctWv9DyyeceJiYWAf69+QTGroyCAB8BXdSa2fhd+khHd2nboX8+9MYdOPfWTg3f8WO3vmfzFRCOZJP7+wDQP9uF0gt4Uc+S2WcM52x0z77JzZ2eWN/Utthd4ONfdTOg9Ru2tHvzyjo2XYXKfQ9Na7QmY29Yk/fy7l8QQw4Mx+hV8+v54NVMKvVCNXfG3d2Q6WvV1nId+Gdd97Bpk2bkJqaitTUVGRnZwOA+AELgmC1mKCoflkDrBdEvXqldb3EC0IQhLpAXcuCEC8IQRBsBjMU1S9rQLwgBEGwGeraJpx4QQiCYDPUtSWIavWC+MrhFqsXQl3p5vJ4poTeHXZzuk5qH5jdSA0ATuIqqU0orM/GZjvSw7lfw+9Kjyqhd54DHztPaot+pCuDAECUL73z3+8ofyBzvKkVqZ3S8c8QLUrotrPtCtnYAUYnUrtupMepe5NLbLs/7qf9Q7iqFQDv58BlOQBA+KWdpDa7WW829ttiul8jNXTmxhp73nNhSDF9r37izH9uNaDTjOzA7xFNtee9LyqLtWyuqYV8F86fP48zZ86gW7duWL16NU6ePIm2bdti4sSJd1UEFQRBsBasZW1XLeQacGRkJJycnBAbGwt7e3tMnToVjRs3RkRERE32TxAEQTV1bQ2YnIDt7e3RrVs3XLhwAZMnT4avry9Gjx6NggK6IJ8gCEJtYjNZEO7u7ti2bRt69eqFTZs24caNG9i8eTOcnflTMoIgCLWFzVTEiImJwdKlS3HkyBHk5OTA09MTfn5+iI2Nrcn+CYIgqEaxkidbtZAT8NGjR3HgwAHY29sjISEBzzzzDABUyAsiqIg/85/lSLvntyjmB3Krjt6pHepHZxz0S+ezIB5wone7v7bgIzGvUR6p/fBHPTZ2izOdNdAui84K6MtvWOPYEXrnv7czv2P9I+gd69ec+KyOL28+QF+X8eoAgHomOjumfRD9Htw6yTf8sBudJXFqL91fgK9cEb+Jvy6X6bA4dxcbG9msF6ntUej3IOQWfc8AgEFDf76GFfKfW3eFvlcLLdR4sHORLIg7ISfgP70gzGYzwsLCYDQaMWzYMPGCEATBarGWpQW1iBeEIAg2g7mOPSCKF4QgCDaDzaShiReEIAh1jbqWhiZeEIIg2Aw2kwVRFZxzsGf1Mxp6R9vewZGNfQC09T63o11sYQ37IlONob6F4Tr+mxepNbeQPm1gtg+c3Old9uI8fte5iYOB1LYYctjY8S5/J7WjN/j3x4UZquMOvAdIR2acc7+hd+DzC/iKGDrmus4W+nTxW1p/1I7PoOD8HLgsBwBIyN1NalOa9SA1ox1/X5xzoD8H9S1Utvydafu4PZ8p1P8WbWPQgY1UR4ktTcC7du2CVqtF165dER8fj/z8fEybNg3NmvHlWwRBEGoDm3kCjoqKQlFREQwGA9566y0899xzaNy4MebOnYs1a9bUZB8FQRBUYTNpaGfPnsXHH38MRVHwzDPPYOTI0gKbH330UY11ThAEoSLUtXMK5ARcUlKC9PR0XL9+HVevXkV2djbc3NxQUnL/Hr6CIAjVibVkN6iFnIAXLFiAlStXwtfXF/PmzUNISAg8PT2xaNGimuyfIAiCaqrqKLLZbEZ0dDSysrLg6OiImJgYtGzZskxPTU1FcnIytFotQkND4e/vj9zcXMyePRsmkwmKomDhwoV48MEH2euQ25m5ubk4ceIE/vOf/wAA9u/fj61bt+KNN96okh9QEAShqqmqPOC0tDQYjUakpKQgIiIC8fHxZdrly5eRlJSE5ORkrFmzBsuWLYPRaMQbb7yBUaNGISkpCRMmTMCyZcss9pf1gvjiiy9gMpnu2wtiYL3LrO6Z14jUHtXdYGP7XjtNaoumPEpqOZ9eY9ttrqeNSCaarrOxc4fTZZLyU2kNADZoaZ/lX8/R6VW+9WkDIADIuEGnSA1zfYiN/cxIl0L6dgCdBggAo7+jzWBi+QwpOHrQy1wtovxIrfCLfWy7+dl00k9WTkM29u9Lu5DazchMNpYrHcQZ6gB8qtmbuXtIbWIbPqnLNY82h2rjxX9GtDo6FbDFeToVEwBuaqrXyqCq1oAzMjLQo0fp2Hfq1AknTpwo044fP47OnTvD0dERjo6O8Pb2RmZmJiIjI8uqBZlMJuh0vKkRYMELwsOjdNIQLwhBEOoCFcmCSElJQUpKStm/g4KCEBQUBADQ6/Vwc7vtnGhvb4+SkhJotVro9fq7yrK5urpCr9ejQYPSB6UzZ84gISEBK1eutNgHcgL+0wsiLCyszAti3LhxyM/Pr8CPKAiCUHNUJA/4zgn3Xtzc3GAw3D7EZDabodVqy9UMBkPZhHzgwAEsWLAAS5Yssbj+C4gXhCAINkRVrQF36dIF6enpAEq90X18fMq0jh07IiMjA0VFRSgoKEB2djZ8fHxw4MABxMbG4v3330eHDurO9YkXhCAINoNJqZqjGH379sW+ffsQHBwMRVGwePFirF27Ft7e3ggICEBISAhGjBgBRVEQHh4OnU6HxYsXo7i4GDNnzgQAtG7dGgsXLmSvU61eEIIgCDVJVR1F1mg0/zN5tmnTpuz/AwMDERgYeJe+efPmCl/H4gSclpaG77//HgUFBfDw8ICfnx8GDBigajNuyGU+k2GAM727H3md9x3+tn5bUjNfoa/bPvsntt0FTXuT2qeNaGMbAPhoI72znOnIl615p+lNUmsw9XFS8whZzbab/8EYUjsddZaNXWlHvz+xO/mSN2v9ckktYz9dJgkAvB3pfYazC34ktZbTO7PtfnKQzsoJW/cEG3vu1a2kNgq86dQae1dSs1Q6iDPV4TIdLN3nF56gM2A6HKPNgwCgpQud6TDbwrzwzDTLmQGVoa4ZsrMT8IIFC2A2m9GzZ0+4urrCYDAgPT0de/fuleKcgiBYHXVr+rUwAf/yyy9Yv379XV8LCAhAcHBwtXZKEAThfqhrR5HZlHiz2YzDhw/f9bWDBw/CwYFPwhcEQagNbKYiBgDEx8cjLi4OERERUBQFRUVFeOSRRxATE1NT/RMEQVBNVWVB1BTsE7DRaISdnR26d++OuLg4uLi44OzZs1KYUxAEq0SpwH/WgJ3CHJ4eOXIkwsLCkJubi5iYGGzfvh06nQ7jx49HcnKyxcY/bD6K1QuZ6b9+CT9A3Jnynx3o34LhbfgyPGtOtyC1BvQReABAAfPz/MNYyMaaQP88e3R0+Z+xLehsAwBYeqExqY0o4fv0i5nevf9Dy+92j+52gdSiD/FZECdNtBfBcIX2D9mrvcW2u/wftG/GtO/5skK9i+lshS8ZHw8AGFJMl+HRWdi150oHPVpEZ9Z0aHeJbfdvB34htQNedNYNAByDG6kd1vIlibiSQe+d/ZSNVcNjTWnvjHs5fJH20qgp2CUIs9mMrl27Aig9YvfAA6U36Z9H8gRBEKwJa1nbVQu7BNG6dWtERUXBbDaX2bGtXr0aDRvyzlGCIAi1gaIoql/WAPsoGxMTgx07dkCjuT1PN27cGCEhIdXeMUEQhIpiqmNV4dgJWKPR4Omnn77ra0OGDKnWDgmCINwvNnUSThAEoS5hLdkNamEn4Ly8PKxevRo6nQ5jxoxB/fr1AQArVqzAK6+8YrHx8BsHWH1yw66kNiOPjz3s7UNq3RV657jDYX53uI9nfVKLa8h7QYTl0efczzi5sLFz/0b7FHR5gq6m0eY9/tz+6RfpTIb3N3mysf72tCfDmyX8zv+/G9Bj4aXw3gk9Sug9ht+ZOzax8xW23T076coUb73C92ntu7Q2rtCZjf3Emc7OGFbIeyPUN9P3Mle5wpKfA5fp8MQfh9hYTyf6nlrqTn+mAWBodzo7piqoa0/A7CbcjBkz0Lp1a3h5eWHUqFHIySlN4Tp48GCNdE4QBKEi1LU8YPYJ2Gg0ljnG+/r6YtKkSUhKSrKaHURBEIQ7saknYJPJhKysLAClDvETJkxAaGgo9Hq+kKAgCEJtYFLMql/WADsBz5kzBzExMbhypXRtrU+fPggMDERuLn/6ShAEoTawqSUIBwcHuLu7IzExEYMHD8acOXOg0WgQFxdXU/0TBEFQjWIlT7ZqYSfg+fPnIywsDDk5OZgyZcpdXhB9+vSx2Hihia8CoWWyFSz9iaCxo3+DpenpXXRvVz6ToUDh+8xx3HCe1Dq4P8zGahj/ikvbaM+G5i78qcQ/dtA/T30L3hZaHd2nszf4bBL7xh1JLRO8Z4NeR/suHDPTO//t99O+FwDwNx1ddeT6V3xWx3Y7OovF096TjdWAfg/cFf5N+J2piKHV0bFc1QqA93PgshwA4Hoh/RnKbsB/bk/vp7OMeAcKddS1o8iqvSB++OEH8YIQBMGqqWsJAuIFIQiCzWBThuziBSEIQl3CZLahNWDxghAEoS5hLdkNapHFXEEQbIa6tgbMVsS4l7i4OMyaNUt14wtbjmT1HSZ6J72nlt/R9mWM939nqjW0NlrYpXWkl8U7MxUIAOC4ji5W6lXChqKFuYjUdBp6t/uimc4YAIAGzA78bqbSBgB0LKJvjbPMOAFAgPY6qX1uqsfGXrOjf94nimjPhp/5H4fd8OhXQmdIAMA5M50FccaRrw6SaUdnsfzzFl/g9itneiyeuUWPRZEd36dvnegbsmsxP5DZTMZOfO5uNja1QS9Se/73DWysGhrVa6f6ey/fyKr09SoL+wR8Z/l5RVGQnZ2NY8eOAYCqkkSCIAg1SV17AmYn4JEjR2Ljxo2IioqCs7MzIiIikJiYWFN9EwRBqBA2tQk3ePBgtGnTBkuXLsXMmTOh0+nQvHnzmuqbIAhChbCW9DK18At5ANq3b48lS5YgMTERubm5MBr5qqeCIAi1RV2rCcdOwKdPn8akSZOQkJCA4cOH4/Llyxg0aBB27txZU/0TBEFQjVlRVL+sAdVeEFOnTsWOHTvKvCD8/f0tNv68/Q1WH+lO7+Jq7P9gY9Ou0lkShcwGcL+Z7my7iKc9AXY781l7bZkkCf9WOWzsgTNNSe09e9r+c2MYn1EwdEUeqa1vy3syfHC6Ban5FPFrbS0H0bvs+m187HUmc+Omhn4Piuz4dqPefoLU+o//go192Y72R3C2sOw41Z7OcLFzoTUA6H+Lvl9vaugb/ZlpfKWNr1fS97mlqhWcn0MXJssBAALz6CwJC4lCqrCpPGDxghAEoS5hLU+2ahEvCEEQbAazYlb9sgbEC0IQBJuhqjbXzGYzoqOjkZWVBUdHR8TExKBly5ZlempqKpKTk6HVahEaGgp/f3/k5eXhtddeQ2FhIby8vBAXFwdnZ75gK/sETHlBWGpUEAShNqiqLIi0tDQYjUakpKQgIiKibAUAAC5fvoykpCQkJydjzZo1WLZsGYxGI1atWoVnn30WGzZsQPv27ZGSkmKxvxbT0ARBEOoKSgVeHBkZGejRowcAoFOnTjhx4kSZdvz4cXTu3BmOjo5wd3eHt7c3MjMz74rp2bMn9u/fb7G/1bqb9siZLdXW9kvV1O7QqYxWTdcEgOfvU7PEN5H3HzuzEtflWFJN7VaG9Jwptd2FculQTe2+N/3+Y7nKFZaqWlRFpgPbvpHPNrqTlJSUu55Sg4KCyqrA6/V6uLndrhpib2+PkpISaLVa6PV6uLvfzk5xdXWFXq+/6+uurq4oKOCrrADihiYIwl+UOyfce3Fzc4PBcLv0ktlsLsv+ulczGAxwd3cv+7qTkxMMBgM8PDws9kGWIARBEO6hS5cuSE9PBwAcPXoUPj4+ZVrHjh2RkZGBoqIiFBQUIDs7Gz4+PujSpQt27y7Nc05PT4efn5/F61TIjlIQBOGvwJ9ZED///DMURcHixYuRnp4Ob29vBAQEIDU1FSkpKVAUBRMmTED//v1x5coVREZGwmAwoH79+khMTISLC21jCsgELAiCUGvIEoQgCEItIROwIAhCLSETsCAIQi1RIxOw2WzGvHnzEBQUhJCQEJw7d05VXHFxMaZPn44RI0bghRdewHfffVfha1+9ehW9evVCdnZ2heLeffddBAUF4fnnn8enn36qOq64uBgREREIDg7GiBEjVF/32LFjZUe8z507h+HDh2PEiBGYP38+zBZc/u+MPXXqFEaMGIGQkBCMGzcOV65cUR37J19++SWZnlNe3NWrVxEaGoqRI0ciODgYv/32W4X6GxgYiOHDh2PWrFnkz1revaB2nMqLVTtO3D1oaZzKi1U7VlSf1YyVyWTCrFmzEBwcjOHDh+Pnn39WPVblxaodq/Ji1Y7VXxalBti+fbsSGRmpKIqi/Pjjj8rEiRNVxX322WdKTEyMoiiKcu3aNaVXr14Vuq7RaFQmTZqk9OvXTzl9+rTquAMHDigTJkxQTCaTotfrlTfffFN17LfffqtMmTJFURRF2bt3r/LKK69YjFm9erXy7LPPKv/6178URVGUCRMmKAcOHFAURVHmzp2rfPPNN6pjR44cqfz3v/9VFEVRPvnkE2Xx4sWqYxVFUU6ePKmMHj36rq9ZiouMjFS++uorRVEU5fvvv1d27typOnbSpEnKrl27FEVRlGnTpinfffdduXHl3Qtqx6m8WLXjRN2DasapvFi1Y1VerNqx+vbbb5WZM2cqilJ6L0+cOFH1WJUXq3asyotVFHVj9VelRp6AuWN9HAMGDEBYWBiA0jPe9va0f3B5JCQkIDg4GF5eXhWK27t3L3x8fDB58mRMnDgRvXv3Vh3bunVrmEwmmM1m6PV6Vdad3t7eeOutt8r+ffLkyTIbUEtHGu+NXbZsGXx9fQGUPpHodLQv7L2x165dw7JlyzB79uwK9ffIkSO4dOkSxowZgy+//LKs72pifX19cf36dSiKAoPBQI5XefeC2nEqL1btOJUXq3acyotVO1blxaodq6effhqLFi0CAOTm5sLDw0P1WJUXq3asyotVO1Z/VWpkAqaO9VnC1dUVbm5u0Ov1mDJlCqZOnar6mp9//jkaNGhQNvFXhGvXruHEiRN44403sGDBArz22muqXZZcXFyQk5ODgQMHYu7cuaqc4/r373/Xh0lRFNj9/7Lilo403hv75y+bI0eOYP369RgzZoyqWJPJhKioKMyaNQuurrT5eHnXzMnJgYeHBz788EM0bdoU7733nurYVq1aITY2FgMHDsTVq1fRrVu3cuPKuxfUjlN5sWrH6d7YsLAw1eNU3nXVjlV5sWrHCij17I6MjMSiRYswePDgCt1T98ZW5J66M/bZZ59VPVZ/VWpkAuaO9Vni4sWLGD16NIYMGYLBgwervubGjRuxf/9+hISE4NSpU4iMjMTly5dVxXp6euKpp56Co6MjHnzwQeh0OuTl0ZUl7uTDDz/EU089he3bt+OLL77AzJkzUVTEVz24lzvtP9UeabyTrVu3Yv78+Vi9ejUaNGigKubkyZM4d+4coqOjMW3aNJw+fRqxsbGqYj09PdGnTx8AQJ8+fVT/hQMAsbGx+Pjjj7Ft2zYMHTr0Ltepe7n3XqjIOJV3H6kdpztjW7VqVaFxuve6FRmre2MrMlZA6V+A27dvx9y5c++6B9XcU3fG3rx5s0L31J+xkydPRmZm5n3dU38VamQC5o71cVy5cgVjx47F9OnT8cILL1Tomh9//DHWr1+PpKQk+Pr6IiEhAY0aNVIV6+fnhz179kBRFFy6dAm3bt2Cp6enqlgPD48yQ4569eqhpKQEJpOpQn1v3749fvjhBwClRxofe+wx1bFffPFF2c/dogVdUuheOnbsiK+++gpJSUlYtmwZ2rZti6ioKFWxfn5+ZUcwDx06hLZt26q+br169cr+OvLy8kJ+fn6531fevaB2nMqLVTtO98ZWZJzKu67asSovVu1Ybdq0Ce+++y4AwNnZGXZ2dnjkkUdUjVV5sd98842qsbo3tmHDhti6det93VN/FWrEjKdv377Yt28fgoODy471qeGdd95Bfn4+Vq1ahVWrVgEA3nvvPTg5OVVnd+Hv749Dhw7hhRdegKIomDdvnur15zFjxmD27NkYMWIEiouLER4ebvE44r1ERkZi7ty5WLZsGR588EH0799fVZzJZEJsbCyaNm2KV199FQDw+OOPY8qU6nX6ioyMxJw5c5CcnAw3NzckJiaqjo2JiUF4eDi0Wi0cHBzK1hDvpbx7ISoqCjExMRbH6d5Yk8mEX375Bc2aNbM4TpW5B8uLjY+PVzVW5cWqHat+/fph1qxZGDlyJEpKSjB79my0adNG1T1VXuzs2bNV3VPlxVb3Z7WuI0eRBUEQagk5iCEIglBLyAQsCIJQS8gELAiCUEvIBCwIglBLyAQsCIJQS8gELAiCUEvIBCwIglBL/D99Jqhhscqz5QAAAABJRU5ErkJggg==\n",
      "text/plain": [
       "<Figure size 432x288 with 2 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "p = Prompting(model = model)\n",
    "\n",
    "# get the best hyperparams.\n",
    "# query_X, support_X, query_y, support_y = p.frame_icl_examples(X, y, support_size = 0.5, seed = 0)\n",
    "\n",
    "X_train, X_test, y_train, y_test = train_test_split(X, y, test_size = 0.5, random_state=0, stratify = y)\n",
    "X_train = np.array(X_train.tolist())\n",
    "X_test = np.array(X_test.tolist())\n",
    "y_train = np.array(y_train.tolist())\n",
    "y_test = np.array(y_test.tolist())\n",
    "\n",
    "X_test, X_val, y_test, y_val = train_test_split(X_test, y_test, test_size = 0.2, random_state=0, stratify = y_test)\n",
    "\n",
    "def get_gpt3_features(X_text, model_name):\n",
    "    def get_embedding(text, model_name=\"text-embedding-ada-002\"):\n",
    "        text = text.replace(\"\\n\", \" \")\n",
    "        return openai.Embedding.create(input = [text], model=model_name)['data'][0]['embedding']\n",
    "\n",
    "    queries = []\n",
    "    for sample in X_text:\n",
    "        model_input = '.'.join(sample.split('.')[:-2]) + '.'\n",
    "        vector = get_embedding(model_input, model_name)\n",
    "        queries.append(vector)\n",
    "\n",
    "    return np.array(queries)\n",
    "\n",
    "embeddings = get_gpt3_features(X_train, model_name = \"text-embedding-ada-002\")\n",
    "embeddings = embeddings /  np.linalg.norm(embeddings, axis=1, keepdims=True)\n",
    "sns.heatmap(1 - cosine_similarity(embeddings, embeddings))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "8fdcf02e-f5af-48a9-951f-abf592526ed8",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "positive    40\n",
       "negative    33\n",
       "Name: result of testing the hamster, dtype: int64"
      ]
     },
     "execution_count": 14,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "pd.Series(y).value_counts()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "817c47c6-bae4-467b-b34c-a281155ea233",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Training distribution:  positive    20\n",
      "negative    16\n",
      "dtype: int64\n"
     ]
    }
   ],
   "source": [
    "print('Training distribution: ', pd.Series(y_train).value_counts())"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "129c19e4-8fb0-4e02-b77c-2c94dfd7cb31",
   "metadata": {},
   "source": [
    "**summarizer curie**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "id": "f387ede8-f0d2-44a4-b6cf-645abfc05fee",
   "metadata": {},
   "outputs": [],
   "source": [
    "cot = None\n",
    "sorted_ = False\n",
    "summarize_prompt = detail_prompt #detail_prompt\n",
    "temperature = 0.79\n",
    "# global_best_params = {\n",
    "#     'cot': None,\n",
    "#     'sorted': False,\n",
    "#     'summarize_prompt': simple_prompt,\n",
    "#     'temperature': 0.75\n",
    "# }"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "id": "1036d21a-b644-493a-a0bc-729e5252349e",
   "metadata": {},
   "outputs": [],
   "source": [
    "global_best_params = {\n",
    "    'cot': None,\n",
    "    'sorted': False,\n",
    "    'summarize_prompt': detail_prompt, #detail_prompt,\n",
    "    'temperature': 0.79\n",
    "}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "id": "a7177c13-17ae-43ae-969c-ac8917b52d09",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'text-curie-001'"
      ]
     },
     "execution_count": 37,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "id": "bb4e92d3-b187-4e3c-935e-0e225924a97b",
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "training\n",
      "calculating train error\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "  0%|                        | 0/25 [00:00<?, ?it/s]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "summary:\n",
      "The hamsters that tested positive have larger organs than average, while the hamsters that tested negative have smaller organs than average.\n",
      "this couldnt be parsed :  If the hamster's organs are all significantly larger than average, then it is likely that the hamster has a larger than average organ. If the hamster's organs are all significantly smaller than average, then it is likely that the hamster has a smaller than average organ.\n",
      "this couldnt be parsed :  If the hamster's organs are all significantly bigger than what would be expected, then it is likely that the hamster has a tumor.\n",
      "this couldnt be parsed :  If the hamster's heart and spleen are big, then it is likely that the hamster has a larger organ than average. If the hamster's lungs are small, then it is likely that the hamster has a smaller organ than average.\n",
      "contains some unk value\n",
      "summary:\n",
      "The hamster's lung, heart, and liver are all large, while its spleen is small and its kidney is very large. This hamster tested positive.\n",
      "\n",
      "The hamster's lung, heart, and liver are all larger than average, while its spleen is very large. Its kidney, however, is small. This hamster tested positive.\n",
      "\n",
      "The hamster's lung is very big, heart is small, liver is very big, spleen is big, and kidney is very big. This hamster tested positive.\n",
      "\n",
      "The hamster's lungs are small, heart is very small, liver is small, spleen is very small, and kidney is small. This hamster tested negative.\n",
      "\n",
      "The hamster's organs are all very small. The lung, heart, liver, spleen, and kidney are all tiny in comparison to other mammals. This hamster tested positive.\n",
      "\n",
      "The hamster's organs are very small in comparison to other animals. The lungs, heart, liver, spleen, and kidneys are all much smaller than average. This hamster tested positive.\n",
      "\n",
      "This hamster has very large organs compared to the average hamster. Its lung, heart, liver, spleen, and kidney are all significantly larger than normal. This hamster tested positive.\n",
      "\n",
      "The hamster's lung, heart, and liver are all larger than average, while its spleen and kidney are both very large. This hamster tested positive.\n",
      "\n",
      "The hamster's lungs are large, heart is very small, liver is very small, spleen is small, and kidney is very small. This hamster tested negative.\n",
      "\n",
      "The hamster's organs are small in comparison to other animals. The lungs, heart, liver, spleen, and kidney are all smaller than average. This hamster tested negative.\n",
      "\n",
      "The hamster's lung is big in comparison to its other organs. Its heart, liver, spleen, and kidney are all small. This hamster tested negative.\n",
      "\n",
      "The hamster has small lungs and a small heart. Its liver is very large, and its spleen and kidney are both big. This hamster tested negative.\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "  0%|                        | 0/25 [00:32<?, ?it/s]\n"
     ]
    },
    {
     "ename": "KeyboardInterrupt",
     "evalue": "",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mKeyboardInterrupt\u001b[0m                         Traceback (most recent call last)",
      "\u001b[0;32m/var/folders/ll/g4b6wylx35j6mmv9gvrczch40000gp/T/ipykernel_4284/104241521.py\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[1;32m     22\u001b[0m         \u001b[0mprint\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0msummary_temp\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     23\u001b[0m         \u001b[0;31m# summary = train_model(X_s, y_s, temperature = 0.80, sorted = False, summarize_prompt = 'Tl;dr')\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 24\u001b[0;31m         \u001b[0mtrain_err_rate\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0m_\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0m_\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0m_\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mmisclassifications_vector\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtrain_pred_vector\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mbatch_predict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0msummary_temp\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mX_train\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0my_train\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcot\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;31m#, 'Knowledge to Prediction.\\n' + desc, query_instruct_text, classes, 'text-curie-001', True)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m     25\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     26\u001b[0m         \u001b[0;31m# print(train_pred_vector)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/hari_works/virtualenv/lib/python3.9/site-packages/tenacity/__init__.py\u001b[0m in \u001b[0;36mwrapped_f\u001b[0;34m(*args, **kw)\u001b[0m\n\u001b[1;32m    322\u001b[0m         \u001b[0;34m@\u001b[0m\u001b[0mfunctools\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mwraps\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mf\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    323\u001b[0m         \u001b[0;32mdef\u001b[0m \u001b[0mwrapped_f\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mt\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mAny\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkw\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mt\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mAny\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m->\u001b[0m \u001b[0mt\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mAny\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 324\u001b[0;31m             \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mf\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkw\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    325\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    326\u001b[0m         \u001b[0;32mdef\u001b[0m \u001b[0mretry_with\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mt\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mAny\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mt\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mAny\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m->\u001b[0m \u001b[0mWrappedFn\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/hari_works/virtualenv/lib/python3.9/site-packages/tenacity/__init__.py\u001b[0m in \u001b[0;36m__call__\u001b[0;34m(self, fn, *args, **kwargs)\u001b[0m\n\u001b[1;32m    402\u001b[0m         \u001b[0mretry_state\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mRetryCallState\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mretry_object\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mfn\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mfn\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0margs\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mkwargs\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    403\u001b[0m         \u001b[0;32mwhile\u001b[0m \u001b[0;32mTrue\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 404\u001b[0;31m             \u001b[0mdo\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0miter\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mretry_state\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mretry_state\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    405\u001b[0m             \u001b[0;32mif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdo\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mDoAttempt\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    406\u001b[0m                 \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/hari_works/virtualenv/lib/python3.9/site-packages/tenacity/__init__.py\u001b[0m in \u001b[0;36miter\u001b[0;34m(self, retry_state)\u001b[0m\n\u001b[1;32m    347\u001b[0m         \u001b[0mis_explicit_retry\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mretry_state\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0moutcome\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfailed\u001b[0m \u001b[0;32mand\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mretry_state\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0moutcome\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mexception\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mTryAgain\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    348\u001b[0m         \u001b[0;32mif\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;34m(\u001b[0m\u001b[0mis_explicit_retry\u001b[0m \u001b[0;32mor\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mretry\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mretry_state\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mretry_state\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 349\u001b[0;31m             \u001b[0;32mreturn\u001b[0m \u001b[0mfut\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mresult\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    350\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    351\u001b[0m         \u001b[0;32mif\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mafter\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m/usr/local/Cellar/python@3.9/3.9.16/Frameworks/Python.framework/Versions/3.9/lib/python3.9/concurrent/futures/_base.py\u001b[0m in \u001b[0;36mresult\u001b[0;34m(self, timeout)\u001b[0m\n\u001b[1;32m    437\u001b[0m                     \u001b[0;32mraise\u001b[0m \u001b[0mCancelledError\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    438\u001b[0m                 \u001b[0;32melif\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_state\u001b[0m \u001b[0;34m==\u001b[0m \u001b[0mFINISHED\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 439\u001b[0;31m                     \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m__get_result\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    440\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    441\u001b[0m                 \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_condition\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mwait\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mtimeout\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m/usr/local/Cellar/python@3.9/3.9.16/Frameworks/Python.framework/Versions/3.9/lib/python3.9/concurrent/futures/_base.py\u001b[0m in \u001b[0;36m__get_result\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m    389\u001b[0m         \u001b[0;32mif\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_exception\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    390\u001b[0m             \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 391\u001b[0;31m                 \u001b[0;32mraise\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_exception\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    392\u001b[0m             \u001b[0;32mfinally\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    393\u001b[0m                 \u001b[0;31m# Break a reference cycle with the exception in self._exception\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/hari_works/virtualenv/lib/python3.9/site-packages/tenacity/__init__.py\u001b[0m in \u001b[0;36m__call__\u001b[0;34m(self, fn, *args, **kwargs)\u001b[0m\n\u001b[1;32m    405\u001b[0m             \u001b[0;32mif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdo\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mDoAttempt\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    406\u001b[0m                 \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 407\u001b[0;31m                     \u001b[0mresult\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mfn\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    408\u001b[0m                 \u001b[0;32mexcept\u001b[0m \u001b[0mBaseException\u001b[0m\u001b[0;34m:\u001b[0m  \u001b[0;31m# noqa: B902\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    409\u001b[0m                     \u001b[0mretry_state\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mset_exception\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0msys\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mexc_info\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m/var/folders/ll/g4b6wylx35j6mmv9gvrczch40000gp/T/ipykernel_4284/3226623496.py\u001b[0m in \u001b[0;36mbatch_predict\u001b[0;34m(summary, X, y, cot)\u001b[0m\n\u001b[1;32m     62\u001b[0m \u001b[0;34m@\u001b[0m\u001b[0mretry\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mstop\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mstop_after_attempt\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m10\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mwait\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mwait_fixed\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m5\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     63\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mbatch_predict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0msummary\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mX\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0my\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcot\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 64\u001b[0;31m     pred_texts = p.run_predictions(\n\u001b[0m\u001b[1;32m     65\u001b[0m                 \u001b[0mtaskname\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m''\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;31m#desc,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     66\u001b[0m                 \u001b[0mtexts\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mX\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/hari_works/prompting-tabular-data/datasets/visualizing_hamster/prompting.py\u001b[0m in \u001b[0;36mrun_predictions\u001b[0;34m(self, taskname, texts, summary, query_instruct_text, cot_text, temperature, printf, sleep)\u001b[0m\n\u001b[1;32m    204\u001b[0m                      \u001b[0mquery\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mtest_input\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    205\u001b[0m                      \u001b[0mquery_instruct_text\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mquery_instruct_text_temp\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 206\u001b[0;31m                      temperature = 0).strip()\n\u001b[0m\u001b[1;32m    207\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    208\u001b[0m             \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/hari_works/prompting-tabular-data/datasets/visualizing_hamster/prompting.py\u001b[0m in \u001b[0;36mpredict\u001b[0;34m(self, taskname, summary, query, query_instruct_text, temperature)\u001b[0m\n\u001b[1;32m    162\u001b[0m                 \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mchatbot\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mChatbot\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mconfig\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mconversation_id\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mNone\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    163\u001b[0m                 \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mchatbot\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrefresh_session\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 164\u001b[0;31m                 \u001b[0mresponse\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mchatbot\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mget_chat_response\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mprompt\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    165\u001b[0m             \u001b[0mresult\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mresponse\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'message'\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    166\u001b[0m         \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/hari_works/virtualenv/lib/python3.9/site-packages/openai/api_resources/completion.py\u001b[0m in \u001b[0;36mcreate\u001b[0;34m(cls, *args, **kwargs)\u001b[0m\n\u001b[1;32m     23\u001b[0m         \u001b[0;32mwhile\u001b[0m \u001b[0;32mTrue\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     24\u001b[0m             \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 25\u001b[0;31m                 \u001b[0;32mreturn\u001b[0m \u001b[0msuper\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcreate\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m     26\u001b[0m             \u001b[0;32mexcept\u001b[0m \u001b[0mTryAgain\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0me\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     27\u001b[0m                 \u001b[0;32mif\u001b[0m \u001b[0mtimeout\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32mNone\u001b[0m \u001b[0;32mand\u001b[0m \u001b[0mtime\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mtime\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m>\u001b[0m \u001b[0mstart\u001b[0m \u001b[0;34m+\u001b[0m \u001b[0mtimeout\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/hari_works/virtualenv/lib/python3.9/site-packages/openai/api_resources/abstract/engine_api_resource.py\u001b[0m in \u001b[0;36mcreate\u001b[0;34m(cls, api_key, api_base, api_type, request_id, api_version, organization, **params)\u001b[0m\n\u001b[1;32m    151\u001b[0m         )\n\u001b[1;32m    152\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 153\u001b[0;31m         response, _, api_key = requestor.request(\n\u001b[0m\u001b[1;32m    154\u001b[0m             \u001b[0;34m\"post\"\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    155\u001b[0m             \u001b[0murl\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/hari_works/virtualenv/lib/python3.9/site-packages/openai/api_requestor.py\u001b[0m in \u001b[0;36mrequest\u001b[0;34m(self, method, url, params, headers, files, stream, request_id, request_timeout)\u001b[0m\n\u001b[1;32m    215\u001b[0m         \u001b[0mrequest_timeout\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mOptional\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mUnion\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mfloat\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mTuple\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mfloat\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mfloat\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    216\u001b[0m     ) -> Tuple[Union[OpenAIResponse, Iterator[OpenAIResponse]], bool, str]:\n\u001b[0;32m--> 217\u001b[0;31m         result = self.request_raw(\n\u001b[0m\u001b[1;32m    218\u001b[0m             \u001b[0mmethod\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mlower\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    219\u001b[0m             \u001b[0murl\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/hari_works/virtualenv/lib/python3.9/site-packages/openai/api_requestor.py\u001b[0m in \u001b[0;36mrequest_raw\u001b[0;34m(self, method, url, params, supplied_headers, files, stream, request_id, request_timeout)\u001b[0m\n\u001b[1;32m    515\u001b[0m             \u001b[0m_thread_context\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msession\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0m_make_session\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    516\u001b[0m         \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 517\u001b[0;31m             result = _thread_context.session.request(\n\u001b[0m\u001b[1;32m    518\u001b[0m                 \u001b[0mmethod\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    519\u001b[0m                 \u001b[0mabs_url\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/hari_works/virtualenv/lib/python3.9/site-packages/requests/sessions.py\u001b[0m in \u001b[0;36mrequest\u001b[0;34m(self, method, url, params, data, headers, cookies, files, auth, timeout, allow_redirects, proxies, hooks, stream, verify, cert, json)\u001b[0m\n\u001b[1;32m    540\u001b[0m         }\n\u001b[1;32m    541\u001b[0m         \u001b[0msend_kwargs\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mupdate\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0msettings\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 542\u001b[0;31m         \u001b[0mresp\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msend\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mprep\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0msend_kwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    543\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    544\u001b[0m         \u001b[0;32mreturn\u001b[0m \u001b[0mresp\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/hari_works/virtualenv/lib/python3.9/site-packages/requests/sessions.py\u001b[0m in \u001b[0;36msend\u001b[0;34m(self, request, **kwargs)\u001b[0m\n\u001b[1;32m    653\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    654\u001b[0m         \u001b[0;31m# Send the request\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 655\u001b[0;31m         \u001b[0mr\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0madapter\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msend\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mrequest\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    656\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    657\u001b[0m         \u001b[0;31m# Total elapsed time of the request (approximately)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/hari_works/virtualenv/lib/python3.9/site-packages/requests/adapters.py\u001b[0m in \u001b[0;36msend\u001b[0;34m(self, request, stream, timeout, verify, cert, proxies)\u001b[0m\n\u001b[1;32m    437\u001b[0m         \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    438\u001b[0m             \u001b[0;32mif\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0mchunked\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 439\u001b[0;31m                 resp = conn.urlopen(\n\u001b[0m\u001b[1;32m    440\u001b[0m                     \u001b[0mmethod\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mrequest\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmethod\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    441\u001b[0m                     \u001b[0murl\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0murl\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/hari_works/virtualenv/lib/python3.9/site-packages/urllib3/connectionpool.py\u001b[0m in \u001b[0;36murlopen\u001b[0;34m(self, method, url, body, headers, retries, redirect, assert_same_host, timeout, pool_timeout, release_conn, chunked, body_pos, **response_kw)\u001b[0m\n\u001b[1;32m    697\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    698\u001b[0m             \u001b[0;31m# Make the request on the httplib connection object.\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 699\u001b[0;31m             httplib_response = self._make_request(\n\u001b[0m\u001b[1;32m    700\u001b[0m                 \u001b[0mconn\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    701\u001b[0m                 \u001b[0mmethod\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/hari_works/virtualenv/lib/python3.9/site-packages/urllib3/connectionpool.py\u001b[0m in \u001b[0;36m_make_request\u001b[0;34m(self, conn, method, url, timeout, chunked, **httplib_request_kw)\u001b[0m\n\u001b[1;32m    443\u001b[0m                     \u001b[0;31m# Python 3 (including for exceptions like SystemExit).\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    444\u001b[0m                     \u001b[0;31m# Otherwise it looks like a bug in the code.\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 445\u001b[0;31m                     \u001b[0msix\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mraise_from\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0me\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    446\u001b[0m         \u001b[0;32mexcept\u001b[0m \u001b[0;34m(\u001b[0m\u001b[0mSocketTimeout\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mBaseSSLError\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mSocketError\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0me\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    447\u001b[0m             \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_raise_timeout\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0merr\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0me\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0murl\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0murl\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtimeout_value\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mread_timeout\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m~/hari_works/virtualenv/lib/python3.9/site-packages/urllib3/packages/six.py\u001b[0m in \u001b[0;36mraise_from\u001b[0;34m(value, from_value)\u001b[0m\n",
      "\u001b[0;32m~/hari_works/virtualenv/lib/python3.9/site-packages/urllib3/connectionpool.py\u001b[0m in \u001b[0;36m_make_request\u001b[0;34m(self, conn, method, url, timeout, chunked, **httplib_request_kw)\u001b[0m\n\u001b[1;32m    438\u001b[0m                 \u001b[0;31m# Python 3\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    439\u001b[0m                 \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 440\u001b[0;31m                     \u001b[0mhttplib_response\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mconn\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgetresponse\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    441\u001b[0m                 \u001b[0;32mexcept\u001b[0m \u001b[0mBaseException\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0me\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    442\u001b[0m                     \u001b[0;31m# Remove the TypeError from the exception chain in\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m/usr/local/Cellar/python@3.9/3.9.16/Frameworks/Python.framework/Versions/3.9/lib/python3.9/http/client.py\u001b[0m in \u001b[0;36mgetresponse\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m   1375\u001b[0m         \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   1376\u001b[0m             \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1377\u001b[0;31m                 \u001b[0mresponse\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbegin\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m   1378\u001b[0m             \u001b[0;32mexcept\u001b[0m \u001b[0mConnectionError\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   1379\u001b[0m                 \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mclose\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m/usr/local/Cellar/python@3.9/3.9.16/Frameworks/Python.framework/Versions/3.9/lib/python3.9/http/client.py\u001b[0m in \u001b[0;36mbegin\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m    318\u001b[0m         \u001b[0;31m# read until we get a non-100 response\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    319\u001b[0m         \u001b[0;32mwhile\u001b[0m \u001b[0;32mTrue\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 320\u001b[0;31m             \u001b[0mversion\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mstatus\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mreason\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_read_status\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    321\u001b[0m             \u001b[0;32mif\u001b[0m \u001b[0mstatus\u001b[0m \u001b[0;34m!=\u001b[0m \u001b[0mCONTINUE\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    322\u001b[0m                 \u001b[0;32mbreak\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m/usr/local/Cellar/python@3.9/3.9.16/Frameworks/Python.framework/Versions/3.9/lib/python3.9/http/client.py\u001b[0m in \u001b[0;36m_read_status\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m    279\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    280\u001b[0m     \u001b[0;32mdef\u001b[0m \u001b[0m_read_status\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 281\u001b[0;31m         \u001b[0mline\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mstr\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mreadline\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0m_MAXLINE\u001b[0m \u001b[0;34m+\u001b[0m \u001b[0;36m1\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m\"iso-8859-1\"\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    282\u001b[0m         \u001b[0;32mif\u001b[0m \u001b[0mlen\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mline\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m>\u001b[0m \u001b[0m_MAXLINE\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    283\u001b[0m             \u001b[0;32mraise\u001b[0m \u001b[0mLineTooLong\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m\"status line\"\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m/usr/local/Cellar/python@3.9/3.9.16/Frameworks/Python.framework/Versions/3.9/lib/python3.9/socket.py\u001b[0m in \u001b[0;36mreadinto\u001b[0;34m(self, b)\u001b[0m\n\u001b[1;32m    702\u001b[0m         \u001b[0;32mwhile\u001b[0m \u001b[0;32mTrue\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    703\u001b[0m             \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 704\u001b[0;31m                 \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_sock\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrecv_into\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mb\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    705\u001b[0m             \u001b[0;32mexcept\u001b[0m \u001b[0mtimeout\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    706\u001b[0m                 \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_timeout_occurred\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mTrue\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m/usr/local/Cellar/python@3.9/3.9.16/Frameworks/Python.framework/Versions/3.9/lib/python3.9/ssl.py\u001b[0m in \u001b[0;36mrecv_into\u001b[0;34m(self, buffer, nbytes, flags)\u001b[0m\n\u001b[1;32m   1240\u001b[0m                   \u001b[0;34m\"non-zero flags not allowed in calls to recv_into() on %s\"\u001b[0m \u001b[0;34m%\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   1241\u001b[0m                   self.__class__)\n\u001b[0;32m-> 1242\u001b[0;31m             \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mread\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mnbytes\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mbuffer\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m   1243\u001b[0m         \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   1244\u001b[0m             \u001b[0;32mreturn\u001b[0m \u001b[0msuper\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrecv_into\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mbuffer\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mnbytes\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mflags\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;32m/usr/local/Cellar/python@3.9/3.9.16/Frameworks/Python.framework/Versions/3.9/lib/python3.9/ssl.py\u001b[0m in \u001b[0;36mread\u001b[0;34m(self, len, buffer)\u001b[0m\n\u001b[1;32m   1098\u001b[0m         \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   1099\u001b[0m             \u001b[0;32mif\u001b[0m \u001b[0mbuffer\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1100\u001b[0;31m                 \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_sslobj\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mread\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mlen\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mbuffer\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m   1101\u001b[0m             \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   1102\u001b[0m                 \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_sslobj\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mread\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mlen\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;31mKeyboardInterrupt\u001b[0m: "
     ]
    }
   ],
   "source": [
    "sampling_times = 25\n",
    "train_errs = []\n",
    "print('training')\n",
    "\n",
    "summary_file = f'summary-curie-001-cluster-onlycat.pkl'\n",
    "summary_stats = {}\n",
    "\n",
    "# get train error.\n",
    "print('calculating train error')\n",
    "        \n",
    "# random\n",
    "# X_s, _, y_s, _ = train_test_split(X_train, y_train, test_size = 1 - 20/len(X_train), random_state=0, stratify = y_train)\n",
    "# len(X_train)\n",
    "\n",
    "# cluster sample\n",
    "X_s, y_s, sampled_indices = cluster_sample(embeddings, X_train, y_train, None, num_examples = 25)\n",
    "\n",
    "for step in tqdm.tqdm(range(sampling_times)):\n",
    "    while True:\n",
    "        summary_temp = train_model(X_s, y_s, temperature, sorted_, summarize_prompt) #, desc, 'text-curie-001')\n",
    "        print('summary:')\n",
    "        print(summary_temp)\n",
    "        # summary = train_model(X_s, y_s, temperature = 0.80, sorted = False, summarize_prompt = 'Tl;dr')\n",
    "        train_err_rate, _, _, _, misclassifications_vector, train_pred_vector = batch_predict(summary_temp, X_train, y_train, cot) #, 'Knowledge to Prediction.\\n' + desc, query_instruct_text, classes, 'text-curie-001', True)\n",
    "\n",
    "        # print(train_pred_vector)\n",
    "\n",
    "        if 'unk' in train_pred_vector:\n",
    "            print('contains some unk value')\n",
    "            continue\n",
    "        if len(np.unique(train_pred_vector)) == 1:\n",
    "            print('all ones or zeros :(')\n",
    "            continue\n",
    "        if len(np.unique(train_pred_vector)) != len(classes):\n",
    "            print('not equals num of classes in dataset :(')\n",
    "            continue\n",
    "        break\n",
    "        \n",
    "    # err_rate, _, _, _, _, y_preds = batch_predict(summary, X_train, y_train, None)\n",
    "    print(f'step {step} | val err: {train_err_rate}')\n",
    "    train_errs.append((train_err_rate, summary_temp, train_pred_vector))\n",
    "\n",
    "summary_stats['train'] = train_errs\n",
    "\n",
    "# best summary \n",
    "print('validating.')\n",
    "val_results = []\n",
    "\n",
    "for train_err_rate, summary_temp, train_pred_vector in sorted(train_errs, key = lambda x: x[0]):\n",
    "    val_err_rate, num_errors, total, err_indices, misclassifications_vector, val_preds = batch_predict(summary_temp, X_val, y_val, cot) #, 'Knowledge to Prediction.\\n' + desc, query_instruct_text, classes, 'text-curie-001')\n",
    "    # test_err_rate, num_errors, total, err_indices, misclassifications_vector, y_preds = batch_predict(summary, X_test, y_test, None)\n",
    "    print(f'train err: {train_err_rate} | val err: {val_err_rate}')\n",
    "    val_results.append((val_err_rate, train_err_rate, summary_temp, val_preds, train_pred_vector))\n",
    "\n",
    "summary_stats['val'] = val_results\n",
    "\n",
    "# test results\n",
    "test_results = []\n",
    "for best_val_err_rate, best_train_err_rate, best_summary, y_preds_val, y_preds_train in sorted(val_results, key = lambda x: (x[0], x[1]))[:5]:\n",
    "    test_result = batch_predict(best_summary, X_test, y_test, cot) #, 'Knowledge to Prediction.\\n' + desc, query_instruct_text, classes, 'text-curie-001')\n",
    "    print('test err: ', test_result[0], ' | val err: ', best_val_err_rate, ' | train err: ', best_train_err_rate)\n",
    "    test_results.append(test_result)\n",
    "    \n",
    "summary_stats['test'] = test_results"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f2b94b1d-069c-4593-abaf-1fafc95e5ea0",
   "metadata": {},
   "outputs": [],
   "source": [
    "summary_file = f'summary-curie-001-cluster-onlycat.pkl' # visualizing_hamster_quartile-categorical.csv\n",
    "with open(summary_file, \"wb\") as f:\n",
    "    pickle.dump(summary_stats, f)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e7f4c8f7-1da9-4954-bd73-bf09c6ec8194",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.16"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
