{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "d285ed21",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-07-21T02:05:47.188741Z",
     "start_time": "2023-07-21T02:05:46.782926Z"
    }
   },
   "outputs": [],
   "source": [
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "eceaf387",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-07-21T02:07:30.414540Z",
     "start_time": "2023-07-21T02:07:30.410390Z"
    }
   },
   "outputs": [],
   "source": [
    "prompt1 = '''For a given input word, print a list of 4 or less distinct definitions of the word.\n",
    "\n",
    "Example:\n",
    "Input: face\n",
    "Output:\n",
    "1. to confront or deal with\n",
    "2. the expression on a person's face\n",
    "3. the front part of a head, from forehead to chin\n",
    "\n",
    "Example:\n",
    "Input: defenestration\n",
    "Output:\n",
    "1. to throw out of a window\n",
    "\n",
    "Input:\n",
    " '''"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "e1f52c66",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-07-21T02:14:02.246331Z",
     "start_time": "2023-07-21T02:14:02.233244Z"
    }
   },
   "outputs": [],
   "source": [
    "df = pd.read_csv(\"wic_word_list.csv\")\n",
    "ip_list = list(df['Word List'])\n",
    "ip_list2 = ip_list"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "5e702c6c",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-07-21T02:14:05.002262Z",
     "start_time": "2023-07-21T02:14:04.993458Z"
    }
   },
   "outputs": [],
   "source": [
    "def chat_gpt_response(sample):\n",
    "    final_prompt = prompt1 + sample\n",
    "    response=openai.ChatCompletion.create(\n",
    "        model=\"gpt-3.5-turbo\",\n",
    "        messages= [{\"role\": \"user\", \"content\": final_prompt}],\n",
    "        temperature=0.7,\n",
    "        max_tokens=4096,\n",
    "        top_p=1,\n",
    "        frequency_penalty=0,\n",
    "        presence_penalty=0,\n",
    "        stop=None)\n",
    "    \n",
    "    reply = response[\"choices\"][0][\"message\"][\"content\"]\n",
    "    return reply"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "66847fbc",
   "metadata": {},
   "outputs": [],
   "source": [
    "count = 0\n",
    "\n",
    "batch_size = 100  #Tunable parameter\n",
    "\n",
    "while len(ip_list2) > 0:\n",
    "    temp_list = ip_list2[:batch_size]\n",
    " \n",
    "    output_list = []\n",
    "\n",
    "    for item in temp_list:\n",
    "        output_list.append(chat_gpt_response(item))\n",
    "    \n",
    "    data = {'Input': temp_list,'Output': output_list }\n",
    "    df_ans = pd.DataFrame(data)\n",
    "    df_ans.to_csv(\"output_wic_word_check_shard_\" + str(count) + \".csv\", index = False)\n",
    "    count+=1\n",
    "    print(\"shard number:\",count,\"Done\")\n",
    "    ip_list2 = ip_list2[batch_size:]"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python [conda env:root] *",
   "language": "python",
   "name": "conda-root-py"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.7"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
