{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "b8d619b7",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-07-22T02:20:17.014672Z",
     "start_time": "2023-07-22T02:20:16.714113Z"
    }
   },
   "outputs": [],
   "source": [
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "cd1e8993",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-07-22T02:20:42.833373Z",
     "start_time": "2023-07-22T02:20:42.826995Z"
    }
   },
   "outputs": [],
   "source": [
    "prompt1 = '''The given sentence has two noun phrases. Generate two clauses that could reasonably end this sentence. Each clause must contain a pronoun that refers to a different noun phrase from the sentence.\n",
    "Input: The city councilmen refused the demonstrators a permit because\n",
    "Output:\n",
    "Clause 1: they feared violence would occur\n",
    "Pronoun: they\n",
    "Pronoun in clause 1 refers to [the city councilmen]\n",
    "Clause 2: they advocated violence to achieve their goals\n",
    "Pronoun: they\n",
    "Pronoun in clause 2 refers to [the demonstrators]\n",
    "Explanation: The pronoun in clause 1 refers to the city councilmen. The pronoun in clause 2 refers to the demonstrators. Thus, both generated clauses refer to different noun phrases present in the sentence.\n",
    "Input: The professor graded his students harshly because\n",
    "Output:\n",
    " \n",
    "The given sentence has two noun phrases. Generate two clauses that could reasonably end this sentence. Each clause must contain a common pronoun that refers to a different noun phrase from the sentence. The noun phrases must not appear in the clauses.\n",
    "Input: The city councilmen refused the demonstrators a permit because\n",
    "Output:\n",
    "Clause 1: they feared violence would occur\n",
    "Clause 2: they advocated violence to achieve their goals\n",
    "Explanation: The common pronoun is “they”. The pronoun in clause 1 refers to the city councilmen. The pronoun in clause 2 refers to the demonstrators. Thus, both generated clauses refer to different noun phrases present in the sentence.\n",
    "Input:\n",
    "'''\n",
    "\n",
    "prompt2 = '''\n",
    "Output:\n",
    "'''\n",
    "\n",
    "# prompt3 = '''\n",
    "# Chosen definition:\n",
    "# '''"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "98acbf49",
   "metadata": {},
   "outputs": [],
   "source": [
    "def chat_gpt_response(sample):\n",
    "    final_prompt = prompt1 + sample + prompt2 #+ sample[1] + prompt3\n",
    "    \n",
    "    response=openai.ChatCompletion.create(\n",
    "        model=\"gpt-3.5-turbo\",\n",
    "        messages= [{\"role\": \"user\", \"content\": final_prompt}],\n",
    "        temperature=0.7,\n",
    "        max_tokens=4096,\n",
    "        top_p=1,\n",
    "        frequency_penalty=0,\n",
    "        presence_penalty=0,\n",
    "        stop=None)\n",
    "    \n",
    "    reply = response[\"choices\"][0][\"message\"][\"content\"]\n",
    "    return reply"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "8369b3fc",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-07-22T02:35:07.203353Z",
     "start_time": "2023-07-22T02:35:07.189444Z"
    }
   },
   "outputs": [],
   "source": [
    "df = pd.read_csv(\"wsc_step_2_input.csv\")\n",
    "ip_list2 = list(df['Input'])\n",
    "# list1 = list(df['Input'])\n",
    "# list2 = list(df['Output'])\n",
    "# # ip_list = list(df['Word List'])\n",
    "# # ip_list2 = ip_list\n",
    "\n",
    "# ip_list = [ [x,y] for x, y in zip(list1, list2)]\n",
    "\n",
    "# ip_list2 = ip_list[:2]\n",
    "# len(ip_list2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4cea07f5",
   "metadata": {},
   "outputs": [],
   "source": [
    "count = 0\n",
    "\n",
    "batch_size = 100  #Tunable parameter\n",
    "\n",
    "while len(ip_list2) > 0:\n",
    "    temp_list = ip_list2[:batch_size] \n",
    "    output_list = []\n",
    "\n",
    "    for item in temp_list:\n",
    "        output_list.append(chat_gpt_response(item))\n",
    "    \n",
    "    data = {'Input': temp_list,'Output': output_list }\n",
    "    df_ans = pd.DataFrame(data)\n",
    "    df_ans.to_csv(\"output_wsc_part_2_shard_\" + str(count) + \".csv\", index = False)\n",
    "    count+=1\n",
    "    print(\"shard number:\",count,\"Done\")\n",
    "    ip_list2 = ip_list2[batch_size:]"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python [conda env:root] *",
   "language": "python",
   "name": "conda-root-py"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.7"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
