{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {
    "ExecuteTime": {
     "end_time": "2022-10-05T17:03:02.127695Z",
     "start_time": "2022-10-05T17:02:59.735238Z"
    },
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "jkCx5GziPtde",
    "outputId": "1c526707-0f81-4cbe-ffc5-e030b5f47557"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Requirement already satisfied: openai in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (0.23.0)\n",
      "Requirement already satisfied: typing-extensions in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (from openai) (3.10.0.2)\n",
      "Requirement already satisfied: openpyxl>=3.0.7 in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (from openai) (3.0.9)\n",
      "Requirement already satisfied: requests>=2.20 in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (from openai) (2.26.0)\n",
      "Requirement already satisfied: pandas>=1.2.3 in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (from openai) (1.3.4)\n",
      "Requirement already satisfied: pandas-stubs>=1.1.0.11 in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (from openai) (1.4.3.220822)\n",
      "Requirement already satisfied: numpy in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (from openai) (1.20.3)\n",
      "Requirement already satisfied: tqdm in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (from openai) (4.62.3)\n",
      "Requirement already satisfied: et-xmlfile in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (from openpyxl>=3.0.7->openai) (1.1.0)\n",
      "Requirement already satisfied: python-dateutil>=2.7.3 in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (from pandas>=1.2.3->openai) (2.8.2)\n",
      "Requirement already satisfied: pytz>=2017.3 in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (from pandas>=1.2.3->openai) (2021.3)\n",
      "Requirement already satisfied: types-pytz>=2022.1.1 in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (from pandas-stubs>=1.1.0.11->openai) (2022.2.1.0)\n",
      "Requirement already satisfied: six>=1.5 in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (from python-dateutil>=2.7.3->pandas>=1.2.3->openai) (1.16.0)\n",
      "Requirement already satisfied: certifi>=2017.4.17 in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (from requests>=2.20->openai) (2021.10.8)\n",
      "Requirement already satisfied: idna<4,>=2.5 in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (from requests>=2.20->openai) (3.2)\n",
      "Requirement already satisfied: urllib3<1.27,>=1.21.1 in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (from requests>=2.20->openai) (1.26.7)\n",
      "Requirement already satisfied: charset-normalizer~=2.0.0 in /Users/him1411/opt/anaconda3/lib/python3.9/site-packages (from requests>=2.20->openai) (2.0.4)\n"
     ]
    }
   ],
   "source": [
    "!pip install openai"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {
    "ExecuteTime": {
     "end_time": "2022-10-05T21:07:35.802828Z",
     "start_time": "2022-10-05T21:07:34.055016Z"
    },
    "id": "YUDHKBmqPLrp"
   },
   "outputs": [],
   "source": [
    "import os\n",
    "import openai\n",
    "import pandas as pd\n",
    "from collections import deque\n",
    "from tqdm import tqdm\n",
    "\n",
    "openai.api_key = \"\" #Use cautiously "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {
    "ExecuteTime": {
     "end_time": "2022-10-05T21:07:36.510514Z",
     "start_time": "2022-10-05T21:07:36.369275Z"
    },
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "YMt2xuoOPwDB",
    "outputId": "48148b63-7a8c-4366-9985-f6f0eb3a2a22"
   },
   "outputs": [
    {
     "ename": "ModuleNotFoundError",
     "evalue": "No module named 'google.colab'",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mModuleNotFoundError\u001b[0m                       Traceback (most recent call last)",
      "\u001b[0;32m/var/folders/xf/l5jsvn9s4y73c622dmjv9p0r0000gn/T/ipykernel_14273/1408506528.py\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0;32mfrom\u001b[0m \u001b[0mgoogle\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcolab\u001b[0m \u001b[0;32mimport\u001b[0m \u001b[0mdrive\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m      2\u001b[0m \u001b[0mdrive\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmount\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m'/content/drive'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;31mModuleNotFoundError\u001b[0m: No module named 'google.colab'"
     ]
    }
   ],
   "source": [
    "from google.colab import drive\n",
    "drive.mount('/content/drive')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {
    "ExecuteTime": {
     "end_time": "2022-10-05T21:07:37.235384Z",
     "start_time": "2022-10-05T21:07:37.225193Z"
    },
    "id": "wFSckmkuPyIs"
   },
   "outputs": [],
   "source": [
    "def gpt3(oneshot, premise, prmpt):\n",
    "  allData = \"\"\n",
    "  ppt = oneshot + \"\\n\" + prmpt + premise + \"\\n\\npronoun: \\n\"\n",
    "  \n",
    "  response = openai.Completion.create(\n",
    "  model=\"text-davinci-002\",\n",
    "  prompt=ppt,\n",
    "  temperature=0.7,\n",
    "  max_tokens=512,\n",
    "  top_p=1,\n",
    "  frequency_penalty=2,\n",
    "  presence_penalty=2\n",
    "  )\n",
    "  print(\"ppt----------> \",ppt, \"\\n GPT3:\\n\", response['choices'][0]['text'])\n",
    "  allData = {\"Premise\":premise,\"GPT3 Response\":\"Choice 1:\\n\"+ response['choices'][0]['text']}\n",
    "\n",
    "  return allData"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {
    "ExecuteTime": {
     "end_time": "2022-10-05T21:07:39.327784Z",
     "start_time": "2022-10-05T21:07:39.292156Z"
    },
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 206
    },
    "id": "qHf2xjKzQgx3",
    "outputId": "02d1917b-55e7-48b9-b45b-4d30e9c5b563"
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Premise List</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>The city councilmen refused the demonstrators ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>The city councilmen refused the demonstrators ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>The trophy doesn't fit into the brown suitcase...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>The trophy doesn't fit into the brown suitcase...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>Joan made sure to thank Susan for all the help...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                        Premise List\n",
       "0  The city councilmen refused the demonstrators ...\n",
       "1  The city councilmen refused the demonstrators ...\n",
       "2  The trophy doesn't fit into the brown suitcase...\n",
       "3  The trophy doesn't fit into the brown suitcase...\n",
       "4  Joan made sure to thank Susan for all the help..."
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_cause = pd.read_csv(\"wsc_premise_list.csv\")\n",
    "df_cause.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {
    "ExecuteTime": {
     "end_time": "2022-10-05T21:07:40.447799Z",
     "start_time": "2022-10-05T21:07:40.435567Z"
    },
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 206
    },
    "id": "MFlWtaGeQt4I",
    "outputId": "c2ab7ca3-1b1a-48eb-88b8-a5e18b0a840c"
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>gpt-3response</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "Empty DataFrame\n",
       "Columns: [gpt-3response]\n",
       "Index: []"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_result.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {
    "ExecuteTime": {
     "end_time": "2022-10-05T21:09:28.720956Z",
     "start_time": "2022-10-05T21:09:13.804448Z"
    },
    "id": "0ENQWvqkP0nz"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "ppt---------->  A sample consists of a sentence, a pronoun from the sentence and two options from the sentence that give the pronoun resolution. Out of the two options, the correct option is given using the answer category. An example is given below to help you out. \n",
      "\n",
      "sentence:\n",
      "The trophy doesn't fit into the brown suitcase because it is too large.\n",
      "\n",
      "pronoun:\n",
      "it\n",
      "\n",
      "option 1:\n",
      "trophy\n",
      "\n",
      "option 2:\n",
      "suitcase\n",
      "\n",
      "Answer:\n",
      " trophy\n",
      "Generate more samples now. Be diverse in sample generation. \n",
      "\n",
      "sentence:\n",
      "The city councilmen refused the demonstrators a permit because they feared violence.\n",
      "\n",
      "pronoun: \n",
      " \n",
      " GPT3:\n",
      " they\n",
      "\n",
      "option 1: \n",
      "city councilmen \n",
      "option 2: demonstrators \n",
      "Answer: city councilmen\n",
      "ppt---------->  A sample consists of a sentence, a pronoun from the sentence and two options from the sentence that give the pronoun resolution. Out of the two options, the correct option is given using the answer category. An example is given below to help you out. \n",
      "\n",
      "sentence:\n",
      "The trophy doesn't fit into the brown suitcase because it is too large.\n",
      "\n",
      "pronoun:\n",
      "it\n",
      "\n",
      "option 1:\n",
      "trophy\n",
      "\n",
      "option 2:\n",
      "suitcase\n",
      "\n",
      "Answer:\n",
      " trophy\n",
      "Generate more samples now. Be diverse in sample generation. \n",
      "\n",
      "sentence:\n",
      "The city councilmen refused the demonstrators a permit because they advocated violence.\n",
      "\n",
      "pronoun: \n",
      " \n",
      " GPT3:\n",
      " they\n",
      "\n",
      "option 1: \n",
      "city councilmen \n",
      "option 2:  demonstrators\n",
      "ppt---------->  A sample consists of a sentence, a pronoun from the sentence and two options from the sentence that give the pronoun resolution. Out of the two options, the correct option is given using the answer category. An example is given below to help you out. \n",
      "\n",
      "sentence:\n",
      "The trophy doesn't fit into the brown suitcase because it is too large.\n",
      "\n",
      "pronoun:\n",
      "it\n",
      "\n",
      "option 1:\n",
      "trophy\n",
      "\n",
      "option 2:\n",
      "suitcase\n",
      "\n",
      "Answer:\n",
      " trophy\n",
      "Generate more samples now. Be diverse in sample generation. \n",
      "\n",
      "sentence:\n",
      "The trophy doesn't fit into the brown suitcase because it is too large.\n",
      "\n",
      "pronoun: \n",
      " \n",
      " GPT3:\n",
      " The trophy\n",
      "\n",
      "option 1: \n",
      "it is too large.\n",
      "option 2: \n",
      "The trophy doesn't fit into the brown suitcase because The trophy is too large.\n",
      "\n",
      " Answer: it is too large\n",
      "ppt---------->  A sample consists of a sentence, a pronoun from the sentence and two options from the sentence that give the pronoun resolution. Out of the two options, the correct option is given using the answer category. An example is given below to help you out. \n",
      "\n",
      "sentence:\n",
      "The trophy doesn't fit into the brown suitcase because it is too large.\n",
      "\n",
      "pronoun:\n",
      "it\n",
      "\n",
      "option 1:\n",
      "trophy\n",
      "\n",
      "option 2:\n",
      "suitcase\n",
      "\n",
      "Answer:\n",
      " trophy\n",
      "Generate more samples now. Be diverse in sample generation. \n",
      "\n",
      "sentence:\n",
      "The trophy doesn't fit into the brown suitcase because it is too small.\n",
      "\n",
      "pronoun: \n",
      " \n",
      " GPT3:\n",
      " it\n",
      "\n",
      "option 1: \n",
      "suitcase\n",
      "\n",
      "option 2: \n",
      "trophy\n",
      "ppt---------->  A sample consists of a sentence, a pronoun from the sentence and two options from the sentence that give the pronoun resolution. Out of the two options, the correct option is given using the answer category. An example is given below to help you out. \n",
      "\n",
      "sentence:\n",
      "The trophy doesn't fit into the brown suitcase because it is too large.\n",
      "\n",
      "pronoun:\n",
      "it\n",
      "\n",
      "option 1:\n",
      "trophy\n",
      "\n",
      "option 2:\n",
      "suitcase\n",
      "\n",
      "Answer:\n",
      " trophy\n",
      "Generate more samples now. Be diverse in sample generation. \n",
      "\n",
      "sentence:\n",
      "Joan made sure to thank Susan for all the help she had recieved.\n",
      "\n",
      "pronoun: \n",
      " \n",
      " GPT3:\n",
      " she\n",
      "\n",
      "option 1: \n",
      "Joan \n",
      "option 2: Susan\n",
      "ppt---------->  A sample consists of a sentence, a pronoun from the sentence and two options from the sentence that give the pronoun resolution. Out of the two options, the correct option is given using the answer category. An example is given below to help you out. \n",
      "\n",
      "sentence:\n",
      "The trophy doesn't fit into the brown suitcase because it is too large.\n",
      "\n",
      "pronoun:\n",
      "it\n",
      "\n",
      "option 1:\n",
      "trophy\n",
      "\n",
      "option 2:\n",
      "suitcase\n",
      "\n",
      "Answer:\n",
      " trophy\n",
      "Generate more samples now. Be diverse in sample generation. \n",
      "\n",
      "sentence:\n",
      "Joan made sure to thank Susan for all the help she had given.\n",
      "\n",
      "pronoun: \n",
      " \n",
      " GPT3:\n",
      " she\n",
      "\n",
      "option 1: \n",
      "Joan \n",
      "option 2: Susan \n",
      "Answer: Susan\n",
      "ppt---------->  A sample consists of a sentence, a pronoun from the sentence and two options from the sentence that give the pronoun resolution. Out of the two options, the correct option is given using the answer category. An example is given below to help you out. \n",
      "\n",
      "sentence:\n",
      "The trophy doesn't fit into the brown suitcase because it is too large.\n",
      "\n",
      "pronoun:\n",
      "it\n",
      "\n",
      "option 1:\n",
      "trophy\n",
      "\n",
      "option 2:\n",
      "suitcase\n",
      "\n",
      "Answer:\n",
      " trophy\n",
      "Generate more samples now. Be diverse in sample generation. \n",
      "\n",
      "sentence:\n",
      "Paul tried to call George on the phone, but he wasn't successful.\n",
      "\n",
      "pronoun: \n",
      " \n",
      " GPT3:\n",
      " he\n",
      "\n",
      "option 1: \n",
      "Paul \n",
      "option 2: \n",
      "George \n",
      "Answer: George\n",
      "ppt---------->  A sample consists of a sentence, a pronoun from the sentence and two options from the sentence that give the pronoun resolution. Out of the two options, the correct option is given using the answer category. An example is given below to help you out. \n",
      "\n",
      "sentence:\n",
      "The trophy doesn't fit into the brown suitcase because it is too large.\n",
      "\n",
      "pronoun:\n",
      "it\n",
      "\n",
      "option 1:\n",
      "trophy\n",
      "\n",
      "option 2:\n",
      "suitcase\n",
      "\n",
      "Answer:\n",
      " trophy\n",
      "Generate more samples now. Be diverse in sample generation. \n",
      "\n",
      "sentence:\n",
      "Paul tried to call George on the phone, but he wasn't available.\n",
      "\n",
      "pronoun: \n",
      " \n",
      " GPT3:\n",
      " he\n",
      "\n",
      "option 1: \n",
      "Paul \n",
      "option 2: \n",
      "George \n",
      "Answer: George\n",
      "ppt---------->  A sample consists of a sentence, a pronoun from the sentence and two options from the sentence that give the pronoun resolution. Out of the two options, the correct option is given using the answer category. An example is given below to help you out. \n",
      "\n",
      "sentence:\n",
      "The trophy doesn't fit into the brown suitcase because it is too large.\n",
      "\n",
      "pronoun:\n",
      "it\n",
      "\n",
      "option 1:\n",
      "trophy\n",
      "\n",
      "option 2:\n",
      "suitcase\n",
      "\n",
      "Answer:\n",
      " trophy\n",
      "Generate more samples now. Be diverse in sample generation. \n",
      "\n",
      "sentence:\n",
      "The lawyer asked the witness a question, but he was reluctant to repeat it.\n",
      "\n",
      "pronoun: \n",
      " \n",
      " GPT3:\n",
      " he\n",
      "\n",
      "option 1: \n",
      "witness\n",
      "option 2: lawyer\n",
      "ppt---------->  A sample consists of a sentence, a pronoun from the sentence and two options from the sentence that give the pronoun resolution. Out of the two options, the correct option is given using the answer category. An example is given below to help you out. \n",
      "\n",
      "sentence:\n",
      "The trophy doesn't fit into the brown suitcase because it is too large.\n",
      "\n",
      "pronoun:\n",
      "it\n",
      "\n",
      "option 1:\n",
      "trophy\n",
      "\n",
      "option 2:\n",
      "suitcase\n",
      "\n",
      "Answer:\n",
      " trophy\n",
      "Generate more samples now. Be diverse in sample generation. \n",
      "\n",
      "sentence:\n",
      "The lawyer asked the witness a question, but he was reluctant to answer it.\n",
      "\n",
      "pronoun: \n",
      " \n",
      " GPT3:\n",
      " it\n",
      "\n",
      "option 1: \n",
      "question \n",
      "option 2: answer \n",
      "Answer: question\n"
     ]
    }
   ],
   "source": [
    "data = []\n",
    "pathtosave = \"./\"\n",
    "shardno = 1\n",
    "num = 10 #Num of Premises or data to generate\n",
    "oneshot = '''A sample consists of a sentence, a pronoun from the sentence and two options from the sentence that give the pronoun resolution. Out of the two options, the correct option is given using the answer category. An example is given below to help you out. \n",
    "\n",
    "sentence:\n",
    "The trophy doesn't fit into the brown suitcase because it is too large.\n",
    "\n",
    "pronoun:\n",
    "it\n",
    "\n",
    "option 1:\n",
    "trophy\n",
    "\n",
    "option 2:\n",
    "suitcase\n",
    "\n",
    "Answer:\n",
    " trophy'''\n",
    "#change ppt\n",
    "ppt = '''Generate more samples now. Be diverse in sample generation. \n",
    "\n",
    "sentence:\\n'''\n",
    "for i in (range(df_cause.shape[0])):\n",
    "  if data!=[] and len(data)%100==0:\n",
    "    print(\"Shard no: \", shardno)\n",
    "    dataDF = pd.DataFrame(data)\n",
    "    dataDF.to_csv(pathtosave + f\"/shard_oneshot_copa_cause_{shardno}.csv\", index=False)\n",
    "    shardno+=1\n",
    "    data = []\n",
    "  if num==0:\n",
    "    break\n",
    "  d = gpt3(oneshot,df_cause.iloc[i]['Premise List'],ppt)\n",
    "  data.append(d)\n",
    "  num-=1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {
    "ExecuteTime": {
     "end_time": "2022-10-05T21:20:19.313457Z",
     "start_time": "2022-10-05T21:20:19.300247Z"
    },
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 206
    },
    "id": "AeL-GYXia5E1",
    "outputId": "025d6ded-9e08-4cb3-a194-7bc202b45ead"
   },
   "outputs": [],
   "source": [
    "df = pd.DataFrame(data)\n",
    "df.to_csv(pathtosave + \"WSC_result.csv\", index=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "GI3E_77TgsLc"
   },
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "colab": {
   "collapsed_sections": [],
   "provenance": []
  },
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.7"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 1
}
