{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "jkCx5GziPtde",
    "outputId": "1c526707-0f81-4cbe-ffc5-e030b5f47557"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n",
      "Collecting openai\n",
      "  Downloading openai-0.23.0.tar.gz (43 kB)\n",
      "\u001b[K     |████████████████████████████████| 43 kB 1.5 MB/s \n",
      "\u001b[?25h  Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n",
      "  Getting requirements to build wheel ... \u001b[?25l\u001b[?25hdone\n",
      "    Preparing wheel metadata ... \u001b[?25l\u001b[?25hdone\n",
      "Requirement already satisfied: openpyxl>=3.0.7 in /usr/local/lib/python3.7/dist-packages (from openai) (3.0.10)\n",
      "Requirement already satisfied: requests>=2.20 in /usr/local/lib/python3.7/dist-packages (from openai) (2.23.0)\n",
      "Requirement already satisfied: pandas>=1.2.3 in /usr/local/lib/python3.7/dist-packages (from openai) (1.3.5)\n",
      "Requirement already satisfied: numpy in /usr/local/lib/python3.7/dist-packages (from openai) (1.21.6)\n",
      "Collecting pandas-stubs>=1.1.0.11\n",
      "  Downloading pandas_stubs-1.2.0.62-py3-none-any.whl (163 kB)\n",
      "\u001b[K     |████████████████████████████████| 163 kB 8.6 MB/s \n",
      "\u001b[?25hRequirement already satisfied: tqdm in /usr/local/lib/python3.7/dist-packages (from openai) (4.64.1)\n",
      "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.7/dist-packages (from openai) (4.1.1)\n",
      "Requirement already satisfied: et-xmlfile in /usr/local/lib/python3.7/dist-packages (from openpyxl>=3.0.7->openai) (1.1.0)\n",
      "Requirement already satisfied: python-dateutil>=2.7.3 in /usr/local/lib/python3.7/dist-packages (from pandas>=1.2.3->openai) (2.8.2)\n",
      "Requirement already satisfied: pytz>=2017.3 in /usr/local/lib/python3.7/dist-packages (from pandas>=1.2.3->openai) (2022.2.1)\n",
      "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.7/dist-packages (from python-dateutil>=2.7.3->pandas>=1.2.3->openai) (1.15.0)\n",
      "Requirement already satisfied: chardet<4,>=3.0.2 in /usr/local/lib/python3.7/dist-packages (from requests>=2.20->openai) (3.0.4)\n",
      "Requirement already satisfied: idna<3,>=2.5 in /usr/local/lib/python3.7/dist-packages (from requests>=2.20->openai) (2.10)\n",
      "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.7/dist-packages (from requests>=2.20->openai) (2022.6.15)\n",
      "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /usr/local/lib/python3.7/dist-packages (from requests>=2.20->openai) (1.24.3)\n",
      "Building wheels for collected packages: openai\n",
      "  Building wheel for openai (PEP 517) ... \u001b[?25l\u001b[?25hdone\n",
      "  Created wheel for openai: filename=openai-0.23.0-py3-none-any.whl size=54478 sha256=d1bba1a625c65bd07f4a5e8b3144c9d6b23bd915ab0b94de6b54eead8d954b36\n",
      "  Stored in directory: /root/.cache/pip/wheels/70/d5/31/f9f67660319d89e4f54501d27b1e90f88a3309c42ea4fd734c\n",
      "Successfully built openai\n",
      "Installing collected packages: pandas-stubs, openai\n",
      "Successfully installed openai-0.23.0 pandas-stubs-1.2.0.62\n"
     ]
    }
   ],
   "source": [
    "!pip install openai"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {
    "id": "YUDHKBmqPLrp"
   },
   "outputs": [],
   "source": [
    "import os\n",
    "import openai\n",
    "import pandas as pd\n",
    "from collections import deque\n",
    "from tqdm import tqdm\n",
    "\n",
    "openai.api_key = \"API TOKEN\" #Use cautiously "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "YMt2xuoOPwDB",
    "outputId": "48148b63-7a8c-4366-9985-f6f0eb3a2a22"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Mounted at /content/drive\n"
     ]
    }
   ],
   "source": [
    "from google.colab import drive\n",
    "drive.mount('/content/drive')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {
    "id": "wFSckmkuPyIs"
   },
   "outputs": [],
   "source": [
    "def gpt3(oneshot, premise, prmpt):\n",
    "  allData = \"\"\n",
    "  ppt = oneshot + \"\\n\" + prmpt + premise + \"\\n\\nChoice 1: \\n\"\n",
    "  \n",
    "  response = openai.Completion.create(\n",
    "  model=\"text-davinci-002\",\n",
    "  prompt=ppt,\n",
    "  temperature=0.7,\n",
    "  max_tokens=512,\n",
    "  top_p=1,\n",
    "  frequency_penalty=2,\n",
    "  presence_penalty=2\n",
    "  )\n",
    "  print(\"ppt----------> \",ppt, \"\\n GPT3:\\n\", response['choices'][0]['text'])\n",
    "  allData = {\"Premise\":premise,\"GPT3 Response\":\"Choice 1:\\n\"+ response['choices'][0]['text']}\n",
    "\n",
    "  return allData"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 206
    },
    "id": "qHf2xjKzQgx3",
    "outputId": "02d1917b-55e7-48b9-b45b-4d30e9c5b563"
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "\n",
       "  <div id=\"df-d5efe7f4-0223-4e3c-b0b2-ef257b67a308\">\n",
       "    <div class=\"colab-df-container\">\n",
       "      <div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Premise List</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>My body cast a shadow over the grass.What was ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>The woman tolerated her friend's difficult beh...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>The women met for coffee.What was the CAUSE of...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>The runner wore shorts.What was the CAUSE of t...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>The guests of the party hid behind the couch.W...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>\n",
       "      <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-d5efe7f4-0223-4e3c-b0b2-ef257b67a308')\"\n",
       "              title=\"Convert this dataframe to an interactive table.\"\n",
       "              style=\"display:none;\">\n",
       "        \n",
       "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
       "       width=\"24px\">\n",
       "    <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n",
       "    <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n",
       "  </svg>\n",
       "      </button>\n",
       "      \n",
       "  <style>\n",
       "    .colab-df-container {\n",
       "      display:flex;\n",
       "      flex-wrap:wrap;\n",
       "      gap: 12px;\n",
       "    }\n",
       "\n",
       "    .colab-df-convert {\n",
       "      background-color: #E8F0FE;\n",
       "      border: none;\n",
       "      border-radius: 50%;\n",
       "      cursor: pointer;\n",
       "      display: none;\n",
       "      fill: #1967D2;\n",
       "      height: 32px;\n",
       "      padding: 0 0 0 0;\n",
       "      width: 32px;\n",
       "    }\n",
       "\n",
       "    .colab-df-convert:hover {\n",
       "      background-color: #E2EBFA;\n",
       "      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
       "      fill: #174EA6;\n",
       "    }\n",
       "\n",
       "    [theme=dark] .colab-df-convert {\n",
       "      background-color: #3B4455;\n",
       "      fill: #D2E3FC;\n",
       "    }\n",
       "\n",
       "    [theme=dark] .colab-df-convert:hover {\n",
       "      background-color: #434B5C;\n",
       "      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
       "      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
       "      fill: #FFFFFF;\n",
       "    }\n",
       "  </style>\n",
       "\n",
       "      <script>\n",
       "        const buttonEl =\n",
       "          document.querySelector('#df-d5efe7f4-0223-4e3c-b0b2-ef257b67a308 button.colab-df-convert');\n",
       "        buttonEl.style.display =\n",
       "          google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
       "\n",
       "        async function convertToInteractive(key) {\n",
       "          const element = document.querySelector('#df-d5efe7f4-0223-4e3c-b0b2-ef257b67a308');\n",
       "          const dataTable =\n",
       "            await google.colab.kernel.invokeFunction('convertToInteractive',\n",
       "                                                     [key], {});\n",
       "          if (!dataTable) return;\n",
       "\n",
       "          const docLinkHtml = 'Like what you see? Visit the ' +\n",
       "            '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
       "            + ' to learn more about interactive tables.';\n",
       "          element.innerHTML = '';\n",
       "          dataTable['output_type'] = 'display_data';\n",
       "          await google.colab.output.renderOutput(dataTable, element);\n",
       "          const docLink = document.createElement('div');\n",
       "          docLink.innerHTML = docLinkHtml;\n",
       "          element.appendChild(docLink);\n",
       "        }\n",
       "      </script>\n",
       "    </div>\n",
       "  </div>\n",
       "  "
      ],
      "text/plain": [
       "                                        Premise List\n",
       "0  My body cast a shadow over the grass.What was ...\n",
       "1  The woman tolerated her friend's difficult beh...\n",
       "2  The women met for coffee.What was the CAUSE of...\n",
       "3  The runner wore shorts.What was the CAUSE of t...\n",
       "4  The guests of the party hid behind the couch.W..."
      ]
     },
     "execution_count": 18,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_cause = pd.read_csv(\"/content/drive/MyDrive/Colab Notebooks/DataGen/Copa/Copa_cause_list.csv\")\n",
    "df_result = pd.read_csv(\"/content/drive/MyDrive/Colab Notebooks/DataGen/Copa/Copa_result_list.csv\")\n",
    "df_cause.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 206
    },
    "id": "MFlWtaGeQt4I",
    "outputId": "c2ab7ca3-1b1a-48eb-88b8-a5e18b0a840c"
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "\n",
       "  <div id=\"df-9814977d-6448-4a9c-8b92-fbc41aae910a\">\n",
       "    <div class=\"colab-df-container\">\n",
       "      <div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Premise List</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>The physician misdiagnosed the patient.What ha...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>The elderly woman suffered a stroke.What happe...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>The pond froze over for the winter.What happen...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>The offender violated parole.What happened as ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>I poured water on my sleeping friend.What happ...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>\n",
       "      <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-9814977d-6448-4a9c-8b92-fbc41aae910a')\"\n",
       "              title=\"Convert this dataframe to an interactive table.\"\n",
       "              style=\"display:none;\">\n",
       "        \n",
       "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
       "       width=\"24px\">\n",
       "    <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n",
       "    <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n",
       "  </svg>\n",
       "      </button>\n",
       "      \n",
       "  <style>\n",
       "    .colab-df-container {\n",
       "      display:flex;\n",
       "      flex-wrap:wrap;\n",
       "      gap: 12px;\n",
       "    }\n",
       "\n",
       "    .colab-df-convert {\n",
       "      background-color: #E8F0FE;\n",
       "      border: none;\n",
       "      border-radius: 50%;\n",
       "      cursor: pointer;\n",
       "      display: none;\n",
       "      fill: #1967D2;\n",
       "      height: 32px;\n",
       "      padding: 0 0 0 0;\n",
       "      width: 32px;\n",
       "    }\n",
       "\n",
       "    .colab-df-convert:hover {\n",
       "      background-color: #E2EBFA;\n",
       "      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
       "      fill: #174EA6;\n",
       "    }\n",
       "\n",
       "    [theme=dark] .colab-df-convert {\n",
       "      background-color: #3B4455;\n",
       "      fill: #D2E3FC;\n",
       "    }\n",
       "\n",
       "    [theme=dark] .colab-df-convert:hover {\n",
       "      background-color: #434B5C;\n",
       "      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
       "      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
       "      fill: #FFFFFF;\n",
       "    }\n",
       "  </style>\n",
       "\n",
       "      <script>\n",
       "        const buttonEl =\n",
       "          document.querySelector('#df-9814977d-6448-4a9c-8b92-fbc41aae910a button.colab-df-convert');\n",
       "        buttonEl.style.display =\n",
       "          google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
       "\n",
       "        async function convertToInteractive(key) {\n",
       "          const element = document.querySelector('#df-9814977d-6448-4a9c-8b92-fbc41aae910a');\n",
       "          const dataTable =\n",
       "            await google.colab.kernel.invokeFunction('convertToInteractive',\n",
       "                                                     [key], {});\n",
       "          if (!dataTable) return;\n",
       "\n",
       "          const docLinkHtml = 'Like what you see? Visit the ' +\n",
       "            '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
       "            + ' to learn more about interactive tables.';\n",
       "          element.innerHTML = '';\n",
       "          dataTable['output_type'] = 'display_data';\n",
       "          await google.colab.output.renderOutput(dataTable, element);\n",
       "          const docLink = document.createElement('div');\n",
       "          docLink.innerHTML = docLinkHtml;\n",
       "          element.appendChild(docLink);\n",
       "        }\n",
       "      </script>\n",
       "    </div>\n",
       "  </div>\n",
       "  "
      ],
      "text/plain": [
       "                                        Premise List\n",
       "0  The physician misdiagnosed the patient.What ha...\n",
       "1  The elderly woman suffered a stroke.What happe...\n",
       "2  The pond froze over for the winter.What happen...\n",
       "3  The offender violated parole.What happened as ...\n",
       "4  I poured water on my sleeping friend.What happ..."
      ]
     },
     "execution_count": 19,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_result.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "0ENQWvqkP0nz"
   },
   "outputs": [],
   "source": [
    "data = []\n",
    "pathtosave = \"/content/drive/MyDrive/Colab Notebooks/DataGen/Copa\"\n",
    "shardno = 1\n",
    "num = 10 #Num of Premises or data to generate\n",
    "oneshot = '''Generate a sample that consists of a premise ,  2 alternate choices and an answer highlighting the correct choice. \\n\\nEach sample has a premise and two alternatives, where the task is to select the alternative that more plausibly has a causal relation with the premise.\\n\\nAlso, determine the relationship between the correct alternative and premise as cause or effect while giving the output of the correct choice. An example is given below to help you out. \\n\\nPremise: \\nThe runner wore shorts. What was the CAUSE of this?\\n\\nChoice 1:\\nThe forecast predicted high temperatures.\\n\\nChoice 2:\\nShe planned to run along the beach.\\n\\nAnswer:\\nChoice 1 \\n\\nGenerate more samples now. Be diverse in sample generation. \\n\\nPremise:'''\n",
    "#change ppt\n",
    "ppt = '''Generate more samples now. Be diverse in sample generation. \\n\\nPremise:\\n'''\n",
    "for i in (range(df_cause.shape[0])):\n",
    "  if data!=[] and len(data)%100==0:\n",
    "    print(\"Shard no: \", shardno)\n",
    "    dataDF = pd.DataFrame(data)\n",
    "    dataDF.to_csv(pathtosave + f\"/shard_oneshot_copa_cause_{shardno}.csv\", index=False)\n",
    "    shardno+=1\n",
    "    data = []\n",
    "  if num==0:\n",
    "    break\n",
    "  d = gpt3(oneshot,df_cause.iloc[i]['Premise List'],ppt)\n",
    "  data.append(d)\n",
    "  num-=1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 206
    },
    "id": "AeL-GYXia5E1",
    "outputId": "025d6ded-9e08-4cb3-a194-7bc202b45ead"
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "\n",
       "  <div id=\"df-c36588e7-e038-4831-9849-cb9299ed767c\">\n",
       "    <div class=\"colab-df-container\">\n",
       "      <div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Premise</th>\n",
       "      <th>GPT3 Response</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>My body cast a shadow over the grass.What was ...</td>\n",
       "      <td>Choice 1:\\nThe sun was setting. \\nChoice 2: I ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>The woman tolerated her friend's difficult beh...</td>\n",
       "      <td>Choice 1:\\nShe was raised to be polite and pat...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>The women met for coffee.What was the CAUSE of...</td>\n",
       "      <td>Choice 1:\\n They were friends from college.\\nC...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>The runner wore shorts.What was the CAUSE of t...</td>\n",
       "      <td>Choice 1:\\nThe forecast predicted high tempera...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>The guests of the party hid behind the couch.W...</td>\n",
       "      <td>Choice 1:\\nThey saw a spider on the floor. \\nC...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>\n",
       "      <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-c36588e7-e038-4831-9849-cb9299ed767c')\"\n",
       "              title=\"Convert this dataframe to an interactive table.\"\n",
       "              style=\"display:none;\">\n",
       "        \n",
       "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
       "       width=\"24px\">\n",
       "    <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n",
       "    <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n",
       "  </svg>\n",
       "      </button>\n",
       "      \n",
       "  <style>\n",
       "    .colab-df-container {\n",
       "      display:flex;\n",
       "      flex-wrap:wrap;\n",
       "      gap: 12px;\n",
       "    }\n",
       "\n",
       "    .colab-df-convert {\n",
       "      background-color: #E8F0FE;\n",
       "      border: none;\n",
       "      border-radius: 50%;\n",
       "      cursor: pointer;\n",
       "      display: none;\n",
       "      fill: #1967D2;\n",
       "      height: 32px;\n",
       "      padding: 0 0 0 0;\n",
       "      width: 32px;\n",
       "    }\n",
       "\n",
       "    .colab-df-convert:hover {\n",
       "      background-color: #E2EBFA;\n",
       "      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
       "      fill: #174EA6;\n",
       "    }\n",
       "\n",
       "    [theme=dark] .colab-df-convert {\n",
       "      background-color: #3B4455;\n",
       "      fill: #D2E3FC;\n",
       "    }\n",
       "\n",
       "    [theme=dark] .colab-df-convert:hover {\n",
       "      background-color: #434B5C;\n",
       "      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
       "      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
       "      fill: #FFFFFF;\n",
       "    }\n",
       "  </style>\n",
       "\n",
       "      <script>\n",
       "        const buttonEl =\n",
       "          document.querySelector('#df-c36588e7-e038-4831-9849-cb9299ed767c button.colab-df-convert');\n",
       "        buttonEl.style.display =\n",
       "          google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
       "\n",
       "        async function convertToInteractive(key) {\n",
       "          const element = document.querySelector('#df-c36588e7-e038-4831-9849-cb9299ed767c');\n",
       "          const dataTable =\n",
       "            await google.colab.kernel.invokeFunction('convertToInteractive',\n",
       "                                                     [key], {});\n",
       "          if (!dataTable) return;\n",
       "\n",
       "          const docLinkHtml = 'Like what you see? Visit the ' +\n",
       "            '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
       "            + ' to learn more about interactive tables.';\n",
       "          element.innerHTML = '';\n",
       "          dataTable['output_type'] = 'display_data';\n",
       "          await google.colab.output.renderOutput(dataTable, element);\n",
       "          const docLink = document.createElement('div');\n",
       "          docLink.innerHTML = docLinkHtml;\n",
       "          element.appendChild(docLink);\n",
       "        }\n",
       "      </script>\n",
       "    </div>\n",
       "  </div>\n",
       "  "
      ],
      "text/plain": [
       "                                             Premise  \\\n",
       "0  My body cast a shadow over the grass.What was ...   \n",
       "1  The woman tolerated her friend's difficult beh...   \n",
       "2  The women met for coffee.What was the CAUSE of...   \n",
       "3  The runner wore shorts.What was the CAUSE of t...   \n",
       "4  The guests of the party hid behind the couch.W...   \n",
       "\n",
       "                                       GPT3 Response  \n",
       "0  Choice 1:\\nThe sun was setting. \\nChoice 2: I ...  \n",
       "1  Choice 1:\\nShe was raised to be polite and pat...  \n",
       "2  Choice 1:\\n They were friends from college.\\nC...  \n",
       "3  Choice 1:\\nThe forecast predicted high tempera...  \n",
       "4  Choice 1:\\nThey saw a spider on the floor. \\nC...  "
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df = pd.DataFrame(data)\n",
    "df.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "hngXL4rFbISk",
    "outputId": "1c0c9d3d-ab52-4c6f-9980-e8fe9e901f7b"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "\n",
      "Choice 1:\n",
      "The sun was setting. \n",
      "Choice 2: I turned on the porch light. \n",
      "\n",
      "Answer: Choice 1\n",
      "\n",
      "\n",
      "Choice 1:\n",
      "She was raised to be polite and patient.\n",
      "\n",
      "Choice 2: \n",
      "She hoped her friend would change over time. \n",
      "\n",
      "Answer: Choice 1\n",
      "\n",
      "\n",
      "Choice 1:\n",
      " They were friends from college.\n",
      "Choice 2: \n",
      " They worked in the same office building.\n",
      "\n",
      "Answer: Choice 1\n",
      "\n",
      "\n",
      "Choice 1:\n",
      "The forecast predicted high temperatures. \n",
      "Choice 2: \n",
      "She planned to run along the beach. \n",
      "Answer: Choice 1\n",
      "\n",
      "\n",
      "Choice 1:\n",
      "They saw a spider on the floor. \n",
      "Choice 2: \n",
      "They were playing hide-and-seek. \n",
      "\n",
      "Answer: Choice 1\n",
      "\n",
      "\n",
      "Choice 1:\n",
      "He was caught in a corruption scandal.\n",
      "\n",
      "Choice 2: \n",
      "He promised to raise taxes.\n",
      "\n",
      "Answer: Choice 1\n",
      "\n",
      "\n",
      "Choice 1:\n",
      "I used laundry detergent. \n",
      "Choice 2: I spilled coffee on my shirt. \n",
      "\n",
      "Answer: Choice 2\n",
      "\n",
      "\n",
      "Choice 1:\n",
      "He had a coupon. \n",
      "Choice 2: \n",
      "It was senior citizen day. \n",
      "\n",
      "Answer: Choice 1\n",
      "\n",
      "\n",
      "Choice 1:\n",
      "The customer was unhappy with the product. \n",
      "Choice 2: \n",
      "The store manager was rude to the customer. \n",
      "\n",
      "Answer: Choice 1\n",
      "\n",
      "\n",
      "Choice 1:\n",
      "The faucet had been leaking for weeks. \n",
      "Choice 2: The woman was a professional plumber. \n",
      "\n",
      "Answer: Choice 1\n"
     ]
    }
   ],
   "source": [
    "for p in df.iloc[:,1]:\n",
    "  print(\"\\n\")\n",
    "  print(p)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "id": "5sSDhLY2exUw"
   },
   "source": [
    "## Result"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {
    "id": "k4Ns5vt2bRRI"
   },
   "outputs": [],
   "source": [
    "def gpt3(oneshot, premise, prmpt):\n",
    "  allData = \"\"\n",
    "  ppt = oneshot + \"\\n\" + prmpt + premise + \"\\n\\nChoice 1: \\n\"\n",
    "  \n",
    "  response = openai.Completion.create(\n",
    "  model=\"text-davinci-002\",\n",
    "  prompt=ppt,\n",
    "  temperature=0.7,\n",
    "  max_tokens=512,\n",
    "  top_p=1,\n",
    "  frequency_penalty=2,\n",
    "  presence_penalty=2\n",
    "  )\n",
    "  print(\"ppt----------> \",ppt, \"\\n GPT3:\\n\", response['choices'][0]['text'])\n",
    "  allData = {\"Premise\":premise,\"GPT3 Response\":\"Choice 1:\\n\"+ response['choices'][0]['text']}\n",
    "\n",
    "  return allData"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "WCYWNPS9ez2x"
   },
   "outputs": [],
   "source": [
    "data = []\n",
    "pathtosave = \"/content/drive/MyDrive/Colab Notebooks/DataGen/Copa\"\n",
    "shardno = 1\n",
    "num = 10 #Num of Premises or data to generate\n",
    "oneshot = '''Generate a sample that consists of a premise ,  2 alternate choices and an answer highlighting the correct choice. \\n\\nEach sample has a premise and two alternatives, where the task is to select the alternative that more plausibly has a causal relation with the premise.\\n\\nAlso, determine the relationship between the correct alternative and premise as cause or effect while giving the output of the correct choice. An example is given below to help you out. \\n\\nPremise: \\nThe pond froze over for the winter. What happened as a RESULT?\\n\\nChoice 1:\\nPeople skated on the pond.\\n\\nChoice 2:\\nPeople brought boats to the pond.\\n\\nAnswer:\\nChoice 1\\n'''\n",
    "#change ppt\n",
    "ppt = '''\\nGenerate more samples now. Be diverse in sample generation. \\n\\nPremise:\\n'''\n",
    "for i in (range(df_result.shape[0])):\n",
    "  if data!=[] and len(data)%100==0:\n",
    "    print(\"Shard no: \", shardno)\n",
    "    dataDF = pd.DataFrame(data)\n",
    "    dataDF.to_csv(pathtosave + f\"/shard_oneshot_copa_result_{shardno}.csv\", index=False)\n",
    "    shardno+=1\n",
    "    data = []\n",
    "  if num==0:\n",
    "    break\n",
    "  d = gpt3(oneshot,df_result.iloc[i]['Premise List'],ppt)\n",
    "  data.append(d)\n",
    "  num-=1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 206
    },
    "id": "6ndaCuDjrCcc",
    "outputId": "4641eef0-e42e-4ffd-f702-c8a45ef2c86b"
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "\n",
       "  <div id=\"df-fd473dc5-734e-4663-a094-ac2996ff17b4\">\n",
       "    <div class=\"colab-df-container\">\n",
       "      <div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Premise List</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>The physician misdiagnosed the patient.What ha...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>The elderly woman suffered a stroke.What happe...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>The pond froze over for the winter.What happen...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>The offender violated parole.What happened as ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>I poured water on my sleeping friend.What happ...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>\n",
       "      <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-fd473dc5-734e-4663-a094-ac2996ff17b4')\"\n",
       "              title=\"Convert this dataframe to an interactive table.\"\n",
       "              style=\"display:none;\">\n",
       "        \n",
       "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
       "       width=\"24px\">\n",
       "    <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n",
       "    <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n",
       "  </svg>\n",
       "      </button>\n",
       "      \n",
       "  <style>\n",
       "    .colab-df-container {\n",
       "      display:flex;\n",
       "      flex-wrap:wrap;\n",
       "      gap: 12px;\n",
       "    }\n",
       "\n",
       "    .colab-df-convert {\n",
       "      background-color: #E8F0FE;\n",
       "      border: none;\n",
       "      border-radius: 50%;\n",
       "      cursor: pointer;\n",
       "      display: none;\n",
       "      fill: #1967D2;\n",
       "      height: 32px;\n",
       "      padding: 0 0 0 0;\n",
       "      width: 32px;\n",
       "    }\n",
       "\n",
       "    .colab-df-convert:hover {\n",
       "      background-color: #E2EBFA;\n",
       "      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
       "      fill: #174EA6;\n",
       "    }\n",
       "\n",
       "    [theme=dark] .colab-df-convert {\n",
       "      background-color: #3B4455;\n",
       "      fill: #D2E3FC;\n",
       "    }\n",
       "\n",
       "    [theme=dark] .colab-df-convert:hover {\n",
       "      background-color: #434B5C;\n",
       "      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
       "      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
       "      fill: #FFFFFF;\n",
       "    }\n",
       "  </style>\n",
       "\n",
       "      <script>\n",
       "        const buttonEl =\n",
       "          document.querySelector('#df-fd473dc5-734e-4663-a094-ac2996ff17b4 button.colab-df-convert');\n",
       "        buttonEl.style.display =\n",
       "          google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
       "\n",
       "        async function convertToInteractive(key) {\n",
       "          const element = document.querySelector('#df-fd473dc5-734e-4663-a094-ac2996ff17b4');\n",
       "          const dataTable =\n",
       "            await google.colab.kernel.invokeFunction('convertToInteractive',\n",
       "                                                     [key], {});\n",
       "          if (!dataTable) return;\n",
       "\n",
       "          const docLinkHtml = 'Like what you see? Visit the ' +\n",
       "            '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
       "            + ' to learn more about interactive tables.';\n",
       "          element.innerHTML = '';\n",
       "          dataTable['output_type'] = 'display_data';\n",
       "          await google.colab.output.renderOutput(dataTable, element);\n",
       "          const docLink = document.createElement('div');\n",
       "          docLink.innerHTML = docLinkHtml;\n",
       "          element.appendChild(docLink);\n",
       "        }\n",
       "      </script>\n",
       "    </div>\n",
       "  </div>\n",
       "  "
      ],
      "text/plain": [
       "                                        Premise List\n",
       "0  The physician misdiagnosed the patient.What ha...\n",
       "1  The elderly woman suffered a stroke.What happe...\n",
       "2  The pond froze over for the winter.What happen...\n",
       "3  The offender violated parole.What happened as ...\n",
       "4  I poured water on my sleeping friend.What happ..."
      ]
     },
     "execution_count": 28,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_result.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "xWz8fA4wgZb0",
    "outputId": "ee5636c4-291c-4ff8-8045-044d36333fb6"
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "\n",
      "\n",
      "Premise:  The physician misdiagnosed the patient.What happened as a RESULT? \n",
      "Response:\n",
      " Choice 1:\n",
      "The patient died.\n",
      "Choice 2: \n",
      "The patient was cured. \n",
      "Answer: Choice 1\n",
      "\n",
      "\n",
      "Premise:  The elderly woman suffered a stroke.What happened as a RESULT? \n",
      "Response:\n",
      " Choice 1:\n",
      "The woman's daughter called the ambulance.\n",
      "\n",
      "Choice 2: \n",
      "The woman was taken to the hospital by her husband. \n",
      "\n",
      "Answer: Choice 1\n",
      "\n",
      "\n",
      "Premise:  The pond froze over for the winter.What happened as a RESULT? \n",
      "Response:\n",
      " Choice 1:\n",
      "People skated on the pond. \n",
      "Choice 2: \n",
      "People brought boats to the pond. \n",
      "Answer: Choice 1\n",
      "\n",
      "\n",
      "Premise:  The offender violated parole.What happened as a RESULT? \n",
      "Response:\n",
      " Choice 1:\n",
      "The offender was sent to prison. \n",
      "Choice 2: \n",
      "The offender committed another crime. \n",
      "\n",
      "Answer: Choice 1\n",
      "\n",
      "\n",
      "Premise:  I poured water on my sleeping friend.What happened as a RESULT? \n",
      "Response:\n",
      " Choice 1:\n",
      "My friend woke up.\n",
      "\n",
      "Choice 2: \n",
      "My friend got a cold. \n",
      "\n",
      "Answer: Choice 1\n",
      "\n",
      "\n",
      "Premise:  It got dark outside.What happened as a RESULT? \n",
      "Response:\n",
      " Choice 1:\n",
      "The lamp was turned on.\n",
      "\n",
      "Choice 2: \n",
      "The sun set. \n",
      "\n",
      "Answer: Choice 1\n",
      "\n",
      "\n",
      "Premise:  The woman's ring slipped off in the shower.What happened as a RESULT? \n",
      "Response:\n",
      " Choice 1:\n",
      "The woman's finger shrunk.\n",
      "\n",
      "Choice 2: \n",
      "The woman's ring was too big.\n",
      "\n",
      "Answer: Choice 2\n",
      "\n",
      "\n",
      "Premise:  The woman's date wanted to look like a gentleman.What happened as a RESULT? \n",
      "Response:\n",
      " Choice 1:\n",
      "The woman didn't have a good time.\n",
      "\n",
      "Choice 2: \n",
      "The man opened the door for her. \n",
      "\n",
      "Answer: Choice 2\n",
      "\n",
      "\n",
      "Premise:  The farmland needed irrigation.What happened as a RESULT? \n",
      "Response:\n",
      " Choice 1:\n",
      "The farmer watered the crops.\n",
      "\n",
      "Choice 2: \n",
      "It rained on the farmland.\n",
      "\n",
      "Answer: Choice 1\n",
      "\n",
      "\n",
      "Premise:  The toddler became cranky.What happened as a RESULT? \n",
      "Response:\n",
      " Choice 1:\n",
      "The toddler was hungry.\n",
      "\n",
      "Choice 2: \n",
      "The toddler saw a scary movie.\n",
      "\n",
      "Answer: Choice 1\n"
     ]
    }
   ],
   "source": [
    "df1 = pd.DataFrame(data)\n",
    "for p in range(df1.shape[0]):\n",
    "  print(\"\\n\")\n",
    "  print(\"Premise: \",df1.iloc[p][0], \"\\nResponse:\\n\", df1.iloc[p][1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "GI3E_77TgsLc"
   },
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "colab": {
   "collapsed_sections": [],
   "provenance": []
  },
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.7"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 1
}
