{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "0428ec8b",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-07-25T02:28:04.394540Z",
     "start_time": "2023-07-25T02:28:04.096950Z"
    }
   },
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import json"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "dfa0c8fc",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-07-25T02:29:05.486156Z",
     "start_time": "2023-07-25T02:29:05.462717Z"
    }
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>input</th>\n",
       "      <th>output</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>Premise :My body cast a shadow over the grass....</td>\n",
       "      <td>Choice 1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>Premise :The woman tolerated her friend's diff...</td>\n",
       "      <td>Choice 1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>Premise :The women met for coffee.What was the...</td>\n",
       "      <td>Choice 1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>Premise :The runner wore shorts.What was the C...</td>\n",
       "      <td>Choice 1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>Premise :The guests of the party hid behind th...</td>\n",
       "      <td>Choice 1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>393</th>\n",
       "      <td>Premise :The man wanted to save money.What hap...</td>\n",
       "      <td>Choice 1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>394</th>\n",
       "      <td>Premise :The girl desired her parent's approva...</td>\n",
       "      <td>Choice 1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>395</th>\n",
       "      <td>Premise :The truck crashed into the motorcycle...</td>\n",
       "      <td>Choice 2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>396</th>\n",
       "      <td>Premise :The swimmer won the race.What happene...</td>\n",
       "      <td>Choice 1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>397</th>\n",
       "      <td>Premise :The print on the brochure was tiny.Wh...</td>\n",
       "      <td>Choice 1</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>398 rows × 2 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                 input    output\n",
       "0    Premise :My body cast a shadow over the grass....  Choice 1\n",
       "1    Premise :The woman tolerated her friend's diff...  Choice 1\n",
       "2    Premise :The women met for coffee.What was the...  Choice 1\n",
       "3    Premise :The runner wore shorts.What was the C...  Choice 1\n",
       "4    Premise :The guests of the party hid behind th...  Choice 1\n",
       "..                                                 ...       ...\n",
       "393  Premise :The man wanted to save money.What hap...  Choice 1\n",
       "394  Premise :The girl desired her parent's approva...  Choice 1\n",
       "395  Premise :The truck crashed into the motorcycle...  Choice 2\n",
       "396  Premise :The swimmer won the race.What happene...  Choice 1\n",
       "397  Premise :The print on the brochure was tiny.Wh...  Choice 1\n",
       "\n",
       "[398 rows x 2 columns]"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df = pd.read_csv(\"val.csv\")\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "f35d7f28",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-07-25T02:29:06.269963Z",
     "start_time": "2023-07-25T02:29:06.264595Z"
    }
   },
   "outputs": [],
   "source": [
    "prompt = '''You are given a premise and 2 possible hypotheses (Choice 1 and Choice 2) as input. Select the hypothesis which is more likely to have a causal link to the sentence. \n",
    "If the premise asks for CAUSE:\n",
    "If the premise is more likely to be the result of Choice 1, output Choice 1. Otherwise, output Choice 2.\n",
    "If the premise asks for RESULT:\n",
    "If Choice 1 is more likely to be the result of the premise, output Choice 1. Otherwise, output Choice 2.\n",
    "\n",
    "Example:\n",
    "Premise : My body cast a shadow over the grass.What was the CAUSE of this? \n",
    "Choice 1 :The sun was rising. \n",
    "Choice 2 :The grass was cut. \n",
    "Output : Choice 1 \n",
    "Explanation : The premise asks for CAUSE. Out of the 2 choices, choice 1 describing the position of the sun is more likely to cause a shadow. The grass being cut has no relation.\n",
    "\n",
    "Example: \n",
    "Premise : The elderly woman suffered a stroke.What happened as a RESULT? \n",
    "Choice 1 :The woman's daughter came over to clean her house. \n",
    "Choice 2 :The woman's daughter moved in to take care of her.\n",
    "Output : Choice 2\n",
    "Explanation : The premise asks for RESULT. Choice 2 is more likely to logically follow the premise of the sick elderly woman. There is nothing to suggest cleaning the house.\n",
    "\n",
    "Premise :'''"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "3a510a7b",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-07-25T02:29:08.106271Z",
     "start_time": "2023-07-25T02:29:08.079658Z"
    }
   },
   "outputs": [],
   "source": [
    "ip_col = 'input'\n",
    "df[ip_col] = prompt + df[ip_col]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "2bc22dd9",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-07-25T02:29:13.943990Z",
     "start_time": "2023-07-25T02:29:13.915212Z"
    }
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "count    398.000000\n",
       "mean     236.650754\n",
       "std        4.243369\n",
       "min      228.000000\n",
       "50%      236.000000\n",
       "75%      239.000000\n",
       "80%      240.000000\n",
       "85%      241.000000\n",
       "90%      243.000000\n",
       "99%      247.000000\n",
       "max      249.000000\n",
       "Name: input, dtype: float64"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df[ip_col].str.split(\" \").str.len().describe(percentiles = [.5,.75,.8,.85,.90,.99])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "74bde580",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-07-25T02:29:24.542316Z",
     "start_time": "2023-07-25T02:29:24.494252Z"
    }
   },
   "outputs": [],
   "source": [
    "df.to_csv(\"train_w_inst.csv\", index=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "baadefd3",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python [conda env:root] *",
   "language": "python",
   "name": "conda-root-py"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.7"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
