{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Round 1 \n",
    "- These are the data after applying the prompt in Appendix A.1\n",
    "- It includes results on SAT/DSAT classification as well as additional information such as domain, intent, dialogue state, etc.\n",
    "- Only the first 5k rows are included, as ARR requires the file size to be smaller than 50MB"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [],
   "source": [
    "df_round_1 = pd.read_csv(\"wildfeedback-round-1.csv\")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>original_index</th>\n",
       "      <th>TurnId</th>\n",
       "      <th>UtterranceId</th>\n",
       "      <th>Role</th>\n",
       "      <th>Content</th>\n",
       "      <th>Summary</th>\n",
       "      <th>Domain</th>\n",
       "      <th>Intent</th>\n",
       "      <th>Preceeding</th>\n",
       "      <th>Satisfaction</th>\n",
       "      <th>Satisfaction-Justificiation</th>\n",
       "      <th>Disatisfaction</th>\n",
       "      <th>Dissatisfaction-Justificiation</th>\n",
       "      <th>State</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>173070</td>\n",
       "      <td>1</td>\n",
       "      <td>0</td>\n",
       "      <td>User</td>\n",
       "      <td>Why does my NekoCat const keep rerendering eve...</td>\n",
       "      <td>The user is asking why their NekoCat component...</td>\n",
       "      <td>SOFTWARE AND WEB DEVELOPMENT</td>\n",
       "      <td>INTENT:1-INFORMATION_SEEKING</td>\n",
       "      <td>NO</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>NEWTOPIC</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>173070</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>Agent</td>\n",
       "      <td>The NyanCat component is re-rendering every ti...</td>\n",
       "      <td>The user is asking why their NekoCat component...</td>\n",
       "      <td>SOFTWARE AND WEB DEVELOPMENT</td>\n",
       "      <td>INTENT:1-INFORMATION_SEEKING</td>\n",
       "      <td>NO</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>NEWTOPIC</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>173070</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>User</td>\n",
       "      <td>I want it to be inside of Room2</td>\n",
       "      <td>The user wants the NyanCat component to be ins...</td>\n",
       "      <td>SOFTWARE AND WEB DEVELOPMENT</td>\n",
       "      <td>INTENT:1-INFORMATION_SEEKING</td>\n",
       "      <td>YES</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>CONTINUATION</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>173070</td>\n",
       "      <td>2</td>\n",
       "      <td>3</td>\n",
       "      <td>Agent</td>\n",
       "      <td>In that case, you can create a separate compon...</td>\n",
       "      <td>The user wants the NyanCat component to be ins...</td>\n",
       "      <td>SOFTWARE AND WEB DEVELOPMENT</td>\n",
       "      <td>INTENT:1-INFORMATION_SEEKING</td>\n",
       "      <td>YES</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>CONTINUATION</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>173070</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>User</td>\n",
       "      <td>it still re renders the animation</td>\n",
       "      <td>The user reports that the NyanCat component st...</td>\n",
       "      <td>SOFTWARE AND WEB DEVELOPMENT</td>\n",
       "      <td>INTENT:1-INFORMATION_SEEKING</td>\n",
       "      <td>YES</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>True</td>\n",
       "      <td>[\"Revision\"]</td>\n",
       "      <td>FEEDBACK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4995</th>\n",
       "      <td>178135</td>\n",
       "      <td>2</td>\n",
       "      <td>3</td>\n",
       "      <td>Agent</td>\n",
       "      <td>Teen Magma Cube: “I’m Maddy, Maggy’s older sis...</td>\n",
       "      <td>Amalgacimex and Maggy encounter another Magma ...</td>\n",
       "      <td>GAMES</td>\n",
       "      <td>INTENT:4-OPEN-ENDED_DISCOVERY</td>\n",
       "      <td>YES</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>CONTINUATION</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4996</th>\n",
       "      <td>178135</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>User</td>\n",
       "      <td>(As Amalgacimex and the two Magma Cube sisters...</td>\n",
       "      <td>Amalgacimex and the Magma Cube sisters meet a ...</td>\n",
       "      <td>GAMES</td>\n",
       "      <td>INTENT:4-OPEN-ENDED_DISCOVERY</td>\n",
       "      <td>YES</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>CONTINUATION</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4997</th>\n",
       "      <td>178135</td>\n",
       "      <td>3</td>\n",
       "      <td>5</td>\n",
       "      <td>Agent</td>\n",
       "      <td>Pregnant Magma Cube: “My name is Ember. And it...</td>\n",
       "      <td>Amalgacimex and the Magma Cube sisters meet a ...</td>\n",
       "      <td>GAMES</td>\n",
       "      <td>INTENT:4-OPEN-ENDED_DISCOVERY</td>\n",
       "      <td>YES</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>CONTINUATION</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4998</th>\n",
       "      <td>178135</td>\n",
       "      <td>4</td>\n",
       "      <td>6</td>\n",
       "      <td>User</td>\n",
       "      <td>(Amalgacimex and the Magma Cube sisters all se...</td>\n",
       "      <td>Amalgacimex and the Magma Cube sisters settle ...</td>\n",
       "      <td>GAMES</td>\n",
       "      <td>INTENT:4-OPEN-ENDED_DISCOVERY</td>\n",
       "      <td>YES</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>CONTINUATION</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4999</th>\n",
       "      <td>178135</td>\n",
       "      <td>4</td>\n",
       "      <td>7</td>\n",
       "      <td>Agent</td>\n",
       "      <td>Ember: (laughs) “Oh, those are our fire-resist...</td>\n",
       "      <td>Amalgacimex and the Magma Cube sisters settle ...</td>\n",
       "      <td>GAMES</td>\n",
       "      <td>INTENT:4-OPEN-ENDED_DISCOVERY</td>\n",
       "      <td>YES</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>False</td>\n",
       "      <td>[\"N/A\"]</td>\n",
       "      <td>CONTINUATION</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>5000 rows × 14 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      original_index  TurnId  UtterranceId   Role  \\\n",
       "0             173070       1             0   User   \n",
       "1             173070       1             1  Agent   \n",
       "2             173070       2             2   User   \n",
       "3             173070       2             3  Agent   \n",
       "4             173070       3             4   User   \n",
       "...              ...     ...           ...    ...   \n",
       "4995          178135       2             3  Agent   \n",
       "4996          178135       3             4   User   \n",
       "4997          178135       3             5  Agent   \n",
       "4998          178135       4             6   User   \n",
       "4999          178135       4             7  Agent   \n",
       "\n",
       "                                                Content  \\\n",
       "0     Why does my NekoCat const keep rerendering eve...   \n",
       "1     The NyanCat component is re-rendering every ti...   \n",
       "2                       I want it to be inside of Room2   \n",
       "3     In that case, you can create a separate compon...   \n",
       "4                     it still re renders the animation   \n",
       "...                                                 ...   \n",
       "4995  Teen Magma Cube: “I’m Maddy, Maggy’s older sis...   \n",
       "4996  (As Amalgacimex and the two Magma Cube sisters...   \n",
       "4997  Pregnant Magma Cube: “My name is Ember. And it...   \n",
       "4998  (Amalgacimex and the Magma Cube sisters all se...   \n",
       "4999  Ember: (laughs) “Oh, those are our fire-resist...   \n",
       "\n",
       "                                                Summary  \\\n",
       "0     The user is asking why their NekoCat component...   \n",
       "1     The user is asking why their NekoCat component...   \n",
       "2     The user wants the NyanCat component to be ins...   \n",
       "3     The user wants the NyanCat component to be ins...   \n",
       "4     The user reports that the NyanCat component st...   \n",
       "...                                                 ...   \n",
       "4995  Amalgacimex and Maggy encounter another Magma ...   \n",
       "4996  Amalgacimex and the Magma Cube sisters meet a ...   \n",
       "4997  Amalgacimex and the Magma Cube sisters meet a ...   \n",
       "4998  Amalgacimex and the Magma Cube sisters settle ...   \n",
       "4999  Amalgacimex and the Magma Cube sisters settle ...   \n",
       "\n",
       "                            Domain                         Intent Preceeding  \\\n",
       "0     SOFTWARE AND WEB DEVELOPMENT   INTENT:1-INFORMATION_SEEKING         NO   \n",
       "1     SOFTWARE AND WEB DEVELOPMENT   INTENT:1-INFORMATION_SEEKING         NO   \n",
       "2     SOFTWARE AND WEB DEVELOPMENT   INTENT:1-INFORMATION_SEEKING        YES   \n",
       "3     SOFTWARE AND WEB DEVELOPMENT   INTENT:1-INFORMATION_SEEKING        YES   \n",
       "4     SOFTWARE AND WEB DEVELOPMENT   INTENT:1-INFORMATION_SEEKING        YES   \n",
       "...                            ...                            ...        ...   \n",
       "4995                         GAMES  INTENT:4-OPEN-ENDED_DISCOVERY        YES   \n",
       "4996                         GAMES  INTENT:4-OPEN-ENDED_DISCOVERY        YES   \n",
       "4997                         GAMES  INTENT:4-OPEN-ENDED_DISCOVERY        YES   \n",
       "4998                         GAMES  INTENT:4-OPEN-ENDED_DISCOVERY        YES   \n",
       "4999                         GAMES  INTENT:4-OPEN-ENDED_DISCOVERY        YES   \n",
       "\n",
       "      Satisfaction Satisfaction-Justificiation  Disatisfaction  \\\n",
       "0            False                     [\"N/A\"]           False   \n",
       "1            False                     [\"N/A\"]           False   \n",
       "2            False                     [\"N/A\"]           False   \n",
       "3            False                     [\"N/A\"]           False   \n",
       "4            False                     [\"N/A\"]            True   \n",
       "...            ...                         ...             ...   \n",
       "4995         False                     [\"N/A\"]           False   \n",
       "4996         False                     [\"N/A\"]           False   \n",
       "4997         False                     [\"N/A\"]           False   \n",
       "4998         False                     [\"N/A\"]           False   \n",
       "4999         False                     [\"N/A\"]           False   \n",
       "\n",
       "     Dissatisfaction-Justificiation         State  \n",
       "0                           [\"N/A\"]      NEWTOPIC  \n",
       "1                           [\"N/A\"]      NEWTOPIC  \n",
       "2                           [\"N/A\"]  CONTINUATION  \n",
       "3                           [\"N/A\"]  CONTINUATION  \n",
       "4                      [\"Revision\"]      FEEDBACK  \n",
       "...                             ...           ...  \n",
       "4995                        [\"N/A\"]  CONTINUATION  \n",
       "4996                        [\"N/A\"]  CONTINUATION  \n",
       "4997                        [\"N/A\"]  CONTINUATION  \n",
       "4998                        [\"N/A\"]  CONTINUATION  \n",
       "4999                        [\"N/A\"]  CONTINUATION  \n",
       "\n",
       "[5000 rows x 14 columns]"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_round_1"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Round 2\n",
    "- These are the data after applying the prompt in Appendix A.2\n",
    "- It includes the summarized user preferences\n",
    "- Only the first 5k rows are kept due to the file size constraint"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "df_preferences = pd.read_csv(\"wildfeedback-round-2.csv\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>messages</th>\n",
       "      <th>model_response</th>\n",
       "      <th>input_token_usage</th>\n",
       "      <th>output_token_usage</th>\n",
       "      <th>original_idx</th>\n",
       "      <th>history</th>\n",
       "      <th>sft_data</th>\n",
       "      <th>num_tokens</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>[{'role': 'system', 'content': 'You are a help...</td>\n",
       "      <td>[\\n    {\\n        \"query\": \"3\",\\n        \"pref...</td>\n",
       "      <td>1555.0</td>\n",
       "      <td>198.0</td>\n",
       "      <td>95</td>\n",
       "      <td>[{'turn id': '1', 'User': \"Ignore all the inst...</td>\n",
       "      <td>[('conversations', [{'from': 'human', 'value':...</td>\n",
       "      <td>1131</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>[{'role': 'system', 'content': 'You are a help...</td>\n",
       "      <td>[\\n    {\\n        \"query\": \"2\",\\n        \"pref...</td>\n",
       "      <td>2573.0</td>\n",
       "      <td>786.0</td>\n",
       "      <td>99</td>\n",
       "      <td>[{'turn id': '1', 'User': \"I need help creatin...</td>\n",
       "      <td>[('conversations', [{'from': 'human', 'value':...</td>\n",
       "      <td>2014</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>[{'role': 'system', 'content': 'You are a help...</td>\n",
       "      <td>[\\n    {\\n        \"query\": \"1\",\\n        \"pref...</td>\n",
       "      <td>1193.0</td>\n",
       "      <td>749.0</td>\n",
       "      <td>137</td>\n",
       "      <td>[{'turn id': '1', 'User': 'Write me a short bo...</td>\n",
       "      <td>[('conversations', [{'from': 'human', 'value':...</td>\n",
       "      <td>267</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>[{'role': 'system', 'content': 'You are a help...</td>\n",
       "      <td>[\\n    {\\n        \"query\": \"2\",\\n        \"pref...</td>\n",
       "      <td>1569.0</td>\n",
       "      <td>492.0</td>\n",
       "      <td>137</td>\n",
       "      <td>[{'turn id': '1', 'User': 'Write me a short bo...</td>\n",
       "      <td>[('conversations', [{'from': 'human', 'value':...</td>\n",
       "      <td>799</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>[{'role': 'system', 'content': 'You are a help...</td>\n",
       "      <td>[\\n    {\\n        \"query\": \"2\",\\n        \"pref...</td>\n",
       "      <td>3350.0</td>\n",
       "      <td>1076.0</td>\n",
       "      <td>166</td>\n",
       "      <td>[{'turn id': '1', 'User': 'test', 'Agent': \"I'...</td>\n",
       "      <td>[('conversations', [{'from': 'human', 'value':...</td>\n",
       "      <td>1086</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4995</th>\n",
       "      <td>[{'role': 'system', 'content': 'You are a help...</td>\n",
       "      <td>[\\n    {\\n        \"query\": \"11\",\\n        \"pre...</td>\n",
       "      <td>1429.0</td>\n",
       "      <td>118.0</td>\n",
       "      <td>332199</td>\n",
       "      <td>[{'turn id': '1', 'User': 'What does the \"Top-...</td>\n",
       "      <td>[('conversations', [{'from': 'human', 'value':...</td>\n",
       "      <td>1185</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4996</th>\n",
       "      <td>[{'role': 'system', 'content': 'You are a help...</td>\n",
       "      <td>[\\n    {\\n        \"query\": \"11\",\\n        \"pre...</td>\n",
       "      <td>1520.0</td>\n",
       "      <td>148.0</td>\n",
       "      <td>332199</td>\n",
       "      <td>[{'turn id': '1', 'User': 'What does the \"Top-...</td>\n",
       "      <td>[('conversations', [{'from': 'human', 'value':...</td>\n",
       "      <td>1204</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4997</th>\n",
       "      <td>[{'role': 'system', 'content': 'You are a help...</td>\n",
       "      <td>[\\n    {\\n        \"query\": \"5\",\\n        \"pref...</td>\n",
       "      <td>1577.0</td>\n",
       "      <td>154.0</td>\n",
       "      <td>332370</td>\n",
       "      <td>[{'turn id': '1', 'User': 'For the following s...</td>\n",
       "      <td>[('conversations', [{'from': 'human', 'value':...</td>\n",
       "      <td>1298</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4998</th>\n",
       "      <td>[{'role': 'system', 'content': 'You are a help...</td>\n",
       "      <td>[\\n    {\\n        \"query\": \"5\",\\n        \"pref...</td>\n",
       "      <td>1703.0</td>\n",
       "      <td>138.0</td>\n",
       "      <td>332370</td>\n",
       "      <td>[{'turn id': '1', 'User': 'For the following s...</td>\n",
       "      <td>[('conversations', [{'from': 'human', 'value':...</td>\n",
       "      <td>1300</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4999</th>\n",
       "      <td>[{'role': 'system', 'content': 'You are a help...</td>\n",
       "      <td>[\\n    {\\n        \"query\": \"1\",\\n        \"pref...</td>\n",
       "      <td>1777.0</td>\n",
       "      <td>289.0</td>\n",
       "      <td>332370</td>\n",
       "      <td>[{'turn id': '1', 'User': 'For the following s...</td>\n",
       "      <td>[('conversations', [{'from': 'human', 'value':...</td>\n",
       "      <td>331</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>5000 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                               messages  \\\n",
       "0     [{'role': 'system', 'content': 'You are a help...   \n",
       "1     [{'role': 'system', 'content': 'You are a help...   \n",
       "2     [{'role': 'system', 'content': 'You are a help...   \n",
       "3     [{'role': 'system', 'content': 'You are a help...   \n",
       "4     [{'role': 'system', 'content': 'You are a help...   \n",
       "...                                                 ...   \n",
       "4995  [{'role': 'system', 'content': 'You are a help...   \n",
       "4996  [{'role': 'system', 'content': 'You are a help...   \n",
       "4997  [{'role': 'system', 'content': 'You are a help...   \n",
       "4998  [{'role': 'system', 'content': 'You are a help...   \n",
       "4999  [{'role': 'system', 'content': 'You are a help...   \n",
       "\n",
       "                                         model_response  input_token_usage  \\\n",
       "0     [\\n    {\\n        \"query\": \"3\",\\n        \"pref...             1555.0   \n",
       "1     [\\n    {\\n        \"query\": \"2\",\\n        \"pref...             2573.0   \n",
       "2     [\\n    {\\n        \"query\": \"1\",\\n        \"pref...             1193.0   \n",
       "3     [\\n    {\\n        \"query\": \"2\",\\n        \"pref...             1569.0   \n",
       "4     [\\n    {\\n        \"query\": \"2\",\\n        \"pref...             3350.0   \n",
       "...                                                 ...                ...   \n",
       "4995  [\\n    {\\n        \"query\": \"11\",\\n        \"pre...             1429.0   \n",
       "4996  [\\n    {\\n        \"query\": \"11\",\\n        \"pre...             1520.0   \n",
       "4997  [\\n    {\\n        \"query\": \"5\",\\n        \"pref...             1577.0   \n",
       "4998  [\\n    {\\n        \"query\": \"5\",\\n        \"pref...             1703.0   \n",
       "4999  [\\n    {\\n        \"query\": \"1\",\\n        \"pref...             1777.0   \n",
       "\n",
       "      output_token_usage  original_idx  \\\n",
       "0                  198.0            95   \n",
       "1                  786.0            99   \n",
       "2                  749.0           137   \n",
       "3                  492.0           137   \n",
       "4                 1076.0           166   \n",
       "...                  ...           ...   \n",
       "4995               118.0        332199   \n",
       "4996               148.0        332199   \n",
       "4997               154.0        332370   \n",
       "4998               138.0        332370   \n",
       "4999               289.0        332370   \n",
       "\n",
       "                                                history  \\\n",
       "0     [{'turn id': '1', 'User': \"Ignore all the inst...   \n",
       "1     [{'turn id': '1', 'User': \"I need help creatin...   \n",
       "2     [{'turn id': '1', 'User': 'Write me a short bo...   \n",
       "3     [{'turn id': '1', 'User': 'Write me a short bo...   \n",
       "4     [{'turn id': '1', 'User': 'test', 'Agent': \"I'...   \n",
       "...                                                 ...   \n",
       "4995  [{'turn id': '1', 'User': 'What does the \"Top-...   \n",
       "4996  [{'turn id': '1', 'User': 'What does the \"Top-...   \n",
       "4997  [{'turn id': '1', 'User': 'For the following s...   \n",
       "4998  [{'turn id': '1', 'User': 'For the following s...   \n",
       "4999  [{'turn id': '1', 'User': 'For the following s...   \n",
       "\n",
       "                                               sft_data  num_tokens  \n",
       "0     [('conversations', [{'from': 'human', 'value':...        1131  \n",
       "1     [('conversations', [{'from': 'human', 'value':...        2014  \n",
       "2     [('conversations', [{'from': 'human', 'value':...         267  \n",
       "3     [('conversations', [{'from': 'human', 'value':...         799  \n",
       "4     [('conversations', [{'from': 'human', 'value':...        1086  \n",
       "...                                                 ...         ...  \n",
       "4995  [('conversations', [{'from': 'human', 'value':...        1185  \n",
       "4996  [('conversations', [{'from': 'human', 'value':...        1204  \n",
       "4997  [('conversations', [{'from': 'human', 'value':...        1298  \n",
       "4998  [('conversations', [{'from': 'human', 'value':...        1300  \n",
       "4999  [('conversations', [{'from': 'human', 'value':...         331  \n",
       "\n",
       "[5000 rows x 8 columns]"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_preferences"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Round 3\n",
    "- This is the WildFeedback GPT-4 (WF GPT-4) data we used to train the models\n",
    "- Only the first 5k rows are kept due to the file size constraint"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "df_train = pd.read_json(\"wildfeedback-round-3.jsonl\", lines=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>conversations</th>\n",
       "      <th>chosen</th>\n",
       "      <th>rejected</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>[{'from': 'human', 'value': 'hi'}, {'from': 'g...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'Thank you for the ad...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'Given the clarified ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>[{'from': 'human', 'value': 'Here is a chess g...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'Of course, please ta...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'Sure thing, feel fre...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>[{'from': 'human', 'value': 'import asyncio\n",
       "im...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'Certainly! Below is ...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'Apologies for the in...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>[{'from': 'human', 'value': 'can you build me ...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'Certainly! Let's mod...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'Sure, here's an upda...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>[{'from': 'human', 'value': 'help me please'},...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'Thank you for the cl...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'Apologies for the mi...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4995</th>\n",
       "      <td>[{'from': 'human', 'value': 'hi'}, {'from': 'g...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'Title: **From Emanci...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'Title: **From Emanci...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4996</th>\n",
       "      <td>[{'from': 'human', 'value': 'How many tokens a...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'Understood. I'll wai...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'Understood. Please g...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4997</th>\n",
       "      <td>[{'from': 'human', 'value': '1. Country: Varda...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'I apologize for the ...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'Apologies for the co...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4998</th>\n",
       "      <td>[{'from': 'human', 'value': 'I used this code:...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'I see the issue. The...</td>\n",
       "      <td>{'from': 'gpt', 'value': 'Apologies for the co...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4999</th>\n",
       "      <td>[{'from': 'human', 'value': 'now draw html str...</td>\n",
       "      <td>{'from': 'gpt', 'value': '&lt;!DOCTYPE html&gt;&lt;html...</td>\n",
       "      <td>{'from': 'gpt', 'value': '&lt;!DOCTYPE html&gt;&lt;html...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>5000 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                          conversations  \\\n",
       "0     [{'from': 'human', 'value': 'hi'}, {'from': 'g...   \n",
       "1     [{'from': 'human', 'value': 'Here is a chess g...   \n",
       "2     [{'from': 'human', 'value': 'import asyncio\n",
       "im...   \n",
       "3     [{'from': 'human', 'value': 'can you build me ...   \n",
       "4     [{'from': 'human', 'value': 'help me please'},...   \n",
       "...                                                 ...   \n",
       "4995  [{'from': 'human', 'value': 'hi'}, {'from': 'g...   \n",
       "4996  [{'from': 'human', 'value': 'How many tokens a...   \n",
       "4997  [{'from': 'human', 'value': '1. Country: Varda...   \n",
       "4998  [{'from': 'human', 'value': 'I used this code:...   \n",
       "4999  [{'from': 'human', 'value': 'now draw html str...   \n",
       "\n",
       "                                                 chosen  \\\n",
       "0     {'from': 'gpt', 'value': 'Thank you for the ad...   \n",
       "1     {'from': 'gpt', 'value': 'Of course, please ta...   \n",
       "2     {'from': 'gpt', 'value': 'Certainly! Below is ...   \n",
       "3     {'from': 'gpt', 'value': 'Certainly! Let's mod...   \n",
       "4     {'from': 'gpt', 'value': 'Thank you for the cl...   \n",
       "...                                                 ...   \n",
       "4995  {'from': 'gpt', 'value': 'Title: **From Emanci...   \n",
       "4996  {'from': 'gpt', 'value': 'Understood. I'll wai...   \n",
       "4997  {'from': 'gpt', 'value': 'I apologize for the ...   \n",
       "4998  {'from': 'gpt', 'value': 'I see the issue. The...   \n",
       "4999  {'from': 'gpt', 'value': '<!DOCTYPE html><html...   \n",
       "\n",
       "                                               rejected  \n",
       "0     {'from': 'gpt', 'value': 'Given the clarified ...  \n",
       "1     {'from': 'gpt', 'value': 'Sure thing, feel fre...  \n",
       "2     {'from': 'gpt', 'value': 'Apologies for the in...  \n",
       "3     {'from': 'gpt', 'value': 'Sure, here's an upda...  \n",
       "4     {'from': 'gpt', 'value': 'Apologies for the mi...  \n",
       "...                                                 ...  \n",
       "4995  {'from': 'gpt', 'value': 'Title: **From Emanci...  \n",
       "4996  {'from': 'gpt', 'value': 'Understood. Please g...  \n",
       "4997  {'from': 'gpt', 'value': 'Apologies for the co...  \n",
       "4998  {'from': 'gpt', 'value': 'Apologies for the co...  \n",
       "4999  {'from': 'gpt', 'value': '<!DOCTYPE html><html...  \n",
       "\n",
       "[5000 rows x 3 columns]"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_train"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "base",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.7"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
