{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "6e38ff87-ac0b-41b9-870d-387ad349ea95",
   "metadata": {},
   "source": [
    "## Method\n",
    "\n",
    "1. Convert html to ax_tree (I modified the [html2axtree script](https://github.com/web-arena-x/agent-model/blob/main/scripts/html/html2axtree.py) such that the ids are numbers).\n",
    "2. Prompt gpt4"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6939cc7c-f1c2-493d-a1bb-9ef40a5f9494",
   "metadata": {},
   "outputs": [],
   "source": [
    "from utils import openai_num_tokens_from_messages"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "141a6802-7e61-44af-8914-450afd914afb",
   "metadata": {},
   "outputs": [],
   "source": [
    "task_instruction = \"\"\"You are a browser. You are given the an accessbility tree that represent the current webpage the user is focusing at. Guess one possible objective of the user, and a reasonable next action.\n",
    "Provide the answer in the following format (including ```):\n",
    "\n",
    "```\n",
    "Objective: {objective}\n",
    "Action: {action}\n",
    "```\"\"\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "033d4142-13e2-4529-9534-a224e01ed42b",
   "metadata": {},
   "outputs": [],
   "source": [
    "action_instruction = \"\"\"The actions the user can perform fall into several categories:\n",
    "\n",
    "Page Operation Actions:\n",
    "`click [id]`: This action clicks on an element with a specific id on the webpage.\n",
    "`type [id] [content] [press_enter_after=0|1]`: Use this to type the content into the field with id. By default, the \"Enter\" key is pressed after typing unless press_enter_after is set to 0.\n",
    "`hover [id]`: Hover over an element with id.\n",
    "`press [key_comb]`:  Simulates the pressing of a key combination on the keyboard (e.g., Ctrl+v).\n",
    "`scroll [direction=down|up]`: Scroll the page up or down.\n",
    "\n",
    "Tab Management Actions:\n",
    "`new_tab`: Open a new, empty browser tab.\n",
    "`tab_focus [tab_index]`: Switch the browser's focus to a specific tab using its index.\n",
    "`close_tab`: Close the currently active tab.\n",
    "\n",
    "URL Navigation Actions:\n",
    "`goto [url]`: Navigate to a specific URL.\n",
    "`go_back`: Navigate to the previously viewed page.\n",
    "`go_forward`: Navigate to the next page (if a previous 'go_back' action was performed).\n",
    "Completion Action:\n",
    "`stop [answer]`: Issue this action when you believe the task is complete. If the objective is to find a text-based answer, provide the answer in the bracket. If you believe the task is impossible to complete, provide the answer as \"N/A\" in the bracket.\"\"\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ed1678e0-3a12-4146-bd6a-e710b6d8b5e5",
   "metadata": {},
   "outputs": [],
   "source": [
    "from bs4 import BeautifulSoup\n",
    "from html2axtree import create_accessibility_tree # TODO: we have a updated version of conversion script\n",
    "\n",
    "def get_info(html, print=False, model='gpt-4-1106-preview'):\n",
    "    soup = BeautifulSoup(html, 'html.parser')\n",
    "    def _f():\n",
    "        _f.cnt += 1\n",
    "        return _f.cnt\n",
    "    _f.cnt = -1\n",
    "    ax_tree = create_accessibility_tree(soup.html, _f)\n",
    "\n",
    "    messages=[\n",
    "        {\"role\": \"system\", \"content\": task_instruction},\n",
    "        {\"role\": \"system\", \"content\": action_instruction},\n",
    "        {\"role\": \"user\", \"content\": print_tree(ax_tree)},\n",
    "    ]\n",
    "    num_tokens = openai_num_tokens_from_messages(messages, model)\n",
    "    if print:\n",
    "        print('num_tokens', num_tokens, f'cost for {model} $', num_tokens / 1000 * 0.01)\n",
    "\n",
    "    return soup, ax_tree, num_tokens, num_tokens / 1000 * 0.01"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "491e2ef0-7dd0-40d3-93b5-f57995bfc687",
   "metadata": {},
   "source": [
    "## Estimate total cost"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "03ffa2d9-540e-48be-a82f-a9f7f5d4e781",
   "metadata": {},
   "outputs": [],
   "source": [
    "from typing import Tuple\n",
    "from tqdm import tqdm\n",
    "from html2axtree import print_tree\n",
    "\n",
    "import gzip\n",
    "f = gzip.open('./en0000-01.warc.gz', 'r')\n",
    "\n",
    "num_tokens = []\n",
    "cost = []\n",
    "cur = ''\n",
    "first = True\n",
    "\n",
    "for line in tqdm(f):\n",
    "    cur += line.decode()\n",
    "    if cur.endswith('\\r\\n\\r\\n\\r\\n'):\n",
    "        try:\n",
    "            body = '\\r\\n\\r\\n'.join(cur.strip().split('\\r\\n\\r\\n')[1:])\n",
    "            if not first:\n",
    "                _, _, num_token, c = get_info(body)\n",
    "                num_tokens.append(num_token)\n",
    "                cost.append(c)\n",
    "            else:\n",
    "                first = False\n",
    "            cur = ''\n",
    "        except Exception as e:\n",
    "            print(e)\n",
    "    if len(cost) > 1000:\n",
    "        break\n",
    "\n",
    "import numpy as np\n",
    "print(np.mean(num_tokens), np.mean(cost))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "3d4ae208-3cd3-48d5-b920-3e659e8525cc",
   "metadata": {},
   "outputs": [],
   "source": [
    "from typing import Tuple\n",
    "from html2axtree import print_tree\n",
    "\n",
    "data = []\n",
    "cur = ''\n",
    "\n",
    "import gzip\n",
    "f = gzip.open('./en0000-01.warc.gz', 'r')\n",
    "\n",
    "def semicolon_to_dict(metadata_list):\n",
    "    metadata_dict = {}\n",
    "    for element in metadata_list:\n",
    "        try:\n",
    "            index = element.index(':')\n",
    "            key, value = element[:index], element[index+2:] # skip ': '\n",
    "            metadata_dict[key] = value\n",
    "        except:\n",
    "            continue\n",
    "\n",
    "    return metadata_dict\n",
    "\n",
    "for line in f:\n",
    "    cur += line.decode()\n",
    "    if cur.endswith('\\r\\n\\r\\n\\r\\n'):\n",
    "        metadata = cur.strip().split('\\r\\n\\r\\n')[0]\n",
    "        body = '\\r\\n\\r\\n'.join(cur.strip().split('\\r\\n\\r\\n')[1:])\n",
    "        metadata = semicolon_to_dict(metadata.split('\\r\\n'))\n",
    "        data.append((metadata, body))\n",
    "        if len(data) > 1:\n",
    "            print(get_info(data[-1][1])[2:])\n",
    "        cur = ''\n",
    "        \n",
    "    if len(data) > 10:\n",
    "        break"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "5dfc0573-9f2e-4585-a6cb-a470c8bf0e6f",
   "metadata": {},
   "source": [
    "## (Subsample tree)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "34346424-1b44-4c5f-a96d-3ce309856319",
   "metadata": {},
   "outputs": [],
   "source": [
    "def annotate_tree(node):\n",
    "    width, height, size = 0, 0, 0\n",
    "    for child in node['children']:\n",
    "        _width, _height, _size = annotate_tree(child)\n",
    "        width += _width\n",
    "        height = max(height, _height)\n",
    "        size += _size\n",
    "\n",
    "    node['width'] = width if len(node['children']) else 1\n",
    "    node['height'] = height + 1\n",
    "    node['size'] = size + 1\n",
    "\n",
    "    return node['width'], node['height'], node['size']\n",
    "\n",
    "annotate_tree(ax_tree)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "05750363-cbf7-499c-a582-e08cd72e4bbf",
   "metadata": {},
   "outputs": [],
   "source": [
    "def print_sub_tree(node, width_lb, width_ub):\n",
    "    if width_lb <= node['width'] <= width_ub:\n",
    "        print(print_tree(node))\n",
    "        input()\n",
    "    else:\n",
    "        for child in node['children']:\n",
    "            print_sub_tree(child, width_lb, width_ub)\n",
    "\n",
    "print_sub_tree(ax_tree, 20, 40)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "d753a8e4-6686-4524-aa4a-039830cdab5c",
   "metadata": {},
   "source": [
    "## Setup openai"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e0b9a5cc-5363-4dc0-ba54-9ea671e1a145",
   "metadata": {},
   "outputs": [],
   "source": [
    "import openai\n",
    "import os\n",
    "openai.api_key = os.environ['OPENAI_API_KEY']\n",
    "OPENAI_MODEL = \"gpt-4-1106-preview\""
   ]
  },
  {
   "cell_type": "markdown",
   "id": "0c53d84d-3200-45a1-9aae-3da5d32787e0",
   "metadata": {},
   "source": [
    "### Example 1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "7554ad76-ba95-42ba-a9f3-2c54358fb45e",
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "print(json.dumps(data[3][0], indent=2))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "fa687132-d042-4ce9-b8d0-006a16ec6ed8",
   "metadata": {},
   "outputs": [],
   "source": [
    "soup = BeautifulSoup(data[3][1], 'html.parser')\n",
    "def _f():\n",
    "    _f.cnt += 1\n",
    "    return _f.cnt\n",
    "_f.cnt = -1\n",
    "ax_tree = create_accessibility_tree(soup.html, _f)\n",
    "# TODO: \n",
    "messages=[\n",
    "    {\"role\": \"system\", \"content\": task_instruction},\n",
    "    {\"role\": \"system\", \"content\": action_instruction},\n",
    "    {\"role\": \"user\", \"content\": print_tree(ax_tree)},\n",
    "]\n",
    "num_tokens = openai_num_tokens_from_messages(messages, 'gpt-4-1106-preview')\n",
    "print('num_tokens', num_tokens, 'cost $', num_tokens / 1000 * 0.01)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f5583922-a14a-4876-9a5d-76cc6d4f0f46",
   "metadata": {},
   "outputs": [],
   "source": [
    "response = openai.ChatCompletion.create(\n",
    "    model=OPENAI_MODEL,\n",
    "    messages=messages,\n",
    "    temperature=0.2,\n",
    ")\n",
    "\n",
    "print(response[\"choices\"][0][\"message\"][\"content\"])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6e1052b8-d804-429c-a4e7-2671914b4da6",
   "metadata": {},
   "outputs": [],
   "source": [
    "s = print_tree(ax_tree)\n",
    "print(s[s.index('994')-910:s.index('994')+1000].replace('\\t'*5, '\\t'*1))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4951c8d7-883f-4c25-837b-e3f376db5a00",
   "metadata": {},
   "outputs": [],
   "source": [
    "print(s)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "24116d95-5534-477e-b12a-94b1ce2732fc",
   "metadata": {},
   "source": [
    "### Example 2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "7c0cc5a8-d6d2-4a45-a6aa-33635bde8ff4",
   "metadata": {},
   "outputs": [],
   "source": [
    "soup = BeautifulSoup(data[5][1], 'html.parser')\n",
    "def _f():\n",
    "    _f.cnt += 1\n",
    "    return _f.cnt\n",
    "_f.cnt = -1\n",
    "ax_tree = create_accessibility_tree(soup.html, _f)\n",
    "\n",
    "messages=[\n",
    "    {\"role\": \"system\", \"content\": task_instruction},\n",
    "    {\"role\": \"system\", \"content\": action_instruction},\n",
    "    {\"role\": \"user\", \"content\": print_tree(ax_tree)},\n",
    "]\n",
    "num_tokens = openai_num_tokens_from_messages(messages, 'gpt-4-1106-preview')\n",
    "print('num_tokens', num_tokens, 'cost $', num_tokens / 1000 * 0.01)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e4883452-dfed-44f2-88de-ac095366d186",
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "print(json.dumps(data[5][0], indent=2))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9e592594-1831-4650-b01a-54e6827959c1",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6814e490-d2d4-4327-9cbe-d618ee39889f",
   "metadata": {},
   "outputs": [],
   "source": [
    "response = openai.ChatCompletion.create(\n",
    "    model=OPENAI_MODEL,\n",
    "    messages=messages,\n",
    "    temperature=0.2,\n",
    ")\n",
    "\n",
    "print(response[\"choices\"][0][\"message\"][\"content\"])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d2090835-8284-4ef4-b0d5-0910a165c044",
   "metadata": {},
   "outputs": [],
   "source": [
    "with open('tmp.html', 'w') as f:\n",
    "    print(soup.html, file=f)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "2848f9bf-4a4f-40a6-8409-1f685d5f5b3b",
   "metadata": {},
   "source": [
    "### Example 3"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "44fd1fee-39af-44ea-8b04-7774eaf26c2a",
   "metadata": {},
   "outputs": [],
   "source": [
    "soup = BeautifulSoup(data[6][1], 'html.parser')\n",
    "def _f():\n",
    "    _f.cnt += 1\n",
    "    return _f.cnt\n",
    "_f.cnt = -1\n",
    "ax_tree = create_accessibility_tree(soup.html, _f)\n",
    "\n",
    "messages=[\n",
    "    {\"role\": \"system\", \"content\": task_instruction},\n",
    "    {\"role\": \"system\", \"content\": action_instruction},\n",
    "    {\"role\": \"user\", \"content\": print_tree(ax_tree)},\n",
    "]\n",
    "num_tokens = openai_num_tokens_from_messages(messages, 'gpt-4-1106-preview')\n",
    "print('num_tokens', num_tokens, 'cost $', num_tokens / 1000 * 0.01)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f09896bf-929f-44cc-b20d-cc76defba20a",
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "print(json.dumps(data[6][0], indent=2))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d52dff58-37d9-4d6a-82ee-a28c465e727a",
   "metadata": {},
   "outputs": [],
   "source": [
    "response = openai.ChatCompletion.create(\n",
    "    model=OPENAI_MODEL,\n",
    "    messages=messages,\n",
    "    temperature=0.2,\n",
    ")\n",
    "\n",
    "print(response[\"choices\"][0][\"message\"][\"content\"])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "44cfac4d-47d2-4605-9bac-9720900f2e9a",
   "metadata": {},
   "outputs": [],
   "source": [
    "s = print_tree(ax_tree)\n",
    "print(s[s.index('442')-910:s.index('442')+1000].replace('\\t'*5, '\\t'*1))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "006e1c18-f0ed-4a5d-804a-4232f68ab90b",
   "metadata": {},
   "outputs": [],
   "source": [
    "with open('tmp.html', 'w') as f:\n",
    "    print(soup.html, file=f)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6674b719-8bff-4f6e-9b0a-6a9bed91ea54",
   "metadata": {},
   "outputs": [],
   "source": [
    "for i in range(1, len(data)):\n",
    "    soup = BeautifulSoup(data[i][1], 'html.parser')\n",
    "    ax_tree = create_accessibility_tree(soup.html, _f)\n",
    "    # TODO: \n",
    "    messages=[\n",
    "        {\"role\": \"system\", \"content\": task_instruction},\n",
    "        {\"role\": \"system\", \"content\": action_instruction},\n",
    "        {\"role\": \"user\", \"content\": print_tree(ax_tree)},\n",
    "    ]\n",
    "    num_tokens = openai_num_tokens_from_messages(messages, 'gpt-4-1106-preview')\n",
    "    print(i)\n",
    "    print('num_tokens', num_tokens, 'cost $', num_tokens / 1000 * 0.01)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "0a514deb-c673-4d9b-9b04-5186f92c0916",
   "metadata": {},
   "source": [
    "## Pros\n",
    "\n",
    "1. Method is simple: thanks for 128k context window, we can just dump the whole ax tree into it!\n",
    "\n",
    "## Cons\n",
    "\n",
    "1. Cost issue: every inference cost about 0.5 - 1 usd\n",
    "2. Diversity issue (?) probably can only get one datapoint from one website. Might not be a issue since we have a lot of website\n",
    "3. Objective will be relative simple and action will be kind of trivial?"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "3a080811-e57f-4104-b408-6a58b277e86b",
   "metadata": {},
   "source": [
    "## 11/27 Meeting with b\n",
    "\n",
    "1. axtree generated by chrome might be a lot more concise, compared to the one we \"converted\" above (TODO: ask b for updated conversion script)\n",
    "2. diversity in data matters -> instead of fetching the whole page in prompt, we maybe should do some subsampling to save cost. (TODO: figure out how to do meaningful subsampling? (1) split the axtree into k part and sample one of them (2) load html to DOM and use in-view-port function to extract the current page as a meaningful subsample) (3) sample number lines from, say n ~ N(150, 10), and then split html into block of n lines and sample one block to parse into axtree\n",
    "\n",
    "```\n",
    "mean, std = 125, 50\n",
    "while True:\n",
    "    gaussian_number = np.random.normal(mean, std)\n",
    "    if 50 <= gaussian_number <= 150:\n",
    "        break\n",
    "    random_number = np.random.randint(1, int(gaussian_number) + 1)\n",
    "```\n",
    "\n",
    "3. After subsampling should be able to test out GPT 3.5\n",
    "4. See if model is able to generate history action intention (non-grounded bc we don't have past axtree observations)\n",
    "5. A side note is that right now the generated objective & action is rly grounded in the current page i.e. it might not be diverse enough (all generated objective & action pairs are easy)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "f70fada7-4f97-4986-9745-6f2f25c89c64",
   "metadata": {},
   "source": [
    "### Better html 2 axtree"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "509abba8-ba60-433e-8849-5655d557ce25",
   "metadata": {},
   "outputs": [],
   "source": [
    "!python3 test.py"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5a15baaf-b989-4c34-874b-ee853d1a533a",
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "with open('tmp.json', 'r') as f:\n",
    "    res = json.load(f)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "cd2c3fa7-4fe7-4be8-9efb-09093dd75933",
   "metadata": {},
   "outputs": [],
   "source": [
    "for i in range(1, len(res)+1):\n",
    "    messages=[\n",
    "        {\"role\": \"system\", \"content\": task_instruction},\n",
    "        {\"role\": \"system\", \"content\": action_instruction},\n",
    "        {\"role\": \"user\", \"content\": res[i-1]},\n",
    "    ]\n",
    "    num_tokens = openai_num_tokens_from_messages(messages, 'gpt-4-1106-preview')\n",
    "    print(i)\n",
    "    print('num_tokens', num_tokens, 'cost $', num_tokens / 1000 * 0.01)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "5ca4a763-f512-4f87-ace9-b7bb6fd02e72",
   "metadata": {},
   "source": [
    "### New prompt & Generation quality comparision - gpt-4 vs gpt-3.5"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "deebeefb-7f01-4934-af32-34af41d8255e",
   "metadata": {},
   "outputs": [],
   "source": [
    "from utils import openai_num_tokens_from_messages"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b1d22ee5-1702-4571-aec5-077d9aa385c3",
   "metadata": {},
   "outputs": [],
   "source": [
    "# will be formatted later\n",
    "task_instruction = \"\"\"You are a browser. You are given the an accessbility tree that represent the current webpage the user is focusing at. Guess one possible objective of the user, a history of actions of length {history_len} (might be performed in other related pages, like search or login), and the next action that the user should perform. Remember to follow the format below exactly without extra annotation and use number id. Just make up specific information like URLs if you are not sure about it.\n",
    "Provide the answer in the following format (including ```):\n",
    "\n",
    "```\n",
    "Objective: {{objective}}\n",
    "History:\n",
    "{{action1}}\n",
    "{{action2}}\n",
    "{{action3}}\n",
    "...\n",
    "Action:\n",
    "{{next_action}}\n",
    "```\"\"\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "69950259-042e-4674-b481-4088207da75b",
   "metadata": {},
   "outputs": [],
   "source": [
    "action_instruction = \"\"\"The actions the user can perform fall into several categories:\n",
    "\n",
    "Page Operation Actions:\n",
    "`click [id]`: This action clicks on an element with a specific id on the webpage.\n",
    "`type [id] [content] [press_enter_after=0|1]`: Use this to type the content into the field with id. By default, the \"Enter\" key is pressed after typing unless press_enter_after is set to 0.\n",
    "`hover [id]`: Hover over an element with id.\n",
    "`press [key_comb]`:  Simulates the pressing of a key combination on the keyboard (e.g., Ctrl+v).\n",
    "`scroll [direction=down|up]`: Scroll the page up or down.\n",
    "\n",
    "Tab Management Actions:\n",
    "`new_tab`: Open a new, empty browser tab.\n",
    "`tab_focus [tab_index]`: Switch the browser's focus to a specific tab using its index.\n",
    "`close_tab`: Close the currently active tab.\n",
    "\n",
    "URL Navigation Actions:\n",
    "`goto [url]`: Navigate to a specific URL.\n",
    "`go_back`: Navigate to the previously viewed page.\n",
    "`go_forward`: Navigate to the next page (if a previous 'go_back' action was performed).\n",
    "Completion Action:\n",
    "`stop [answer]`: Issue this action when you believe the task is complete. If the objective is to find a text-based answer, provide the answer in the bracket. If you believe the task is impossible to complete, provide the answer as \"N/A\" in the bracket.\"\"\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5d080e25-34af-4e03-b166-c91b42c770ff",
   "metadata": {},
   "outputs": [],
   "source": [
    "for i in range(1, len(data)):\n",
    "    with open(f'htmls/{i}.html', 'w') as f:\n",
    "        print(data[i][1], file=f)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5a1b4846-1f82-403c-b258-f61ad5322984",
   "metadata": {},
   "outputs": [],
   "source": [
    "task_instruction.format(history_len=5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "1a43d519-33d9-4d2a-a837-bd9e637b5d7a",
   "metadata": {},
   "outputs": [],
   "source": [
    "import random\n",
    "for i in range(1, len(res)+1):\n",
    "    print('data', i)\n",
    "    print('-'*10)\n",
    "    history_len = random.randint(3, 10)\n",
    "    print('history_len', history_len)\n",
    "    messages=[\n",
    "        {\"role\": \"system\", \"content\": task_instruction.format(history_len=history_len)},\n",
    "        {\"role\": \"system\", \"content\": action_instruction},\n",
    "        {\"role\": \"user\", \"content\": res[i-1]},\n",
    "    ]\n",
    "    num_tokens = openai_num_tokens_from_messages(messages, 'gpt-4-1106-preview')\n",
    "    print('num_tokens for gpt-4-1106-preview', num_tokens, 'cost $', num_tokens / 1000 * 0.01)\n",
    "    num_tokens = openai_num_tokens_from_messages(messages, 'gpt-3.5-turbo-1106')\n",
    "    print('num_tokens for gpt-3.5-turbo-1106', num_tokens, 'cost $', num_tokens / 1000 * 0.001)\n",
    "    print()\n",
    "\n",
    "    print('gpt-4-1106-preview')\n",
    "    print('-'*10)\n",
    "    try:\n",
    "        response = openai.ChatCompletion.create(\n",
    "            model='gpt-4-1106-preview',\n",
    "            messages=messages,\n",
    "            temperature=0.2,\n",
    "        )\n",
    "        print(response[\"choices\"][0][\"message\"][\"content\"])\n",
    "    except Exception as e:\n",
    "        print(e)\n",
    "    print()\n",
    "\n",
    "    # print('gpt-3.5-turbo-1106')\n",
    "    # print('-'*10)\n",
    "    # try:\n",
    "    #     response = openai.ChatCompletion.create(\n",
    "    #         model='gpt-3.5-turbo-1106',\n",
    "    #         messages=messages,\n",
    "    #         temperature=0.2,\n",
    "    #     )\n",
    "    #     print(response[\"choices\"][0][\"message\"][\"content\"])\n",
    "    # except Exception as e:\n",
    "    #     print(e)\n",
    "    # print()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "925b967a-595a-482c-bfb2-ad6b4f0ff421",
   "metadata": {},
   "outputs": [],
   "source": [
    "print(res[5-1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "91576b37-4771-4532-bb3b-e2943f6cba60",
   "metadata": {},
   "outputs": [],
   "source": [
    "import random\n",
    "for i in range(1, len(res)+1):\n",
    "    print('data', i)\n",
    "    print('-'*10)\n",
    "    history_len = random.randint(3, 10)\n",
    "    print('history_len', history_len)\n",
    "    messages=[\n",
    "        {\"role\": \"system\", \"content\": task_instruction.format(history_len=history_len)},\n",
    "        {\"role\": \"system\", \"content\": action_instruction},\n",
    "        {\"role\": \"user\", \"content\": res[i-1]},\n",
    "    ]\n",
    "    num_tokens = openai_num_tokens_from_messages(messages, 'gpt-4-1106-preview')\n",
    "    print('num_tokens for gpt-4-1106-preview', num_tokens, 'cost $', num_tokens / 1000 * 0.01)\n",
    "    num_tokens = openai_num_tokens_from_messages(messages, 'gpt-3.5-turbo-1106')\n",
    "    print('num_tokens for gpt-3.5-turbo-1106', num_tokens, 'cost $', num_tokens / 1000 * 0.001)\n",
    "    print()\n",
    "\n",
    "    # print('gpt-4-1106-preview')\n",
    "    # print('-'*10)\n",
    "    # try:\n",
    "    #     response = openai.ChatCompletion.create(\n",
    "    #         model='gpt-4-1106-preview',\n",
    "    #         messages=messages,\n",
    "    #         temperature=0.2,\n",
    "    #     )\n",
    "    #     print(response[\"choices\"][0][\"message\"][\"content\"])\n",
    "    # except Exception as e:\n",
    "    #     print(e)\n",
    "    # print()\n",
    "\n",
    "    print('gpt-3.5-turbo-1106')\n",
    "    print('-'*10)\n",
    "    try:\n",
    "        response = openai.ChatCompletion.create(\n",
    "            model='gpt-3.5-turbo-1106',\n",
    "            messages=messages,\n",
    "            temperature=0.2,\n",
    "        )\n",
    "        print(response[\"choices\"][0][\"message\"][\"content\"])\n",
    "    except Exception as e:\n",
    "        print(e)\n",
    "    print()"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "19ae3842-1778-4d4a-9485-d518f13b1740",
   "metadata": {},
   "source": [
    "### Block Subsample"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "af3ecb74-2728-4f0a-91ff-d21a4ae79f26",
   "metadata": {},
   "outputs": [],
   "source": [
    "# will be formatted later\n",
    "task_instruction = \"\"\"You are a browser. You are given the an accessbility tree that represent the current webpage the user is focusing at. Guess one possible objective of the user, a history of actions of length {history_len} (might be performed in other related pages, like search or login), and the next action that the user should perform. Remember to follow the format below exactly without extra annotation and use number id. Just make up specific information like URLs if you are not sure about it.\n",
    "Provide the answer in the following format (including ```):\n",
    "\n",
    "```\n",
    "Objective: {{objective}}\n",
    "History:\n",
    "{{action1}}\n",
    "{{action2}}\n",
    "{{action3}}\n",
    "...\n",
    "Action:\n",
    "{{next_action}}\n",
    "```\"\"\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "cf49f772-23a2-446e-b068-954781b40ea1",
   "metadata": {},
   "outputs": [],
   "source": [
    "action_instruction = \"\"\"The actions the user can perform fall into several categories:\n",
    "\n",
    "Page Operation Actions:\n",
    "`click [id]`: This action clicks on an element with a specific id on the webpage.\n",
    "`type [id] [content] [press_enter_after=0|1]`: Use this to type the content into the field with id. By default, the \"Enter\" key is pressed after typing unless press_enter_after is set to 0.\n",
    "`hover [id]`: Hover over an element with id.\n",
    "`press [key_comb]`:  Simulates the pressing of a key combination on the keyboard (e.g., Ctrl+v).\n",
    "`scroll [direction=down|up]`: Scroll the page up or down.\n",
    "\n",
    "Tab Management Actions:\n",
    "`new_tab`: Open a new, empty browser tab.\n",
    "`tab_focus [tab_index]`: Switch the browser's focus to a specific tab using its index.\n",
    "`close_tab`: Close the currently active tab.\n",
    "\n",
    "URL Navigation Actions:\n",
    "`goto [url]`: Navigate to a specific URL.\n",
    "`go_back`: Navigate to the previously viewed page.\n",
    "`go_forward`: Navigate to the next page (if a previous 'go_back' action was performed).\n",
    "Completion Action:\n",
    "`stop [answer]`: Issue this action when you believe the task is complete. If the objective is to find a text-based answer, provide the answer in the bracket. If you believe the task is impossible to complete, provide the answer as \"N/A\" in the bracket.\"\"\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c078b95f",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5c2a05d3-210d-4d28-b176-d707fa35626d",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "def sample():\n",
    "    mean, std = 125, 50\n",
    "    while True:\n",
    "        gaussian_number = np.random.normal(mean, std)\n",
    "        if 50 <= gaussian_number <= 150:\n",
    "            break\n",
    "    random_number = np.random.randint(1, int(gaussian_number) + 1)\n",
    "    return random_number"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6cc73426-5b31-451d-a18e-8fc781489f81",
   "metadata": {},
   "outputs": [],
   "source": [
    "# low block size\n",
    "for i in range(1, 11):\n",
    "    block_size = 50 #sample()\n",
    "\n",
    "    block_html = []\n",
    "    lines = res[i-1].split('\\n')\n",
    "    for j in range(0, len(lines), block_size):\n",
    "        if j+block_size >= len(lines):\n",
    "            break\n",
    "        block_html.append('\\n'.join(lines[j : j+block_size]))\n",
    "\n",
    "    print('data', i, 'with block size', block_size)\n",
    "    print('number of block', len(block_html))\n",
    "    print('-'*10)\n",
    "\n",
    "    for block in block_html:\n",
    "        print('='*10)\n",
    "        print(block)\n",
    "        print('='*10)\n",
    "\n",
    "        history_len = random.randint(3, 10)\n",
    "        print('history_len', history_len)\n",
    "        messages=[\n",
    "            {\"role\": \"system\", \"content\": task_instruction.format(history_len=history_len)},\n",
    "            {\"role\": \"system\", \"content\": action_instruction},\n",
    "            {\"role\": \"user\", \"content\": block},\n",
    "        ]\n",
    "        num_tokens = openai_num_tokens_from_messages(messages, 'gpt-4-1106-preview')\n",
    "        print('num_tokens for gpt-4-1106-preview', num_tokens, 'cost $', num_tokens / 1000 * 0.01)\n",
    "        num_tokens = openai_num_tokens_from_messages(messages, 'gpt-3.5-turbo-1106')\n",
    "        print('num_tokens for gpt-3.5-turbo-1106', num_tokens, 'cost $', num_tokens / 1000 * 0.001)\n",
    "        print()\n",
    "    \n",
    "        print('gpt-4-1106-preview')\n",
    "        print('-'*10)\n",
    "        try:\n",
    "            response = openai.ChatCompletion.create(\n",
    "                model='gpt-4-1106-preview',\n",
    "                messages=messages,\n",
    "                temperature=0.2,\n",
    "            )\n",
    "            print(response[\"choices\"][0][\"message\"][\"content\"])\n",
    "        except Exception as e:\n",
    "            print(e)\n",
    "        print()\n",
    "    \n",
    "        print('gpt-3.5-turbo-1106')\n",
    "        print('-'*10)\n",
    "        try:\n",
    "            response = openai.ChatCompletion.create(\n",
    "                model='gpt-3.5-turbo-1106',\n",
    "                messages=messages,\n",
    "                temperature=0.2,\n",
    "            )\n",
    "            print(response[\"choices\"][0][\"message\"][\"content\"])\n",
    "        except Exception as e:\n",
    "            print(e)\n",
    "        print()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "fde163f4-cfa0-4046-9899-cf2a80b50806",
   "metadata": {},
   "outputs": [],
   "source": [
    "# high block size\n",
    "for i in range(1, 11):\n",
    "    block_size = 150 #sample()\n",
    "\n",
    "    block_html = []\n",
    "    lines = res[i-1].split('\\n')\n",
    "    for j in range(0, len(lines), block_size):\n",
    "        if j+block_size >= len(lines):\n",
    "            break\n",
    "        block_html.append('\\n'.join(lines[j : j+block_size]))\n",
    "\n",
    "    print('data', i, 'with block size', block_size)\n",
    "    print('number of block', len(block_html))\n",
    "    print('-'*10)\n",
    "\n",
    "    for block in block_html:\n",
    "        print('='*10)\n",
    "        print(block)\n",
    "        print('='*10)\n",
    "\n",
    "        history_len = random.randint(3, 10)\n",
    "        print('history_len', history_len)\n",
    "        messages=[\n",
    "            {\"role\": \"system\", \"content\": task_instruction.format(history_len=history_len)},\n",
    "            {\"role\": \"system\", \"content\": action_instruction},\n",
    "            {\"role\": \"user\", \"content\": block},\n",
    "        ]\n",
    "        num_tokens = openai_num_tokens_from_messages(messages, 'gpt-4-1106-preview')\n",
    "        print('num_tokens for gpt-4-1106-preview', num_tokens, 'cost $', num_tokens / 1000 * 0.01)\n",
    "        num_tokens = openai_num_tokens_from_messages(messages, 'gpt-3.5-turbo-1106')\n",
    "        print('num_tokens for gpt-3.5-turbo-1106', num_tokens, 'cost $', num_tokens / 1000 * 0.001)\n",
    "        print()\n",
    "    \n",
    "        print('gpt-4-1106-preview')\n",
    "        print('-'*10)\n",
    "        try:\n",
    "            response = openai.ChatCompletion.create(\n",
    "                model='gpt-4-1106-preview',\n",
    "                messages=messages,\n",
    "                temperature=0.2,\n",
    "            )\n",
    "            print(response[\"choices\"][0][\"message\"][\"content\"])\n",
    "        except Exception as e:\n",
    "            print(e)\n",
    "        print()\n",
    "    \n",
    "        print('gpt-3.5-turbo-1106')\n",
    "        print('-'*10)\n",
    "        try:\n",
    "            response = openai.ChatCompletion.create(\n",
    "                model='gpt-3.5-turbo-1106',\n",
    "                messages=messages,\n",
    "                temperature=0.2,\n",
    "            )\n",
    "            print(response[\"choices\"][0][\"message\"][\"content\"])\n",
    "        except Exception as e:\n",
    "            print(e)\n",
    "        print()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c3eb10ab-9b10-48f2-8b40-4b7c2a064d4c",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
