OPERATION_GUIDANCE_PROMPT = """
[OPERATION_GUIDANCE]
Follow these guidelines:
- Choose the simplest method.
- In Reddits, clicking the 'Alphabetical' link will lead to a full list of forums.

Action Related:
- Ensure the index for click, type, and hover is visible in OBSERVATION.
- Scroll to reveal hidden UI elements.
- Confirm that a UI element supports the intended action before interacting.
- Every element is clickable by default.
"""

ACTIONS_PREFIX = """
[ADMISSIBLE ACTIONS]
Only use the actions listed below. Do not use any other actions.
Output the correct parameter format, e.g. bool outputs True or False, instead of strings. Output like env_op.stop(answer="") or env_op.stop(""), not env_op.stop(answer: "").
"""

ACTIONS_PROMPT = """
### Page Operation Actions:
env_op.click(id: int, option: str="") # clicks on an element with a specific id on the webpage. If the element has popup options, input the option to select one. You cannot click a checkbox element, and you should click the StaticText above it instead.

env_op.type(id: int, content: str, clear_existing: bool=True, press_enter_after: bool=True) # type the content into the field with id. By default, the existing content in the field will be cleared unless clear_existing is set to False, and the "Enter" key is pressed after typing unless press_enter_after is set to False; Example usage: env_op.type(101, "Hello, World!", clear_existing=True, press_enter_after=True)

env_op.hover(id: int) # hover over an element with id
    
env_op.press(key_comb: str) # simulates the pressing of a key combination on the keyboard (e.g., Ctrl+v)

env_op.scroll(direction: Literal["up", "down"]="down") # scroll the page up or down.

### Tab Management Actions:
env_op.new_tab() # open a new, empty browser tab

env_op.tab_focus(tab_index: int) # switch the browser's focus to a specific tab using its index

env_op.close_tab() # close the currently active tab.

### URL Navigation Actions:
env_op.goto(url: str) # navigate to a specific URL

env_op.go_back() # navigate to the previously viewed page

env_op.go_forward() # navigate to the next page (if a previous 'go_back' action was performed).

### Completion Action:
env_op.stop(answer: str="") # Issue this action when you believe the task is complete. If the objective is to find a text-based answer, provide the answer in the bracket. If you believe the task is impossible to complete, provide the answer="N/A" in the bracket.
"""

FIND_ELEMENT_PROMPT = """
### Get Element Index
env_op.find_element(**kwargs) -> int # Use this function to find an element in the UI list using filtering criteria and return its index. If no matching element is found, the index will be -1.
- Rules for generating `kwargs`:
  - Use find_element only when an index is required (e.g., not for env_op.scroll).
  - Extract all attributes necessary to uniquely identify the element in the current page. Keys must be correct, and values must be fully preserved without modification.
  - Always include target_description: briefly describe the element's role, appearance, position on screen, and any dynamic/contextual content that helps make it unique.
  - For semantic/fuzzy matching: When exact text match is not possible (e.g., parameter value differs from actual UI text), include the `text` attribute for initial exact match attempt, and use `target_description` to indicate semantic matching (e.g., "the link that matches or contains the parameter value").
- `kwargs` Examples:
  - Exact match: target element: "[101] button 'Submit' enabled: True"
    kwargs = {{"type": "button", "text": "Submit", "enabled": True, "target_description": "the button to submit"}}
  - Semantic match: when parameter value might differ from actual UI text
    kwargs = {{"type": "link", "text": parameter_value, "target_description": "the link that matches or contains the parameter value"}}
"""

INDEX_REPLACEMENT_PROMPT = (
  "\n[Index Replacement]\nYou need to use this function to replace the hardcoded `index` value with the index variable generated by the `find_element()`."
  + FIND_ELEMENT_PROMPT
)

ASK_MLLM_PROMPT = ("""
### Ask MLLM to answer one question based on the current page
env_op.ask_mllm(question: str) -> str # Will return the answer in plain text.
# For advanced parsing, you can ask mllm to return a json object, and then use json.loads(answer) to get targets.
# Example:
# answer = env_op.ask_mllm(question="...Return a json object with the name of the reviews as keys and the number of stars as values.")
# json.loads(answer) # {{'name1': '...', 'name2': '...'}}
""")

GET_UI_CONTENT_PROMPT = ("""
### Get Current UI Elements List
env_op.get_ui_content() -> dict - Each key-value pair contains properties of a UI element on the current page.
- Example return:
  {{101: {{'index': 101, 'type': 'button', 'text': 'Submit', 'enabled': True}}, 102: {{'index': 102, 'type': 'button', 'text': 'Cancel', 'enabled': True}}, 103: {{'index': 103, 'type': 'link', 'text': 'Wiki'}}, 'meta': {{'tab': 'Tab 0 (current): Postmill', 'scroll_bar': 'Scroll Bar: All content is visible.', 'url': 'http://ec2-3-16-131-173.us-east-2.compute.amazonaws.com:9999/'}}}}
- The 'meta' key contains the current tab, scroll bar position, and URL of the current page.
- If the full page is not visible, the 'scroll_bar' describes the position of the scroll bar, e.g., 'Scroll Bar: The area above the visible region contains 35% of the total content. The area below the visible region still contains 30% of the total content.'
""")

FUNCTION_ACTIONS_PROMPT = ACTIONS_PREFIX + ACTIONS_PROMPT

FUNCTION_ACTIONS_FIND_ELEMENT_PROMPT = (
  ACTIONS_PREFIX
  + ACTIONS_PROMPT
  + FIND_ELEMENT_PROMPT
  + GET_UI_CONTENT_PROMPT
  + ASK_MLLM_PROMPT
)
