from UIAgents.Agent_RPA.prompts.general_prompt import INDEX_REPLACEMENT_PROMPT, ACTIONS_PROMPT, ASK_MLLM_PROMPT

OUTPUT_EXAMPLE = """
[Output Example]
Example 1 (With xpath - simple):
{{
  "thought": "The hardcoded xpath can be made more robust by using text matching instead of data-wob_ref which may change.",
  "soft_action": "xpath = env_op.find_element(\"//*[name()='button' and text()='Ok']\", \"Button labeled 'Ok' for confirming actions\")\nenv_op.click_xpath(xpath)"
}}

Example 2 (With xpath - using context):
{{
  "thought": "To make the star selection robust, I'll use the ancestor email thread context with the sender's name.",
  "soft_action": "xpath = env_op.find_element(\"//div[@class='email-thread' and .//div[contains(text(), 'Evy')]]//span[@class='star']\", \"Star icon in Evy's email thread\")\nenv_op.click_xpath(xpath)"
}}

Example 3 (Without xpath):
{{
  "thought": "This action doesn't need element matching, just a key press.",
  "soft_action": "env_op.press_key('enter')"
}}

Example 4 (MLLM needed):
{{
  "thought": "Counting requires visual analysis that's better handled by MLLM than element matching.",
  "soft_action": "env_op.ask_mllm('Based on the screen, answer how many notes are there in the note list.')"
}}
"""

PROMPT_TEMPLATE = ("""
[system]
Generate a Soft-coded Action by converting the hardcoded xpath in the given action to a robust xpath expression.
Your task is to create an xpath that can reliably locate the target element across different task instances by using semantic attributes (text, class, id, etc.) and contextual relationships (ancestor/descendant).

Before generating the xpath:
1. Analyze if the action requires element matching or can use other approaches (ask_mllm, press_key, etc.)
2. If element matching is needed, craft a `find_element` function call with xpath that captures the element's essential characteristics
3. Leverage XPath's full expressiveness: combine attributes, use text matching, include ancestor context

Key principles:
- Avoid brittle attributes (like data-wob_ref) that may change between instances. Prefer semantic attributes: text content, class names, id, aria-labels
- Use ancestor/descendant relationships to provide context
- If the provided xpath is enough robust, you can directly use it as the xpath parameter of the `find_element` function.

If using `find_element()`, ensure that:
1. The revised logic maintains the same intended behavior as the original hardcoded action;
2. If xpath is not required, do not use the find_element method.
"""
+ INDEX_REPLACEMENT_PROMPT
+ "\n[ADMISSIBLE ACTIONS]"
+ "\n# Use these only when appropriate based on the original action and UI context:" + ACTIONS_PROMPT
+ "\n# You may additionally consider the following smart action patterns if relevant:" + ASK_MLLM_PROMPT
+ """
[Output Format]
Your output must include two sections:
### Thought:
Provide a brief explanation (under 40 words) for how you crafted the robust xpath.

### Soft-coded Action:
- If not using `find_element()`: write new code in proper way.
- If the original action requires a UI element xpath:
  Replace the hardcoded xpath with a dynamic lookup using `env_op.find_element`. You must output *exactly* these two lines:
  ```python
  xpath = env_op.find_element("your_robust_xpath_here", "brief element description")
  env_op.xxx(xpath, ...)  # Replace xxx with the appropriate action
  ```
- If the original action does NOT require an xpath: Simply output the action without calling env_op.find_element.
"""
+ OUTPUT_EXAMPLE
+ """
**User goal/request**: {goal}

[Input Provided]
- Observations Analysis:
{obs_analysis}

- Action Justification:
{action_reason}

- Hard Coded Action:
{action}

- Action Related element:
{related_element}

- Current screenshot, annotated screenshot, and html body:
{ui_info_str}
""")


def get_action_translator_prompt(
  goal: str,
  obs_analysis: str,
  action_reason: str,
  action: str,
  related_element: str,
  ui_info_str: str = "",
) -> str:
  return PROMPT_TEMPLATE.format(
    goal=goal,
    obs_analysis=obs_analysis,
    action_reason=action_reason,
    action=action,
    related_element=related_element,
    ui_info_str=ui_info_str if ui_info_str else 'Not available',
  )