from UIAgents.Agent_RPA.prompts.general_prompt import INDEX_REPLACEMENT_PROMPT, ACTIONS_PROMPT, ASK_MLLM_PROMPT

OUTPUT_EXAMPLE = """
[Output Example]
Example 1 (With index):
{{
  "thought": "The hardcoded input is targeting a field to name a note. The UI list shows a field with the placeholder “my_note”, described as part of a dialog.",
  "soft_action": "kwargs = {{\"type\": \"input\", \"text\": \"my_note\", \"target_description\": \"Input field for the file name in the note creation dialog\"}}\nindex = env_op.find_element(**kwargs)\nenv_op.type(index, 'ordered_items', True)\n"
}}

Example 2 (Without index):
{{
  "thought": "...",
  "soft_action": "env_op.scroll('up')"
}}

Example 3 (MLLM needed):
{{
  "thought": "...",
  "soft_action": "env_op.ask_mllm('Based on the screen, answer how many notes are there in the note list. plain text, no extra content.')"
}}
"""

PROMPT_TEMPLATE = ("""
[system]
Generate a Soft-coded Action by dynamically replacing the hardcoded index in the given action with an element-matching strategy.
Before that, determine from the observation and action justification whether the original action can be decided by mechanical element matching; if not, consider using `ask_mllm()` for combined visual and language reasoning.
MLLMs are inherently random, so `ask_mllm` may not always return expected results. To ensure stability, use strict prompt constraints or minimize their usage.

If using `find_element()`, ensure that:
1. The revised logic maintains the same intended behavior as the original hardcoded action;
2. If index is not required, do not use the find_element method.
"""
+ INDEX_REPLACEMENT_PROMPT
+ "\n[ADMISSIBLE ACTIONS]"
+ "\n# Use these only when appropriate based on the original action and UI context:" + ACTIONS_PROMPT
+ "\n# You may additionally consider the following smart action patterns if relevant:" + ASK_MLLM_PROMPT
+ """
[Output Format]
Your output must include two sections:
### Thought:
Provide a brief explanation (under 30 words) for how you constructed the dynamic UI element matching parameters (i.e. the `kwargs`).
### Soft-coded Action:
- If not using `find_element()`: write new code in proper way.
- If the original action requires a UI element index:
Replace the hardcoded index with a dynamic lookup using `env_op.find_element`. You can output these three lines of code:
```python
kwargs = {{...}}  # A dictionary describing the target UI element
index = env_op.find_element(**kwargs)  # Use env_op to locate the element dynamically
env_op.xxx(...)  # Replace xxx with the correct action using the index
```
- If the original action does NOT require a index: Simply output the soft-coded action without calling env_op.find_element.
"""
+ OUTPUT_EXAMPLE
+ """
**User goal/request**: {goal}

[Input Provided]
- Observations Analysis:
{obs_analysis}

- Action Justification:
{action_reason}

- Hard Coded Action:
{action}

- Action Related element:
{related_element}

- Current UI elements list:
{ui_info_str}
""")


def get_action_translator_prompt(
  goal: str,
  obs_analysis: str,
  action_reason: str,
  action: str,
  related_element: str,
  ui_info_str: str = "",
) -> str:
  return PROMPT_TEMPLATE.format(
    goal=goal,
    obs_analysis=obs_analysis,
    action_reason=action_reason,
    action=action,
    related_element=related_element,
    ui_info_str=ui_info_str if ui_info_str else 'Not available',
  )