import copy
import os
import sys
from typing import Any

import regex
from absl import flags

from .env_operation import EnvOperation
from .prompts.action_translator_prompt import get_action_translator_prompt
from .prompts.breakpoint_analyzer_prompt import get_exec_evaluator_prompt
from .prompts.concluder_prompt import get_concluder_prompt
from .prompts.planner_prompt import get_planner_prompt
from .prompts.summarizer_prompt import get_summarizer_prompt
from .utils import agent_utils, JSON_models
from .utils.JSON_API import OpenAIWrapper
from .utils.JSON_models import ScreenObs, PlannerStepData
from .utils.agent_utils import print_with_color

FLAGS = flags.FLAGS


class Agent_RPA:
  def __init__(
    self,
    env_op: EnvOperation,
    llm: OpenAIWrapper,
    name: str = 'Agent_RPA',
    planner_llm: OpenAIWrapper = None,
    summarizer_llm: OpenAIWrapper = None,
    actiontranslator_llm: OpenAIWrapper = None,
    params_extractor_llm: OpenAIWrapper = None,
  ):
    """Initializes Agent_RPA.

    Args:
      env_op: The environment operation wrapper.
      llm: The main multimodal LLM wrapper (for Concluder, etc.).
      name: The agent name.
      planner_llm: Optional LLM wrapper for Planner Agent. If None, uses main llm.
      summarizer_llm: Optional LLM wrapper for Summarizer Agent. If None, uses main llm.
      actiontranslator_llm: Optional LLM wrapper for ActionTranslator Agent. If None, uses main llm.
      params_extractor_llm: Optional LLM wrapper for Params Extractor. If None, uses main llm.
    """
    self.env_op = env_op
    self.llm = llm
    self.planner_llm = planner_llm if planner_llm is not None else llm
    self.summarizer_llm = summarizer_llm if summarizer_llm is not None else llm
    self.actiontranslator_llm = actiontranslator_llm if actiontranslator_llm is not None else llm
    self.params_extractor_llm = params_extractor_llm if params_extractor_llm is not None else llm
    self.rpa_bank = None
    
    # Set within run_tasks_*.py
    self.cur_task_type = None
    self.cur_task = None  # the current task description
    self.rpa_mode = False  # False for ReAct, True for RPA Verification or RPA Testing
    self.additional_guidelines = ''
    self.action_history = []
    self.reflection = None  # reset in run_tasks_react.py
    self.reflection_history = []
    
    self.record_token = JSON_models.RecordToken()
  
  def reset(self, task_type: str, log_task_path: str, to_init_task: bool = True):
    self.log_task_path = log_task_path
    os.makedirs(self.log_task_path, exist_ok=True)
    
    self.cur_task_type = task_type
    # self.cur_task = task.goal # set in episode_runner.py, after env_op.reset()
    
    if to_init_task:
      # reset to initial state for each ReAct trial
      self.previous_plan = 'You are just starting the task, and no previous plan exists.'
      self.completed_tasks = ['You just started, no plan has been completed yet.']
      self.screen_changes = 'You just started, no actions has been performed yet.'
      self.action_history = []  # store execution_info (get from env_op and summarizer_agent)
      self._action_translation_context = []  # store context for batch action translation
    else:
      self.previous_plan = 'You ran the rpa code generated earlier.'
      # No need to reset completed_tasks. It will be set in run_tasks_rpa.py
      self.screen_changes = 'Because the code was run directly, no screen_changes were recorded. The screen prior to execution was the desktop.'
      # No need to reset action_history and env_op when Breakpoint_Analyzer_Agent output 'Y'
    
    self.flag_done = False
    self.agent_traj = []  # store ReActStepInfo
    
    return len(self.action_history)
  
  def rpa_testing(self) -> JSON_models.RPAExecTraj:
    
    print_with_color('============================================', 'magenta')
    print_with_color(f"Current Stage: {self.rpa_mode}\n", 'magenta')
    
    rpa_dict = self.rpa_bank.rpa_dict
    
    if self.cur_task_type not in rpa_dict:
      print_with_color("rpa doesn't exist", 'magenta')
      return JSON_models.RPAExecTraj()
    
    rpa = rpa_dict[self.cur_task_type]
    # -----start: RPA Verification and Testing
    function_call, env_op_traj, exec_result = self.Execute_rpa_code(
      task=self.cur_task,
      execution_file_path=self.log_task_path,
      rpa=rpa
    )
    print(f'answer return: {exec_result.answer_return}\n')
    
    rpa_exec_traj = JSON_models.RPAExecTraj(
      task=self.cur_task,
      function_call=function_call,
      rpa_code=rpa['rpa_code'],
      exec_result=exec_result,
      action_history=self.env_op.action_history,  # self.action_history
      env_op_traj=env_op_traj,
    )
    self.action_history = rpa_exec_traj.action_history
    self.flag_done = exec_result.done
    return rpa_exec_traj
  
  def step(self) -> JSON_models.ReActStepInfo:
    
    step_n = len(self.action_history) + 1
    print_with_color(f'# Step {step_n}', 'magenta')
    
    # -----start: plan
    planner_result = self.Planner_Agent(
      log_task_path=self.log_task_path,
      goal=self.cur_task,
      step_n=step_n,
      current_obs=self.env_op.cur_obs,
    )
    
    # planner_output = copy.deepcopy(planner_result.data.output)
    planner_output = JSON_models.PlannerOutput_w_soft(**copy.deepcopy(planner_result.data.output).dict())
    # -----end: plan
    
    # -----start: execute code
    traj, exec_result = self.env_op.execute_code(planner_output.code, vars={}, save_path=self.log_task_path)
    action_related_element = traj[-1].related_elements
    exec_feedback = exec_result.exec_feedback
    self.flag_done = exec_result.done
    print_with_color('exec_result', 'magenta')
    print_with_color(exec_result, 'magenta')
    # -----end: execute code
    
    planner_output.soft_action = exec_result.executed_code
    if FLAGS.agent_name == 'agent_rpa':
      is_final_step = 'env_op.stop' in planner_output.soft_action or self.flag_done
      # Collect context for batch action translation (executed before RPA Builder)
      if FLAGS.use_action_translator:
        translation_context = {
          'step_n': step_n,
          'step_data': planner_result.data,
          'related_element': action_related_element,
          'related_index': traj[-1].related_target,
          'is_screen_changed': traj[-1].is_screen_changed,
          'is_final_step': is_final_step,
        }
        self._action_translation_context.append(translation_context)
      if FLAGS.react_soft_action:
        planner_output.soft_action = planner_result.data.output.soft_action
    
    # -----start: summarize
    if self.flag_done:
      self.screen_changes = 'No screen changes.'
      execution_summary = exec_feedback
    else:
      summarizer_result = self.Summarizer_Agent(
        log_task_path=self.log_task_path,
        goal=self.cur_task,
        step_n=step_n,
        step_data=planner_result.data,
        after_obs=self.env_op.cur_obs,
        exec_feedback=exec_feedback,  # exec_result.exec_feedback
      )
      self.screen_changes = summarizer_result.screen_changes
      execution_summary = summarizer_result.execution_summary
    # -----end: summarize
    
    # Whether to include exec_feedback
    if len(self.env_op.action_history):
      execution_info = f"{self.env_op.action_history[-1]}\nExecution Summary: {execution_summary}"
    else:
      execution_info = f"No action has been performed.\nExecution Summary: {execution_summary}"
    
    self.action_history.append(execution_info)
    
    print_with_color('--------------------------------------------', 'magenta')
    print_with_color(f'# Completed Step {step_n}\n', 'magenta')
    
    react_step_info = JSON_models.ReActStepInfo(
      step_n=step_n,
      ui_content=self.env_op.before_obs.ui_content,
      obs_description=planner_output.observation,
      action_reason=planner_output.code_reason,
      action=planner_output.code,
      soft_coded_action=planner_output.soft_action,
      related_elements=action_related_element,
      execution_summary=execution_summary,
      action_step_str=self.action_history[-1] if len(self.action_history) else None,
      exec_step_info=traj[-1],
    )
    self.agent_traj.append(react_step_info)
    
    return react_step_info
  
  def Planner_Agent(
    self,
    log_task_path: str,
    goal: str,
    step_n: int,
    current_obs: ScreenObs,
  ) -> JSON_models.PlannerInteractionResult:
    
    print_with_color('============================================', 'green')
    print_with_color("Current Agent: Planner\n", 'green')
    
    state = f'step-{step_n}_before'
    
    planner_prompt = get_planner_prompt(
      goal=goal,
      previous_plan=self.previous_plan,
      completed_plan=self.completed_tasks[-1],
      action_history=self.action_history,
      ui_content=current_obs.ui_content,
      screen_changes=self.screen_changes,
      reflection=self.reflection,  # Add the result of the previous reflection
      additional_guidelines=self.additional_guidelines,
    )
    agent_utils.write_to_file(file_path=log_task_path, file_name=state + '_planner_prompt.txt', content=planner_prompt)
    
    planner_output, planner_raw_response = self.planner_llm.predict_mm(
      planner_prompt,
      [current_obs.screenshot],
      output_format=JSON_models.PlannerOutput_w_soft if FLAGS.react_soft_action else JSON_models.PlannerOutput
    )
    agent_utils.write_to_file(file_path=log_task_path,
                              file_name=state + '_planner_raw_response.txt',
                              content=planner_raw_response)
    # store step_tokens
    planner_tokens = planner_raw_response.usage
    self.record_token.step = str(step_n)
    self.record_token.agent = 'Planner'
    self.record_token.step_tokens = planner_tokens
    agent_utils.record_cost_tokens(self.record_token)
    agent_utils.write_to_file(file_path=log_task_path, file_name=state + '_planner_output.txt', content=planner_output)
    
    self.previous_plan = planner_output.plan_list
    self.completed_tasks.append(planner_output.completed_tasks)
    
    step_data_pl = PlannerStepData(
      obs=current_obs,
      output=planner_output,
    )
    
    # -----start: print planner_output
    print_with_color(f'Observations:\n{planner_output.observation}\n', 'green')
    if planner_output.consider_reflection:
      print_with_color(f'Reflection Consideration:\n{planner_output.consider_reflection}\n', 'green')
    print_with_color(f'Completed Tasks:\n{planner_output.completed_tasks}\n', 'green')
    print_with_color(f'Plan Justification:\n{planner_output.plan_reason}\n', 'green')
    print_with_color(f'Plan List:\n{planner_output.plan_list}\n', 'green')
    print_with_color(f'Next Action Justification:\n{planner_output.code_reason}\n', 'green')
    print_with_color(f'Action:\n{planner_output.code}\n', 'green')
    if hasattr(planner_output, 'soft_action'):
      print_with_color(f'Soft Action:\n{planner_output.soft_action}\n', 'green')
    sys.stdout.flush()
    # -----end: print planner_output
    
    return JSON_models.PlannerInteractionResult(data=step_data_pl)
  
  def Summarizer_Agent(
    self,
    log_task_path: str,
    goal: str,
    step_n: int,
    step_data: PlannerStepData,
    after_obs: ScreenObs = None,
    exec_feedback: str = None,
  ) -> JSON_models.SummarizerInteractionResult:
    print_with_color('============================================', 'green')
    print_with_color("Current Agent: Summarizer\n", 'green')
    state = f'step-{step_n}_after'  # e.g. 1_before, 2_after
    
    before_screenshot_label = step_data.obs.screenshot.copy()
    after_screenshot_label = after_obs.screenshot.copy()
    agent_utils.add_screenshot_label(before_screenshot_label, 'before')
    agent_utils.add_screenshot_label(after_screenshot_label, 'after')
    agent_utils.store_image(before_screenshot_label, f'step-{step_n}_summarizer_screenshot_before.png',
                            file_path=log_task_path)
    agent_utils.store_image(after_screenshot_label, f'step-{step_n}_summarizer_screenshot_after.png',
                            file_path=log_task_path)
    
    # Handle case where action_history is empty (e.g., when code fails at exec stage)
    if self.env_op.action_history:
      action_info = self.env_op.action_history[-1]
    else:
      action_info = f"Executed code: 'N/A'"
    
    summarizer_prompt = get_summarizer_prompt(
      goal=goal,
      before_ui_content=step_data.obs.ui_content,
      after_ui_content=after_obs.ui_content,
      execution_info=f"{action_info}\nExecution Result: {exec_feedback}",
      reason=step_data.output.code_reason,
    )
    agent_utils.write_to_file(file_path=log_task_path, file_name=state + '_summarizer_prompt.txt',
                              content=summarizer_prompt)
    
    summarizer_output, summarizer_raw_response = self.summarizer_llm.predict_mm(
      summarizer_prompt,
      [
        before_screenshot_label,
        after_screenshot_label
      ],
      output_format=JSON_models.SummarizerOutput
    )
    agent_utils.write_to_file(file_path=log_task_path, file_name=state + '_summarizer_raw_response.txt',
                              content=summarizer_raw_response)
    
    summarizer_tokens = summarizer_raw_response.usage
    self.record_token.step = str(step_n)
    self.record_token.agent = 'Summarizer'
    self.record_token.step_tokens = summarizer_tokens
    agent_utils.record_cost_tokens(self.record_token)
    agent_utils.write_to_file(file_path=log_task_path, file_name=state + '_summarizer_output.txt',
                              content=summarizer_output)
    
    print_with_color(f'Screen Changes:\n{summarizer_output.screen_changes}\n', 'green')
    print_with_color(f'Execution Summary:\n{summarizer_output.execution_summary}\n', 'green')
    
    return JSON_models.SummarizerInteractionResult(
      execution_summary=summarizer_output.execution_summary,
      screen_changes=summarizer_output.screen_changes
    )
  
  def Execute_rpa_code(
    self,
    task: str,
    execution_file_path: str,
    rpa: Any,
  ):
    print_with_color('============================================', 'cyan')
    print_with_color("Current Module: RPA Exec\n", 'cyan')
    
    rpa_description = rpa['rpa_description']
    rpa_params = rpa['rpa_params']
    rpa_code = rpa['rpa_code']
    rpa_example = rpa['example_usage']
    
    # -----start: use llm to extract parameters for function_call
    # based on 'rpa_description', 'parameters', 'new task' to extract current parameters
    prompt = (
      "You are an expert in extracting task parameters for RPA functions. "
      "Your task is to accurately extract the required parameters for a new task, "
      "based on the provided rpa_description and rpa_parameters format.\n\n"
      
      "[Input]\n"
      f"rpa_description: {rpa_description}\n"
      "rpa_parameters:\n"
      f"{rpa_params}\n"
      f"Example Usage: {rpa_example}\n"
      f"New Task: {task}\n\n"

      # CMH added
      # "[Current Page Information]\n"
      # "HTML Content:\n"
      # f"{self.env_op.cur_obs.ui_content}\n\n"
      
      "[Output Format]\n"
      "Extract the appropriate parameters from the **New Task** according to the rpa_parameters specification, "
      "and construct a function call following the **Example Usage**.\n"
      "**Only include parameters explicitly mentioned in the New Task. Omit missing parameters (functions have defaults).**\n"
      "Do not change the function name or any of the parameter names in **Example Usage** under any circumstances.\n\n"
      
      "Output Example:\n"
      "{\n"
      '  "function_call": "delete_file(file_name=\\"record.txt\\")"\n'
      "}"
    )
    output, raw_response = self.params_extractor_llm.predict_mm(prompt, [], output_format=JSON_models.ParamsExtractionOutput)
    agent_utils.write_to_file(file_path=execution_file_path, file_name='0_extract_params_output.txt', content=output)
    
    cost_tokens = raw_response.usage
    self.record_token.step = '0'
    self.record_token.agent = 'extract params'
    self.record_token.step_tokens = cost_tokens
    agent_utils.record_cost_tokens(self.record_token)
    
    function_call = output.function_call
    if function_call:
      try:
        func_name = agent_utils.extract_function_names(rpa_example)
        pattern = r'\((?:[^()]+|(?R))*\)'  # (?R) is recursive
        params = (regex.findall(pattern, function_call))[0]
      except Exception as e:
        print(f'Error occurred when extracting params: {e}')
      else:
        function_call = f'{func_name}{params}'
    print_with_color(f"Generated function call:\n{function_call}", 'cyan')
    # -----end: use llm to extract parameters for function_call
    
    env_op_traj, exec_result = self.env_op.execute_code(code=rpa_code, vars={"function_call": function_call},
                                                        save_path=execution_file_path, flag_exec_rpa=True)
    
    return function_call, env_op_traj, exec_result
  
  def Concluder_Agent(
    self,
    goal: str,
    log_task_path: str,
    episode_results: JSON_models.EpisodeResult,
  ) -> JSON_models.ConcluderOutput:
    print('--------------------------------------------')
    print("Current Agent: Concluder\n")
    
    is_success = False
    if episode_results.task_successful == 1.0 and episode_results.agent_done:
      is_success = True
    
    if episode_results.task_successful == 1.0:
      benchmark_feedback = "the benchmark judged the task as fully completed"
    elif episode_results.task_successful == 0.0:
      benchmark_feedback = "the benchmark judged the task as not completed at all"
    else:
      benchmark_feedback = f"the benchmark judged the task as partially completed (approximately {episode_results.task_successful * 100:.0f}%)"
    
    if episode_results.agent_done:
      agent_feedback = "the agent believes the task was completed"
    else:
      agent_feedback = "the agent believes the task is still incomplete"
    
    if ((episode_results.task_successful == 1.0 and episode_results.agent_done) or
        (episode_results.task_successful == 0.0 and not episode_results.agent_done)):
      conjunction = "and"
    else:
      conjunction = "while"
    
    env_feedback = f"Regarding the task outcome: {benchmark_feedback}, {conjunction} {agent_feedback}.\n"
    
    concluder_prompt = get_concluder_prompt(
      goal=goal,
      completed_tasks=self.completed_tasks[-1],
      action_history=self.action_history,
      ui_info_str=self.env_op.cur_obs.ui_content,
      reflection_history=self.reflection_history,
      env_feedback=env_feedback,
      is_success=is_success,
    )
    agent_utils.write_to_file(file_path=log_task_path, file_name='concluder_prompt.txt', content=concluder_prompt)
    
    concluder_output, raw_response = self.llm.predict_mm(concluder_prompt, [self.env_op.cur_obs.screenshot],
                                                         output_format=JSON_models.ConcluderOutput)
    agent_utils.write_to_file(file_path=log_task_path, file_name='concluder_raw_output.txt', content=raw_response)
    agent_utils.write_to_file(file_path=log_task_path, file_name='concluder_output.txt', content=concluder_output)
    
    cost_tokens = raw_response.usage
    self.record_token.agent = 'Concluder'
    self.record_token.step_tokens = cost_tokens
    agent_utils.record_cost_tokens(self.record_token)
    
    if not raw_response:
      print("Error: Didn't get concluder response.")
    
    print(f"Episode Conclusion:\n{concluder_output.episode_conclusion}\n")
    print(f"Reflection:\n{concluder_output.reflection}\n")
    
    if concluder_output.reflection is not None:
      self.reflection = concluder_output.reflection
      self.reflection_history.append(concluder_output.reflection)
      episode_results.reflection = concluder_output.reflection
      if isinstance(episode_results.agent_traj, JSON_models.RPAExecTraj):
        episode_results.agent_traj.reflection = concluder_output.reflection
    
    return concluder_output
  
  def Breakpoint_Analyzer_Agent(
    self,
    rpa_exec_traj: JSON_models.RPAExecTraj,
    log_path: str,
  ) -> JSON_models.ExecEvaluatorOutput:
    print('============================================')
    print("Current Agent: Breakpoint_Analyzer_Agent\n")
    
    if not os.path.exists(log_path):
      os.makedirs(log_path)
    
    ui_content = self.env_op.cur_obs.ui_content
    
    # get prompt
    prompt = get_exec_evaluator_prompt(rpa_exec_traj=rpa_exec_traj, ui_content=ui_content)
    agent_utils.write_to_file(file_path=log_path, file_name='Exec_Evaluator_Agent_prompt.txt', content=prompt)
    
    # call MLLM
    output, raw_response = self.llm.predict_mm(prompt, [],
                                               output_format=JSON_models.ExecEvaluatorOutput)
    agent_utils.write_to_file(file_path=log_path, file_name='Exec_Evaluator_Agent_output.txt', content=output)
    cost_tokens = raw_response.usage
    self.record_token.step = '-'
    self.record_token.agent = 'Exec Evaluator'
    self.record_token.step_tokens = cost_tokens
    agent_utils.record_cost_tokens(self.record_token)
    
    print(f'Observations:\n{output.observation}\n')
    print(f'Completed Tasks:\n{output.completed_tasks}\n')
    print(f'Plan Justification:\n{output.plan_reason}\n')
    print(f'Plan List:\n{output.plan_list}\n')
    print(f'Whether To Continue:\n{output.to_continue}\n')
    
    return output
  
  # =========================================================================
  # Batch Action Translation (Execute Before RPA Builder)
  # =========================================================================
  
  def batch_translate_actions(
    self,
    react_trajs: list[JSON_models.ReActTraj],
    log_path: str = None
  ) -> list[JSON_models.ReActTraj]:
    """
    Translate all actions in ReAct trajectories before RPA Builder.
    
    This is called before RPA Builder to process actions in batch
    rather than during ReAct execution.
    
    Args:
      react_trajs: List of ReAct trajectories to translate
      log_path: Optional log path for translation results
      
    Returns:
      List of ReAct trajectories with updated soft_coded_action fields
    """
    if not FLAGS.use_action_translator:
      # Action translation disabled, return as-is
      print_with_color("Action translation disabled, skipping batch translation.", 'yellow')
      return react_trajs
    
    print_with_color("\n🔧 Batch Action Translation (Before RPA Builder)...", 'blue')
    
    translated_trajs = []
    action_translation_context = getattr(self, '_action_translation_context', [])
    
    # Only translate the last trajectory (most recent ReAct episode)
    # Previous trajectories are kept as-is
    for traj_idx, react_traj in enumerate(react_trajs):
      is_last_traj = (traj_idx == len(react_trajs) - 1)
      
      if is_last_traj and action_translation_context:
        print_with_color(f"\n  Processing trajectory {traj_idx + 1}/{len(react_trajs)} (with translation)...", 'cyan')
        translated_steps = []
        
        # Create a mapping from step_n to context for easier lookup
        context_map = {ctx['step_n']: ctx for ctx in action_translation_context}
        
        # Debug: print context mapping
        print_with_color(f"  Context available for steps: {sorted(context_map.keys())}", 'cyan')
        traj_step_nums = [s.step_n for s in react_traj.traj]
        print_with_color(f"  Trajectory has steps: {traj_step_nums}", 'cyan')
        
        for step_info in react_traj.traj:
          # Find context by step_n
          ctx = context_map.get(step_info.step_n)
          
          if ctx:
            should_translate = (
              ctx['is_screen_changed'] or ctx['is_final_step']
            )
            
            if should_translate:
              # Perform action translation
              translated_action = self.ActionTranslator_Agent(
                goal=react_traj.task,
                step_n=ctx['step_n'],
                step_data=ctx['step_data'],
                related_element=ctx['related_element'],
                related_index=ctx['related_index'],
                log_path=log_path or self.log_task_path
              )
              
              # Update soft_coded_action
              step_info.soft_coded_action = translated_action
              print_with_color(
                f"    ✓ Translated step {ctx['step_n']}: {translated_action[:60]}...",
                'green'
              )
            else:
              # Keep original action
              print_with_color(
                f"    - Skipped step {ctx['step_n']} (no screen change)",
                'grey'
              )
          else:
            # No context available, use original action
            print_with_color(
              f"    ⚠ No context for step {step_info.step_n}, keeping original action",
              'yellow'
            )
          
          translated_steps.append(step_info)
        
        # Create new trajectory with translated steps
        translated_traj = JSON_models.ReActTraj(
          task=react_traj.task,
          reflection=react_traj.reflection,
          traj=translated_steps,
          action_history=react_traj.action_history,
          success=react_traj.success,
          conclusion=react_traj.conclusion,
          env_op_traj=react_traj.env_op_traj
        )
        
        translated_trajs.append(translated_traj)
      else:
        # Keep trajectory as-is (no translation context or not the last trajectory)
        print_with_color(f"\n  Keeping trajectory {traj_idx + 1}/{len(react_trajs)} as-is (no translation)", 'grey')
        translated_trajs.append(react_traj)
    
    print_with_color("✅ Batch Action Translation Complete\n", 'blue')
    
    # Clear translation context after processing
    if hasattr(self, '_action_translation_context'):
      self._action_translation_context = []
    
    return translated_trajs
  
  # =========================================================================
  # ActionTranslator (Individual Action Translation)
  # =========================================================================
  
  def ActionTranslator_Agent(
    self,
    log_path: str,
    goal: str,
    step_n: int,
    step_data: PlannerStepData,
    related_element: str,
    related_index: int = None,
  ) -> str:
    print_with_color('============================================', 'light_red')
    print_with_color("Current Agent: ActionTranslator_Agent\n", 'light_red')
    
    if not os.path.exists(log_path):
      os.makedirs(log_path)
    file_prefix = f'step-{step_n}'
    
    prompt = get_action_translator_prompt(goal=goal, obs_analysis=step_data.output.observation,
                                          action_reason=step_data.output.code_reason,
                                          action=step_data.output.code,
                                          related_element=related_element,
                                          ui_info_str=step_data.obs.ui_content)
    agent_utils.write_to_file(file_path=log_path, file_name=f'{file_prefix}_ActionTranslator_Agent_prompt.txt',
                              content=prompt)
    
    output, raw_response = self.actiontranslator_llm.predict_mm(prompt, [step_data.obs.screenshot],
                                               output_format=JSON_models.ActionTranslatorOutput)
    agent_utils.write_to_file(file_path=log_path, file_name=f'{file_prefix}_ActionTranslator_Agent_output.txt',
                              content=output)
    cost_tokens = raw_response.usage
    self.record_token.step = str(step_n)
    self.record_token.agent = 'ActionTranslator'
    self.record_token.step_tokens = cost_tokens
    agent_utils.record_cost_tokens(self.record_token)
    
    print(f'Thought:\n{output.thought}\n')
    print(f'Soft Action:\n{output.soft_action}\n')
    
    # if 'kwargs' in output.soft_action:  # Soft action with kwargs needs index; extract_ui_value ensures kwargs accuracy
    #   output.soft_action = agent_utils.extract_ui_value(output.soft_action, related_element, related_index)
    #
    # print(f'Optimized Soft Action:\n{output.soft_action}\n')
    
    return output.soft_action
