import copy
import os
import sys
from typing import Any

import regex
from absl import flags

from .env_operation import EnvOperation
from .prompts.action_translator_prompt import get_action_translator_prompt
from .prompts.breakpoint_analyzer_prompt import get_exec_evaluator_prompt
from .prompts.concluder_prompt import get_concluder_prompt
from .prompts.planner_prompt import get_planner_prompt
from .prompts.summarizer_prompt import get_summarizer_prompt
from .utils import agent_utils, JSON_models
from .utils.llm_client import OpenAIWrapper
from .utils.JSON_models import ScreenObs, PlannerStepData
from .utils.agent_utils import print_with_color

FLAGS = flags.FLAGS


class Agent_RPA:
  def __init__(
    self,
    env_op: EnvOperation,
    default_llm: OpenAIWrapper,
    name: str = 'Agent_RPA',
    actiontranslator_llm: OpenAIWrapper = None,
    breakpoint_analyzer_llm: OpenAIWrapper = None,
    concluder_llm: OpenAIWrapper = None,
    params_extractor_llm: OpenAIWrapper = None,
    planner_llm: OpenAIWrapper = None,
  ):
    """Initializes Agent_RPA.

    Args:
      env_op: The environment operation.
      default_llm: The default LLM wrapper (main LLM).
      name: The agent name.
      actiontranslator_llm: The LLM wrapper for ActionTranslator.
      breakpoint_analyzer_llm: The LLM wrapper for Breakpoint Analyzer.
      concluder_llm: The LLM wrapper for Concluder.
      params_extractor_llm: The LLM wrapper for Params Extractor.
      planner_llm: The LLM wrapper for Planner Agent.
    """
    self.env_op = env_op
    self.llm = default_llm
    self.default_llm = default_llm
    self.actiontranslator_llm = actiontranslator_llm if actiontranslator_llm is not None else default_llm
    self.breakpoint_analyzer_llm = breakpoint_analyzer_llm if breakpoint_analyzer_llm is not None else default_llm
    self.concluder_llm = concluder_llm if concluder_llm is not None else default_llm
    self.params_extractor_llm = params_extractor_llm if params_extractor_llm is not None else default_llm
    self.planner_llm = planner_llm if planner_llm is not None else default_llm
    self.rpa_bank = None
    
    # Set within run_tasks_*.py
    self.cur_task_type = None
    self.cur_task = None  # the current task description
    self.rpa_mode = False  # False for ReAct, True for RPA Verification or RPA Testing
    self.additional_guidelines = ''
    self.action_history = []
    self.reflection = None  # reset in run_tasks_react.py
    self.reflection_history = []
    
    self.record_token = JSON_models.RecordToken()
  
  def reset(self, task_type: str, log_task_path: str, to_init_task: bool = True):
    self.log_task_path = log_task_path
    os.makedirs(self.log_task_path, exist_ok=True)
    
    self.cur_task_type = task_type
    # self.cur_task = task.goal # set in episode_runner.py, after env_op.reset()
    
    if to_init_task:
      # reset to initial state for each ReAct trial
      self.previous_plan = 'You are just starting the task, and no previous plan exists.'
      self.completed_tasks = ['You just started, no plan has been completed yet.']
      self.screen_changes = 'You just started, no actions has been performed yet.'
      self.action_history = []  # store execution_info (get from env_op and summarizer_agent)
    else:
      self.previous_plan = 'You ran the rpa code generated earlier.'
      # No need to reset completed_tasks. It will be set in run_tasks_rpa.py
      self.screen_changes = 'Because the code was run directly, no screen_changes were recorded. The screen prior to execution was the desktop.'
      # No need to reset action_history and env_op when Breakpoint_Analyzer_Agent output 'Y'
    
    self.flag_done = False
    self.agent_traj = []  # store ReActStepInfo
    
    return len(self.action_history)
  
  def rpa_testing(self) -> JSON_models.RPAExecTraj:
    
    print_with_color('============================================', 'magenta')
    print_with_color(f"Current Stage: {self.rpa_mode}\n", 'magenta')
    
    rpa_dict = self.rpa_bank.rpa_dict
    
    if self.cur_task_type not in rpa_dict:
      print_with_color("rpa doesn't exist", 'magenta')
      return JSON_models.RPAExecTraj()
    
    rpa = rpa_dict[self.cur_task_type]
    # -----start: RPA Verification and Testing
    function_call, env_op_traj, exec_result = self.Execute_rpa_code(
      task=self.cur_task,
      execution_file_path=self.log_task_path,
      rpa=rpa
    )
    print(f'answer return: {exec_result.answer_return}\n')
    
    rpa_exec_traj = JSON_models.RPAExecTraj(
      task=self.cur_task,
      function_call=function_call,
      rpa_code=rpa['rpa_code'],
      exec_result=exec_result,
      action_history=self.env_op.action_history,  # self.action_history
      env_op_traj=env_op_traj,
    )
    self.action_history = rpa_exec_traj.action_history
    self.flag_done = exec_result.done
    return rpa_exec_traj
  
  def step(self) -> JSON_models.ReActStepInfo:
    
    step_n = len(self.action_history) + 1
    print_with_color(f'# Step {step_n}', 'magenta')
    
    # -----start: plan
    planner_result = self.Planner_Agent(
      log_task_path=self.log_task_path,
      goal=self.cur_task,
      step_n=step_n,
      current_obs=self.env_op.cur_obs,
    )
    
    # planner_output = copy.deepcopy(planner_result.data.output)
    planner_output = JSON_models.PlannerOutput_w_soft(**copy.deepcopy(planner_result.data.output).dict())
    # -----end: plan
    
    # -----start: execute code
    traj, exec_result = self.env_op.execute_code(planner_output.code, vars={}, save_path=self.log_task_path)
    action_related_element = traj[-1].related_elements
    exec_feedback = exec_result.exec_feedback
    self.flag_done = exec_result.done
    print_with_color('exec_result', 'magenta')
    print_with_color(exec_result, 'magenta')
    # -----end: execute code
    
    planner_output.soft_action = exec_result.executed_code
    if FLAGS.agent_name == 'agent_rpa':
      # Note: Action translation is now done in batch before RPA Builder
      # Removed real-time translation here to improve efficiency
      # if FLAGS.use_action_translator and (traj[-1].is_screen_changed or is_final_step):
      #   planner_output.soft_action = self.ActionTranslator_Agent(...)
      if FLAGS.react_soft_action:
        planner_output.soft_action = planner_result.data.output.soft_action
    
    # Whether to include exec_feedback
    if len(self.env_op.action_history):
      execution_info = f"summarize_and_analyze:\n{planner_output.summarize_and_analyze}\n{self.env_op.action_history[-1]}"
    else:
      execution_info = f"summarize_and_analyze:\n{planner_output.summarize_and_analyze}\nNo action has been performed."
    self.screen_changes = ""
    
    self.action_history.append(execution_info)
    
    # Extract Action result from current step's summarize_and_analyze, update prev step's execution_summary
    # Step N+1's summarize_and_analyze describes the result after Step N execution
    if step_n > 1 and len(self.agent_traj) > 0:
      action_result = self._extract_action_result(planner_output.summarize_and_analyze)
      if action_result:
        # Update previous step (Step N) execution_summary
        self.agent_traj[-1].execution_summary = action_result
    
    print_with_color('--------------------------------------------', 'magenta')
    print_with_color(f'# Completed Step {step_n}\n', 'magenta')
    
    react_step_info = JSON_models.ReActStepInfo(
      step_n=step_n,
      ui_content=self.env_op.before_obs.ui_content,
      obs_description=planner_output.summarize_and_analyze,
      action_reason=planner_output.code_reason,
      action=planner_output.code,
      soft_coded_action=planner_output.soft_action,
      related_elements=action_related_element,
      execution_summary="",  # Current step's execution_summary updated in next step
      action_step_str=self.action_history[-1] if len(self.action_history) else None,
      exec_step_info=traj[-1],
    )
    self.agent_traj.append(react_step_info)
    
    return react_step_info
  
  def Planner_Agent(
    self,
    log_task_path: str,
    goal: str,
    step_n: int,
    current_obs: ScreenObs,
  ) -> JSON_models.PlannerInteractionResult:
    
    print_with_color('============================================', 'green')
    print_with_color("Current Agent: Planner\n", 'green')
    
    state = f'step-{step_n}_before'
    
    planner_prompt = get_planner_prompt(
      goal=goal,
      previous_plan=self.previous_plan,
      completed_plan=self.completed_tasks[-1],
      action_history=self.action_history,
      ui_content=current_obs.ui_content,
      screen_changes=self.screen_changes,
      reflection=self.reflection,  # Add the result of the previous reflection
      additional_guidelines=self.additional_guidelines,
    )
    agent_utils.write_to_file(file_path=log_task_path, file_name=state + '_planner_prompt.txt', content=planner_prompt)
    
    planner_output, planner_raw_response = self.planner_llm.predict_mm(
      planner_prompt,
      [current_obs.screenshot],
      output_format=JSON_models.PlannerOutput_w_soft if FLAGS.react_soft_action else JSON_models.PlannerOutput
    )
    agent_utils.write_to_file(file_path=log_task_path,
                              file_name=state + '_planner_raw_response.txt',
                              content=planner_raw_response)
    # store step_tokens
    planner_tokens = planner_raw_response.usage
    self.record_token.step = str(step_n)
    self.record_token.agent = 'Planner'
    self.record_token.step_tokens = planner_tokens
    self.record_token.llm = self.planner_llm.model_name
    agent_utils.record_cost_tokens(self.record_token)
    agent_utils.write_to_file(file_path=log_task_path, file_name=state + '_planner_output.txt', content=planner_output)
    
    self.previous_plan = planner_output.plan_list
    self.completed_tasks.append(planner_output.completed_tasks)
    
    step_data_pl = PlannerStepData(
      obs=current_obs,
      output=planner_output,
    )
    
    # -----start: print planner_output
    print_with_color(f'Summarize and Analyze:\n{planner_output.summarize_and_analyze}\n', 'green')
    if planner_output.consider_reflection:
      print_with_color(f'Reflection Consideration:\n{planner_output.consider_reflection}\n', 'green')
    print_with_color(f'Completed Tasks:\n{planner_output.completed_tasks}\n', 'green')
    print_with_color(f'Plan Justification:\n{planner_output.plan_reason}\n', 'green')
    print_with_color(f'Plan List:\n{planner_output.plan_list}\n', 'green')
    print_with_color(f'Next Action Justification:\n{planner_output.code_reason}\n', 'green')
    print_with_color(f'Action:\n{planner_output.code}\n', 'green')
    if hasattr(planner_output, 'soft_action'):
      print_with_color(f'Soft Action:\n{planner_output.soft_action}\n', 'green')
    sys.stdout.flush()
    # -----end: print planner_output
    
    return JSON_models.PlannerInteractionResult(data=step_data_pl)
  
  def Execute_rpa_code(
    self,
    task: str,
    execution_file_path: str,
    rpa: Any,
  ):
    print_with_color('============================================', 'cyan')
    print_with_color("Current Module: RPA Exec\n", 'cyan')
    
    rpa_description = rpa['rpa_description']
    rpa_params = rpa['rpa_params']
    rpa_code = rpa['rpa_code']
    rpa_example = rpa['example_usage']
    
    # -----start: use llm to extract parameters for function_call
    # based on 'rpa_description', 'parameters', 'new task' to extract current parameters
    prompt = (
      "You are an expert in extracting task parameters for Android RPA functions. "
      "Your task is to accurately extract the required parameters for a new task, "
      "based on the provided rpa_description and rpa_parameters format.\n\n"
      
      "[Input]\n"
      f"rpa_description: {rpa_description}\n"
      "rpa_parameters:\n"
      f"{rpa_params}\n"
      f"Example Usage: {rpa_example}\n"
      f"New Task: {task}\n\n"
      
      "[Output Format]\n"
      "Extract the appropriate parameters from the **New Task** according to the rpa_parameters specification, "
      "and construct a function call following the **Example Usage**.\n"
      "Do not change the function name or any of the parameter names in **Example Usage** under any circumstances.\n\n"
      
      "Output Example:\n"
      "{\n"
      '  "function_call": "delete_file(file_name=\\"record.txt\\")"\n'
      "}"
    )
    output, raw_response = self.params_extractor_llm.predict_mm(prompt, [], output_format=JSON_models.ParamsExtractionOutput)
    agent_utils.write_to_file(file_path=execution_file_path, file_name='0_extract_params_output.txt', content=output)
    
    cost_tokens = raw_response.usage
    self.record_token.step = '0'
    self.record_token.agent = 'extract params'
    self.record_token.step_tokens = cost_tokens
    self.record_token.llm = self.params_extractor_llm.model_name
    agent_utils.record_cost_tokens(self.record_token)
    
    function_call = output.function_call
    if function_call:
      try:
        func_name = agent_utils.extract_function_names(rpa_example)
        pattern = r'\((?:[^()]+|(?R))*\)'  # (?R) is recursive
        params = (regex.findall(pattern, function_call))[0]
      except Exception as e:
        print(f'Error occurred when extracting params: {e}')
      else:
        function_call = f'{func_name}{params}'
    print_with_color(f"Generated function call:\n{function_call}", 'cyan')
    # -----end: use llm to extract parameters for function_call
    
    env_op_traj, exec_result = self.env_op.execute_code(code=rpa_code, vars={"function_call": function_call},
                                                        save_path=execution_file_path, flag_exec_rpa=True)
    
    return function_call, env_op_traj, exec_result
  
  def Concluder_Agent(
    self,
    goal: str,
    log_task_path: str,
    episode_results: JSON_models.EpisodeResult,
  ) -> JSON_models.ConcluderOutput:
    print('--------------------------------------------')
    print("Current Agent: Concluder\n")
    
    is_success = False
    if episode_results.task_successful == 1.0 and episode_results.agent_done:
      is_success = True
    
    concluder_prompt = get_concluder_prompt(
      goal=goal,
      completed_tasks=self.completed_tasks[-1],
      action_history=self.action_history,
      ui_info_str=self.env_op.cur_obs.ui_content,
      reflection_history=self.reflection_history,
      env_feedback=agent_utils.get_env_feedback(episode_results.task_successful, episode_results.agent_done),
      is_success=is_success,
    )
    agent_utils.write_to_file(file_path=log_task_path, file_name='concluder_prompt.txt', content=concluder_prompt)
    
    concluder_output, raw_response = self.concluder_llm.predict_mm(concluder_prompt, [self.env_op.cur_obs.screenshot],
                                                                    output_format=JSON_models.ConcluderOutput)
    agent_utils.write_to_file(file_path=log_task_path, file_name='concluder_raw_output.txt', content=raw_response)
    agent_utils.write_to_file(file_path=log_task_path, file_name='concluder_output.txt', content=concluder_output)
    
    cost_tokens = raw_response.usage
    self.record_token.agent = 'Concluder'
    self.record_token.step_tokens = cost_tokens
    self.record_token.llm = self.concluder_llm.model_name
    agent_utils.record_cost_tokens(self.record_token)
    
    if not raw_response:
      print("Error: Didn't get concluder response.")
    
    print(f"Episode Conclusion:\n{concluder_output.episode_conclusion}\n")
    print(f"Reflection:\n{concluder_output.reflection}\n")
    
    if concluder_output.reflection is not None:
      self.reflection = concluder_output.reflection
      self.reflection_history.append(concluder_output.reflection)
    
    return concluder_output
  
  def Breakpoint_Analyzer_Agent(
    self,
    rpa_exec_traj: JSON_models.RPAExecTraj,
    log_path: str,
  ) -> JSON_models.ExecEvaluatorOutput:
    print('============================================')
    print("Current Agent: Breakpoint_Analyzer_Agent\n")
    
    if not os.path.exists(log_path):
      os.makedirs(log_path)
    
    ui_content = self.env_op.cur_obs.ui_content
    
    # get prompt
    prompt = get_exec_evaluator_prompt(rpa_exec_traj=rpa_exec_traj, ui_content=ui_content)
    agent_utils.write_to_file(file_path=log_path, file_name='Exec_Evaluator_Agent_prompt.txt', content=prompt)
    
    # call MLLM
    output, raw_response = self.breakpoint_analyzer_llm.predict_mm(prompt, [],
                                                                    output_format=JSON_models.ExecEvaluatorOutput)
    agent_utils.write_to_file(file_path=log_path, file_name='Exec_Evaluator_Agent_output.txt', content=output)
    cost_tokens = raw_response.usage
    self.record_token.step = '-'
    self.record_token.agent = 'Exec Evaluator'
    self.record_token.step_tokens = cost_tokens
    self.record_token.llm = self.breakpoint_analyzer_llm.model_name
    agent_utils.record_cost_tokens(self.record_token)
    
    print(f'Observations:\n{output.observation}\n')
    print(f'Completed Tasks:\n{output.completed_tasks}\n')
    print(f'Code Diagnosis:\n{output.code_diagnosis}\n')
    print(f'Plan Justification:\n{output.plan_reason}\n')
    print(f'Plan List:\n{output.plan_list}\n')
    print(f'Whether To Continue:\n{output.to_continue}\n')
    
    return output
  
  def ActionTranslator_Agent(
    self,
    log_path: str,
    goal: str,
    step_n: int,
    step_data: Any,  # Can be PlannerStepData or SimpleNamespace
    related_element: str,
    related_index: int = None,
    suppress_header: bool = False,
  ) -> str:
    if not suppress_header:
      print_with_color('============================================', 'light_red')
      print_with_color("Current Agent: ActionTranslator_Agent\n", 'light_red')
    
    if not os.path.exists(log_path):
      os.makedirs(log_path)
    file_prefix = f'step-{step_n}'
    
    prompt = get_action_translator_prompt(goal=goal, obs_analysis=step_data.output.observation,
                                          action_reason=step_data.output.code_reason,
                                          action=step_data.output.code,
                                          related_element=related_element,
                                          ui_info_str=step_data.obs.ui_content)
    agent_utils.write_to_file(file_path=log_path, file_name=f'{file_prefix}_ActionTranslator_Agent_prompt.txt',
                              content=prompt)
    
    output, raw_response = self.actiontranslator_llm.predict_mm(prompt, [step_data.obs.screenshot],
                                                                 output_format=JSON_models.ActionTranslatorOutput)
    agent_utils.write_to_file(file_path=log_path, file_name=f'{file_prefix}_ActionTranslator_Agent_output.txt',
                              content=output)
    cost_tokens = raw_response.usage
    self.record_token.step = str(step_n)
    self.record_token.agent = 'ActionTranslator'
    self.record_token.step_tokens = cost_tokens
    self.record_token.llm = self.actiontranslator_llm.model_name
    agent_utils.record_cost_tokens(self.record_token)
    
    print(f'Thought:\n{output.thought}\n')
    print(f'Soft Action:\n{output.soft_action}\n')
    
    # if 'kwargs' in output.soft_action:  # Soft action with kwargs needs index; extract_ui_value ensures kwargs accuracy
    #   output.soft_action = agent_utils.extract_ui_value(output.soft_action, related_element, related_index)
    #
    # print(f'Optimized Soft Action:\n{output.soft_action}\n')
    
    return output.soft_action
  
  def _extract_action_result(self, summarize_and_analyze: str) -> str:
    """Extract Action result from summarize_and_analyze.
    
    Args:
      summarize_and_analyze: Planner-generated summarize_and_analyze string
      
    Returns:
      Extracted Action result, or empty string on failure
    """
    if not summarize_and_analyze or not isinstance(summarize_and_analyze, str):
      return ""
    
    # Match content between **Action result**: and **Page layout**:
    # Use regex for multiline
    pattern = r'\*\*Action result\*\*:\s*(.*?)\s*\*\*Page layout\*\*:'
    match = regex.search(pattern, summarize_and_analyze, regex.DOTALL)
    if match:
      result = match.group(1).strip()
      return result
    
    # If format is non-standard, try looser match
    # Match **Action result**: to next ** marker
    pattern_fallback = r'\*\*Action result\*\*:\s*(.*?)(?=\s*\*\*[^*]|$)'
    match_fallback = regex.search(pattern_fallback, summarize_and_analyze, regex.DOTALL)
    if match_fallback:
      result = match_fallback.group(1).strip()
      return result
    
    return ""
  
  def _is_passthrough_action(self, action: str | None) -> bool:
    """Return True if the action should bypass ActionTranslator entirely.
    
    These actions don't depend on specific UI elements and don't need translation:
    - scroll(direction): Directional scrolling
    - go_back(), go_forward(): Browser navigation
    - new_tab(), close_tab(): Tab management
    
    Note: ask_mllm and get_ui_content don't appear in react stage, so no need to check.
    """
    if not action or not isinstance(action, str):
      return False
    s = action.strip()
    if not s:
      return False
    # Normalize optional env_op prefix
    if s.startswith("env_op."):
      s2 = s[len("env_op."):]
    else:
      s2 = s
    # Extract function name
    m = regex.match(r"^([a-zA-Z_]\w*)\s*\(", s2)
    if not m:
      return False
    fn = m.group(1)
    # Hard whitelist: these don't need translation.
    if fn in {"scroll", "go_back", "go_forward", "new_tab", "close_tab"}:
      return True
    return False
  
  def _build_action_translation_context_from_react_traj(
    self,
    react_traj: JSON_models.ReActTraj
  ) -> list[dict]:
    """
    Build action translation context from ReActTraj for batch translation.
    
    Args:
      react_traj: ReActTraj to build context from
      
    Returns:
      List of context dictionaries for each step
    """
    translation_context = []
    
    # Build context from react_traj steps
    for step_info in react_traj.traj:
      # Get execution info from exec_step_info
      exec_step_info = step_info.exec_step_info
      
      is_screen_changed = exec_step_info.is_screen_changed if exec_step_info else False
      
      # Check if this is the final step
      action_code = step_info.soft_coded_action or step_info.action
      is_final_step = (
        'env_op.stop' in action_code or 
        action_code.strip().startswith('stop(') or
        step_info.step_n == len(react_traj.traj)
      )
      
      # Load screenshot from path if available
      screenshot = None
      if exec_step_info and exec_step_info.before_screenshot_path:
        screenshot_path = exec_step_info.before_screenshot_path
        if screenshot_path and screenshot_path.strip():
          try:
            screenshot = agent_utils.load_image_as_ndarray(screenshot_path)
          except Exception as e:
            print_with_color(f"  ⚠️  Failed to load screenshot for step {step_info.step_n}: {e}", 'yellow')
      
      # Create ScreenObs
      screen_obs = ScreenObs(
        screenshot=screenshot,
        ui_content=step_info.ui_content
      )
      
      # Create step_data using SimpleNamespace (similar to Android World)
      # Note: PlannerOutput uses 'summarize_and_analyze' but ActionTranslator expects 'observation'
      from types import SimpleNamespace
      
      # Create a simple output object with observation attribute
      output_obj = SimpleNamespace(
        observation=step_info.obs_description,
        code_reason=step_info.action_reason,
        code=step_info.action,
        summarize_and_analyze=step_info.obs_description,  # Keep for compatibility
      )
      
      # Create step_data using SimpleNamespace (more flexible than Pydantic model)
      step_data = SimpleNamespace(
        obs=screen_obs,
        output=output_obj,
        obs_description=step_info.obs_description,
        action_reason=step_info.action_reason,
        action=step_info.action,
      )
      
      translation_context.append({
        'step_n': step_info.step_n,
        'step_data': step_data,
        'related_element': step_info.related_elements,
        'related_index': exec_step_info.related_target if exec_step_info else None,
        'is_screen_changed': is_screen_changed,
        'is_final_step': is_final_step,
        'action': action_code
      })
    
    return translation_context
  
  def batch_translate_actions(
    self,
    react_trajs: list[JSON_models.ReActTraj],
    log_path: str = None,
  ) -> list[JSON_models.ReActTraj]:
    """
    Translate all actions in ReAct trajectories before RPA Builder.
    
    Args:
      react_trajs: List of ReAct trajectories to translate
      log_path: Optional log path for translation results
      
    Returns:
      List of ReAct trajectories with updated soft_coded_action fields
    """
    if not FLAGS.use_action_translator:
      # Action translation disabled, return as-is
      print_with_color("Action translation disabled, skipping batch translation.", 'yellow')
      return react_trajs
    
    print_with_color("\n" + "="*80, 'blue')
    print_with_color("🔧 Batch Action Translation (Before RPA Builder)", 'blue')
    print_with_color("="*80, 'blue')
    
    translated_trajs = []
    
    # Build translation context from the last (most recent) trajectory
    action_translation_context = []
    if react_trajs:
      print_with_color("📦 Building action translation context from ReActTraj...", 'cyan')
      last_traj = react_trajs[-1]  # Use the last (most recent) trajectory
      action_translation_context = self._build_action_translation_context_from_react_traj(last_traj)
      print_with_color(
        f"📦 Built action translation context with {len(action_translation_context)} steps",
        'cyan'
      )
    
    # Only translate the last trajectory (most recent ReAct episode)
    # Previous trajectories are kept as-is
    for traj_idx, react_traj in enumerate(react_trajs):
      is_last_traj = (traj_idx == len(react_trajs) - 1)
      
      if is_last_traj and action_translation_context:
        print_with_color(f"\n📋 Processing trajectory {traj_idx + 1}/{len(react_trajs)}:", 'cyan')
        
        # Create a mapping from step_n to context for easier lookup
        context_map = {ctx['step_n']: ctx for ctx in action_translation_context}
        
        # Determine the log path to use
        effective_log_path = log_path or self.log_task_path
        if not effective_log_path or not effective_log_path.strip():
          print_with_color(
            "⚠️  Warning: No valid log path available for action translation. "
            "Translation logs will not be saved.",
            'yellow'
          )
          effective_log_path = os.path.join(os.path.dirname(__file__), 'temp_translation_logs')
          os.makedirs(effective_log_path, exist_ok=True)
        
        translation_folder = os.path.join(effective_log_path, 'batch_action_translation')
        os.makedirs(translation_folder, exist_ok=True)
        
        # Process each step
        for step_info in react_traj.traj:
          ctx = context_map.get(step_info.step_n)
          
          # Skip if no context available
          if not ctx:
            print_with_color(f"  ⏭️  Step {step_info.step_n}: No context available, skipping", 'yellow')
            # Ensure soft_coded_action is set (use original action if not already set)
            if not step_info.soft_coded_action or not step_info.soft_coded_action.strip():
              step_info.soft_coded_action = step_info.action
            continue
          
          # Check if already soft-coded
          # First check if already soft-coded (contains find_element or ask_mllm)
          if step_info.soft_coded_action and step_info.soft_coded_action.strip():
            if 'find_element' in step_info.soft_coded_action or 'ask_mllm' in step_info.soft_coded_action:
              print_with_color(f"  ✓ Step {step_info.step_n}: Already soft-coded (find_element/ask_mllm), skipping translation", 'green')
              continue
          
          # Ensure soft_coded_action has a value (fallback to action if not set)
          if not step_info.soft_coded_action or not step_info.soft_coded_action.strip():
            step_info.soft_coded_action = step_info.action
          
          # Check if passthrough action (no translation needed) - check by action name
          if self._is_passthrough_action(step_info.action):
            print_with_color(f"  ⏭️  Step {step_info.step_n}: Passthrough action, no translation needed: {step_info.action}", 'green')
            # Set soft_coded_action to the original action
            step_info.soft_coded_action = step_info.action
            continue
          
          # Check if needs translation (screen changed or final step)
          if not (ctx['is_screen_changed'] or ctx['is_final_step']):
            print_with_color(f"  ⏭️  Step {step_info.step_n}: No screen change and not final step, skipping translation", 'yellow')
            # Ensure soft_coded_action is set (use original action if not already set)
            if not step_info.soft_coded_action or not step_info.soft_coded_action.strip():
              step_info.soft_coded_action = step_info.action
            continue
          
          # Translate the action
          try:
            print_with_color(f"  🔄 Step {step_info.step_n}: Translating action...", 'cyan')
            translated_action = self.ActionTranslator_Agent(
              log_path=translation_folder,
              goal=react_traj.task,
              step_n=step_info.step_n,
              step_data=ctx['step_data'],
              related_element=ctx['related_element'],
              related_index=ctx['related_index'],
              suppress_header=True
            )
            step_info.soft_coded_action = translated_action
            print_with_color(f"  ✓ Step {step_info.step_n}: Translation successful", 'green')
          except Exception as e:
            print_with_color(f"  ❌ Step {step_info.step_n}: Translation failed: {e}", 'red')
            # Keep original action if translation fails
            step_info.soft_coded_action = step_info.action
        
        translated_trajs.append(react_traj)
      else:
        # Keep previous trajectories as-is
        translated_trajs.append(react_traj)
    
    print_with_color("\n✅ Batch translation completed", 'green')
    return translated_trajs