"""
AutoRPA Main Entry Point

This script orchestrates the AutoRPA system for automated RPA (Robotic Process Automation)
generation and testing on Android applications.

Key Components:
  - GUI Agent: Explores tasks and generates trajectories (React*, DroidRun, AskUI)
  - RPA Builder: Converts trajectories into reusable RPA code
  - RPA Executor: Tests and verifies generated RPAs

Parameter Organization:
  1. Experiment Mode Selection - Choose agent type and test mode
  2. GUI Agent Configuration - Configure exploration agent (type-specific)
  3. LLM Model Configuration - Specify models for different components
  4. Task Configuration - Define task exploration parameters
  5. Action Generation Configuration - Control action translation and optimization
  6. Knowledge Bank Configuration - Manage RPA and trajectory persistence
  7. Testing Configuration - Configure RPA testing behavior
  8. Benchmark & Task Suite Configuration - Select evaluation tasks
  9. Android Emulator Configuration - Set up device connection
  10. Experiment Logging Configuration - Control output and logs
  11. MiniWoB Benchmark Configuration - MiniWoB-specific settings

Conditional Parameters (⚙️):
  - Some parameters are only active under specific conditions (e.g., gui_agent_type)
  - Refer to individual parameter help strings for activation conditions

See USAGE EXAMPLES section below for common command-line invocations.
"""

import os

# Set env vars before importing any gRPC-related code to suppress gRPC warnings
os.environ['GRPC_VERBOSITY'] = 'ERROR'
os.environ['GRPC_TRACE'] = ''
os.environ['GLOG_minloglevel'] = '2'  # 0=INFO, 1=WARNING, 2=ERROR, 3=FATAL

from gui_agents.react_star.adapter import ReactStarAgent

import datetime
import math

import sys
import time
from collections.abc import Sequence

from absl import app, flags, logging

from autorpa.core import agent_rpa
from autorpa import suite_utils as suite_utils
from autorpa.env_operation import EnvOperation
from autorpa.utils.llm_client import get_llm_wrapper
from autorpa.utils.rpa_bank_utils import RPABank
from autorpa.utils.traj_utils import ReactTrajBank
from android_world import registry
from android_world.env import env_launcher

# import ssl
# ssl._create_default_https_context = ssl._create_unverified_context

logging.set_verbosity(logging.WARNING)

from dotenv import load_dotenv, find_dotenv
load_dotenv(find_dotenv())

## ============================================================================
## FLAG DEFINITIONS
## ============================================================================
# Flags are organized by functional category for better maintainability.
# Conditional flags (marked with ⚙️) are only used under specific conditions.

# =============================================================================
# 1. EXPERIMENT MODE SELECTION
# =============================================================================
flags.DEFINE_string(
    'agent_name', 'autorpa',
    help="Experiment mode: 'gui-agent' (exploration only), 'autorpa' (full pipeline)"
)

flags.DEFINE_boolean(
    'test_rpa_mode', False, 
    help='If True, test existing RPAs from rpa_bank instead of generating new ones. '
         'Automatically loads rpa_bank.json when enabled. '
         'update_rpa_bank has no effect in this mode (no new RPAs generated).'
)

flags.DEFINE_integer(
    'reflection_rounds', 2,
    help='Number of reflection rounds for GUI agent exploration. '
         'Higher values may improve success rate but increase cost. '
         'Only used when agent_name=gui-agent or in AutoRPA exploration phase.'
)

# =============================================================================
# 2. GUI AGENT CONFIGURATION
# =============================================================================
flags.DEFINE_string(
    'gui_agent_type', 'react_star', 
    help="GUI agent for exploration phase:\n"
         "  - 'react_star': React* Planner + Summarizer (default)\n"
         "  - 'droidrun': DroidRun agent\n"
         "  - 'askui': AskUI agent"
)

# ⚙️ DroidRun Agent Specific Configuration (only when gui_agent_type='droidrun')
flags.DEFINE_string(
    'droidrun_config_path', 'config.yaml', 
    help='[DroidRun only] Path to DroidRun configuration file'
)
flags.DEFINE_integer(
    'droidrun_timeout', 600, 
    help='[DroidRun only] Timeout for DroidRun agent execution (seconds)'
)

# =============================================================================
# 3. LLM MODEL CONFIGURATION
# =============================================================================
# Available models: 'gpt-4o', 'gpt-4.1', 'gpt-5-low', 
#                   'gemini-2.5-pro-thinking', 'claude-sonnet-4-5'
# gpt-5-low means gpt-5 low reasoning effort

flags.DEFINE_string(
    'default_llm', 'gpt-5-low',
    help="Default LLM model for all components (unless overridden below)"
)

# --- Specialized LLM Models (optional overrides) ---
flags.DEFINE_string(
    'builder_llm', 'gpt-5-medium',
    help="LLM for RPA Builder Agent (generates RPA code from trajectories)"
)

flags.DEFINE_string(
    'grounder_llm', 'gpt-5-low',
    help="LLM for UI element grounding in find_element() calls. "
         "Note: Use non-thinking models like 'gemini-2.5-pro-nothinking' for faster grounding."
)

flags.DEFINE_string(
    'actiontranslator_llm', 'gpt-5-mini',
    help="LLM for ActionTranslator Agent (converts hardcoded actions to soft-coded actions)"
)

flags.DEFINE_string(
    'breakpoint_analyzer_llm', 'gpt-5-low',
    help="LLM for Breakpoint Analyzer Agent (analyzes breakpoints in RPA code)"
)

flags.DEFINE_string(
    'concluder_llm', 'gpt-5-low',
    help="LLM for Concluder Agent (concludes RPA code)"
)

flags.DEFINE_string(
    'params_extractor_llm', 'gpt-5-mini',
    help="LLM for Params Extractor Agent (extracts parameters from RPA code)"
)

flags.DEFINE_string(
    'ask_mllm_llm', 'gpt-5-low',
    help="LLM for AskMLLM action (asks questions to the LLM for information retrieval)"
)

flags.DEFINE_boolean(
    'enable_shell_action', False,
    help='Enable shell action support across entire pipeline (exploration + building). '
         'When enabled: GUI agent can execute ADB shell commands, and ActionTranslator/RPA Builder will translate them. '
         'Use with caution - shell commands provide system-level access.'
)

# ⚙️ React* Agent Specific LLMs (only when gui_agent_type='react_star')
flags.DEFINE_string(
    'planner_llm', 'claude-sonnet-4-5',
    help="[React* only] LLM for Planner Agent (generates action plans)"
)

flags.DEFINE_string(
    'summarizer_llm', 'gpt-5-low',
    help="[React* only] LLM for Summarizer Agent (summarizes execution results)"
)

flags.DEFINE_enum(
    'react_star_action_space', 'index',
    ['index', 'coordinate'],
    help="[React* only] Action space mode: 'index' (use element indexes) or 'coordinate' (use pixel coordinates). "
         "Auto-inferred from react_star_ui_info if not set: screenshot_with_tree/screenshot_only_som → index, screenshot_only → coordinate."
)

flags.DEFINE_enum(
    'react_star_ui_info', 'screenshot_with_tree',
    ['screenshot_with_tree', 'screenshot_only', 'screenshot_only_som'],
    help="[React* only] UI information mode: 'screenshot_with_tree' (screenshot + ally tree), "
         "'screenshot_only' (screenshot only), 'screenshot_only_som' (screenshot with SOM markers). "
         "Affects react_star_action_space auto-inference: screenshot_with_tree/screenshot_only_som → index, screenshot_only → coordinate."
)

flags.DEFINE_enum(
    'react_star_img_resize_mode', 'resized',
    ['original', 'resized'],
    help="[React* only] Image resize mode: 'original' (use original screenshots) or 'resized' (use resized screenshots 461x1024). When 'resized' and action_space_mode='coordinate', coordinates will be automatically converted from resized to original scale."
)

# =============================================================================
# 4. TASK CONFIGURATION
# =============================================================================
flags.DEFINE_integer(
    'num_tasks_to_explore', 3,
    help='Number of task instances to explore per task type. '
         'Directly impacts the reliability and generalization of learned RPAs. '
         'Recommended range: 1-10.'
)

flags.DEFINE_integer(
    'max_attempts_per_task', 3, 
    help='Maximum attempts to build/fix RPA for a task before abandoning it.'
)

# Internal state variable (auto-managed, do not set manually)
flags.DEFINE_integer(
    'cur_attempt_cnt', 1,
    help='[INTERNAL] Current attempt number during RPA building. '
         'Automatically managed by the system. Do not set this manually.'
)

# =============================================================================
# 5. ACTION GENERATION CONFIGURATION
# =============================================================================
flags.DEFINE_boolean(
    'use_action_translator', True,
    help='Enable ActionTranslator Agent to convert hardcoded actions (e.g., click(5)) '
         'to soft-coded actions (e.g., find_element + click). '
         'Significantly improves RPA generalization across different task instances.'
)

flags.DEFINE_boolean(
    'use_fetch_info', True, 
    help='Enable RPA Builder to fetch additional UI information from trajectories '
         'when generating RPA code. Improves code quality but increases LLM calls.'
)

# =============================================================================
# 6. KNOWLEDGE BANK CONFIGURATION
# =============================================================================
flags.DEFINE_boolean(
    'update_rpa_bank', True, 
    help='[Normal mode only] Save newly generated RPAs to data/rpa_bank.json after successful generation. '
         'Has no effect when test_rpa_mode=True (no new RPAs generated). '
         'Temporary RPA files are always saved to log directory regardless of this setting.'
)

flags.DEFINE_boolean(
    'use_react_trajs_bank', True, 
    help='Load and use previously successful React trajectories from react_trajs_bank.json. '
         'Can speed up RPA generation by reusing known successful paths.'
)

flags.DEFINE_boolean(
    'update_react_trajs_bank', True, 
    help='Save successful React trajectories to react_trajs_bank.json for future reuse.'
)

flags.DEFINE_boolean(
    'force_update_react_trajs_bank', False, 
    help='Force update react_trajs_bank.json even if new trajectory quality is lower than existing one. '
         'When True, skips quality-based comparison and always replaces existing trajectories for the same instance_id.'
)

# =============================================================================
# 7. TESTING CONFIGURATION
# =============================================================================
flags.DEFINE_list(
    'to_test_tasks', [0], 
    help='Task indices to test (0-based). Used when test_rpa_mode=True or run_react_test_tasks=True. '
         'Default [0] tests first task. Examples: [0], [0,1,2], [5,10,15].'
)

flags.DEFINE_boolean(
    'run_react_test_tasks', False, 
    help='[Debug] When True, use to_test_tasks list and run React agent instead of RPA execution. '
         'Useful for comparing React vs RPA performance. '
         'Automatically set to True when agent_name=gui-agent.'
)

# =============================================================================
# 8. BENCHMARK & TASK SUITE CONFIGURATION
# =============================================================================
flags.DEFINE_enum(
    'suite_family', registry.TaskRegistry.ANDROID_WORLD_FAMILY,
    [registry.TaskRegistry.ANDROID_WORLD_FAMILY,
     registry.TaskRegistry.MINIWOB_FAMILY_SUBSET,
     registry.TaskRegistry.MINIWOB_FAMILY,
     registry.TaskRegistry.ANDROID_FAMILY,
     registry.TaskRegistry.INFORMATION_RETRIEVAL_FAMILY],
    help='Task suite family to evaluate. See registry.py for details. '
         'Note: Only one family can be run at a time.'
)

flags.DEFINE_list(
    'tasks', None,
    help='Specific tasks to run from the suite family. '
         'If None, runs all tasks in the suite. '
         'Special values: "subset" loads predefined TASKS_SUBSET from configs/task_subsets.py. '
         'Examples: None (all tasks), ["FilesDeleteFile","ContactsAddContact"], ["subset"], ["rest"]'
)

flags.DEFINE_integer(
    'task_random_seed', 30, 
    help='Random seed for task parameter generation. '
         'Ensures reproducibility across runs.'
)

flags.DEFINE_boolean(
    'fixed_task_seed', False,
    help='Use identical task parameters across all task instances. '
         'Useful for debugging RPA generation with consistent task variations.'
)

# =============================================================================
# 9. ANDROID EMULATOR CONFIGURATION
# =============================================================================
def _find_adb_directory() -> str:
  """Automatically locate adb executable in common Android SDK paths."""
  potential_paths = [
    os.path.expanduser('~/Library/Android/sdk/platform-tools/adb'),  # macOS
    os.path.expanduser('~/Android/Sdk/platform-tools/adb'),  # Linux
    os.path.expanduser('~/AppData/Local/Android/Sdk/platform-tools/adb.exe')  # Windows
  ]
  for path in potential_paths:
    if os.path.isfile(path):
      return path
  raise EnvironmentError(
    'adb not found in common Android SDK paths. Please install Android SDK '
    'and ensure adb is in one of the expected directories, or specify --adb_path.'
  )


flags.DEFINE_string(
    'adb_path', _find_adb_directory(), 
    help='Path to adb executable. Auto-detected by default. '
         'Override if adb is installed in a custom location.'
)

flags.DEFINE_integer(
    'console_port', 5554, 
    help='Console port of the running Android emulator. '
         'Default 5554 corresponds to emulator-5554.'
)

# =============================================================================
# 10. EXPERIMENT LOGGING CONFIGURATION
# =============================================================================
flags.DEFINE_string(
    'log_folder_exp', '', 
    help='[Auto-generated] Path to save experiment logs and intermediate files. '
         'Automatically set to log/{agent_name}_{timestamp}_{llm}/ if empty.'
)

flags.DEFINE_boolean(
    'enable_llm_logging', False,
    help='Enable logging of each LLM call to local log folder. '
         'When False, LLM call logs (prompts, images, metadata) will not be saved.'
)

flags.DEFINE_enum(
    'log_level', 'INFO',
    ['DEBUG', 'INFO', 'WARNING', 'ERROR', 'CRITICAL'],
    help='Console logging level. Controls which log messages are displayed in terminal. '
         'Note: Log files always contain all levels (including DEBUG) for post-analysis. '
         'Use DEBUG for development, INFO for production runs.'
)

# =============================================================================
# 11. MINIWOB BENCHMARK CONFIGURATION (suite_family='miniwob_*')
# =============================================================================
flags.DEFINE_float(
    'miniwob_transition_pause', 0.2,
    help='[MiniWoB only] Pause duration (seconds) between actions. '
         'MiniWoB is lightweight and loads quickly, so short pauses suffice.'
)

flags.DEFINE_string(
    'miniwob_guidelines',
    '- This task is running in a mock app, you MUST STAY IN this app and DO NOT use the `env_op.go_home()` action.\n'
    '- Complete the task by clicking the "Submit" button when ready. Do NOT use env_op.stop() or env_op.answer() as the task will be automatically evaluated after submission.',
    help='[MiniWoB only] Additional task-specific guidelines for the agent.'
)

FLAGS = flags.FLAGS

# =============================================================================
# Import Task Subsets from Configuration
# =============================================================================
# Task lists are now maintained in configs/task_subsets.py for better organization
# Available subsets: TASKS_SUBSET (40 tasks), TASKS_CHOSEN_SUBSET (38 tasks), RAG_TEST_TASKS
from configs.task_subsets import REST_TASKS, TASKS_SUBSET

def set_up_configs(current_time: str):
  ## Android-related info
  os.environ['ADB_PATH'] = os.path.expanduser('~/Library/Android/sdk/platform-tools/adb')
  # os.environ['AVD_PATH'] = '/Users/susu/.android/avd/AndroidWorldAvd.avd/snapshotsa'
  # os.environ['SNAPSHOTS'] = 'snap_2025-01-06_21-14-26' # adb -s emulator-5554 emu avd snapshot list to see real tag name
  
  # Ensure gRPC logs are fully suppressed (set at top of file, re-affirmed here)
  os.environ['GRPC_VERBOSITY'] = 'ERROR'
  os.environ['GRPC_TRACE'] = ''
  os.environ['GLOG_minloglevel'] = '2'
  
  # Configure Python logging
  import logging as py_logging
  
  # Suppress gRPC-related loggers
  py_logging.getLogger('grpc').setLevel(py_logging.CRITICAL)
  py_logging.getLogger('grpc._cython.cygrpc').setLevel(py_logging.CRITICAL)
  py_logging.getLogger('google.auth').setLevel(py_logging.CRITICAL)
  
  # Configure root logger for AutoRPA
  # Set console output level first
  console_log_level = getattr(py_logging, FLAGS.log_level)
  
  # Create console handler (temporary; later replaced by DualOutput)
  console_handler = py_logging.StreamHandler(sys.stdout)
  console_handler.setLevel(console_log_level)
  console_formatter = py_logging.Formatter(
    '%(asctime)s [%(levelname)s] %(name)s - %(message)s',
    datefmt='%H:%M:%S'
  )
  console_handler.setFormatter(console_formatter)
  
  # AutoRPA root logger
  autorpa_logger = py_logging.getLogger('autorpa')
  autorpa_logger.setLevel(py_logging.DEBUG)  # Capture all levels
  autorpa_logger.addHandler(console_handler)
  
  # GUI-agents root logger
  gui_logger = py_logging.getLogger('gui-agents')
  gui_logger.setLevel(py_logging.DEBUG)
  gui_logger.addHandler(console_handler)
  
  ### Create a folder to store intermediate files
  # Determine the path for the log folder
  log_folder = "log"
  os.makedirs(log_folder, exist_ok=True)
  # Each folder stores the intermediate files for one experiment
  if FLAGS.test_rpa_mode:
    FLAGS.log_folder_exp = os.path.join(log_folder, f"test_{current_time}_{FLAGS.default_llm}")
  else:
    FLAGS.log_folder_exp = os.path.join(log_folder, f"{FLAGS.agent_name}_{current_time}_{FLAGS.default_llm}")
  os.makedirs(FLAGS.log_folder_exp, exist_ok=True)
  # Create the full path for the log file
  log_file_name = os.path.join(FLAGS.log_folder_exp, f"output_{current_time}.log")
  
  ### Redirect sys.stdout and register cleanup
  import atexit
  import logging as py_logging
  from autorpa.utils.logging_utils import DualOutput, DualError
  from autorpa.utils.config_validator import validate_flags
  
  dual_output = DualOutput(log_file_name)
  dual_error = DualError(log_file_name)
  
  sys.stdout = dual_output
  sys.stderr = dual_error
  
  # Register cleanup handlers to ensure files are closed on exit
  atexit.register(dual_output.close)
  atexit.register(dual_error.close)
  
  # File handler (log all levels to file)
  file_handler = py_logging.FileHandler(log_file_name)
  file_handler.setLevel(py_logging.DEBUG)  # File records all levels
  file_formatter = py_logging.Formatter(
    '%(asctime)s [%(levelname)s] %(name)s:%(lineno)d - %(message)s',
    datefmt='%Y-%m-%d %H:%M:%S'
  )
  file_handler.setFormatter(file_formatter)
  
  # Add file handler to AutoRPA and GUI agents loggers
  py_logging.getLogger('autorpa').addHandler(file_handler)
  py_logging.getLogger('gui_agents').addHandler(file_handler)
  py_logging.getLogger('main').addHandler(file_handler)
  
  # Print log level info
  if FLAGS.log_level == 'DEBUG':
    print(f"📊 Logging Level: DEBUG (showing all debug messages)")
  else:
    print(f"📊 Logging Level: {FLAGS.log_level} (use --log_level=DEBUG to see debug messages)")
  print(f"📁 Log File: {log_file_name} (contains all levels including DEBUG)")
  print()
  
  # Validate configuration after setup
  validate_flags()


def get_rpa_agent(env_op: EnvOperation):
  """Gets RPA agent with configured LLM models.
  
  Returns:
    Agent_RPA: The core RPA agent instance
  """
  print('Initializing RPA agent...')
  
  # Create main LLM wrapper
  default_llm = get_llm_wrapper(model_name=FLAGS.default_llm, enable_logging=FLAGS.enable_llm_logging)
  
  # Create ActionTranslator LLM wrapper if different model specified
  actiontranslator_llm = None
  if FLAGS.actiontranslator_llm != FLAGS.default_llm:
    print(f'Using ActionTranslator model: {FLAGS.actiontranslator_llm}')
    actiontranslator_llm = get_llm_wrapper(model_name=FLAGS.actiontranslator_llm, enable_logging=FLAGS.enable_llm_logging)
  
  # Create Breakpoint Analyzer LLM wrapper if different model specified
  breakpoint_analyzer_llm = None
  if FLAGS.breakpoint_analyzer_llm != FLAGS.default_llm:
    print(f'Using Breakpoint Analyzer model: {FLAGS.breakpoint_analyzer_llm}')
    breakpoint_analyzer_llm = get_llm_wrapper(model_name=FLAGS.breakpoint_analyzer_llm, enable_logging=FLAGS.enable_llm_logging)
  
  # Create Concluder LLM wrapper if different model specified
  concluder_llm = None
  if FLAGS.concluder_llm != FLAGS.default_llm:
    print(f'Using Concluder model: {FLAGS.concluder_llm}')
    concluder_llm = get_llm_wrapper(model_name=FLAGS.concluder_llm, enable_logging=FLAGS.enable_llm_logging)
  
  # Create Params Extractor LLM wrapper if different model specified
  params_extractor_llm = None
  if FLAGS.params_extractor_llm != FLAGS.default_llm:
    print(f'Using Params Extractor model: {FLAGS.params_extractor_llm}')
    params_extractor_llm = get_llm_wrapper(model_name=FLAGS.params_extractor_llm, enable_logging=FLAGS.enable_llm_logging)
  
  # Create RPA agent with LLM wrappers
  rpa_agent = agent_rpa.Agent_RPA(
    env_op, 
    default_llm,
    actiontranslator_llm=actiontranslator_llm, 
    breakpoint_analyzer_llm=breakpoint_analyzer_llm,
    concluder_llm=concluder_llm,
    params_extractor_llm=params_extractor_llm,
  )
  
  if FLAGS.suite_family and FLAGS.suite_family.startswith('miniwob') and hasattr(rpa_agent, 'set_task_guidelines'):
    rpa_agent.set_task_guidelines(FLAGS.miniwob_guidelines)
  
  if FLAGS.suite_family.startswith('miniwob'):
    # MiniWoB pages change quickly, no need to wait for screen to stabilize.
    rpa_agent.transition_pause = FLAGS.miniwob_transition_pause
  else:
    rpa_agent.transition_pause = None
  
  return rpa_agent


def create_gui_agent(gui_agent_type: str, agent_rpa_instance):
  """
  Create a GUI agent for the exploration phase.
  
  Uses the agent registry for automatic discovery and creation.
  
  Args:
    gui_agent_type: Type of GUI agent ('react_star', 'droidrun', 'askui', etc.)
    agent_rpa_instance: Instance of Agent_RPA (passed to agents that need it)
    
  Returns:
    BaseGUIAgent: GUI agent instance
  """
  from gui_agents import agent_registry
  
  # Prepare agent-specific kwargs
  kwargs = {'agent_rpa': agent_rpa_instance}
  
  # Add type-specific parameters
  if gui_agent_type == 'react_star':
    print('🤖 Creating React* Agent (Planner + Summarizer)')
    
    # Create Planner LLM wrapper
    if FLAGS.planner_llm != FLAGS.default_llm:
      print(f'  Using Planner model: {FLAGS.planner_llm}')
    planner_llm = get_llm_wrapper(model_name=FLAGS.planner_llm, enable_logging=FLAGS.enable_llm_logging)
    
    # Create Summarizer LLM wrapper
    if FLAGS.summarizer_llm != FLAGS.default_llm:
      print(f'  Using Summarizer model: {FLAGS.summarizer_llm}')
    summarizer_llm = get_llm_wrapper(model_name=FLAGS.summarizer_llm, enable_logging=FLAGS.enable_llm_logging)
    
    # Get action_space_mode and ui_info_mode from FLAGS
    from autorpa.run_tasks_gui_agent import infer_react_star_action_space
    action_space_mode = infer_react_star_action_space(
      FLAGS.react_star_action_space,
      FLAGS.react_star_ui_info
    )
    
    # Create ReactStarAgent directly
    from gui_agents.react_star.adapter import ReactStarAgent
    return ReactStarAgent(
      agent=agent_rpa_instance,
      planner_llm=planner_llm,
      summarizer_llm=summarizer_llm,
      action_space_mode=action_space_mode,
      ui_info_mode=FLAGS.react_star_ui_info,
      img_resize_mode=FLAGS.react_star_img_resize_mode,
      enable_shell_action=FLAGS.enable_shell_action
    )
  
  elif gui_agent_type == 'droidrun':
    print('🤖 Creating DroidRun Agent')
    kwargs.update({
      'droidrun_config_path': FLAGS.droidrun_config_path,
      'timeout': FLAGS.droidrun_timeout,
    })
  
  elif gui_agent_type == 'askui':
    print('🤖 Creating AskUI Agent')
    # askui-specific kwargs will be added here
    pass
  
  # Create agent via registry
  try:
    return agent_registry.create(gui_agent_type, **kwargs)
  except ValueError as e:
    available = ', '.join(agent_registry.list_agents())
    raise ValueError(
      f"Unknown gui_agent_type: {gui_agent_type}. "
      f"Available agents: {available}"
    ) from e


def _main(current_time: str) -> None:
  start_time = time.time()
  
  ## create raw_env & env
  raw_env = env_launcher.load_and_setup_env(
    console_port=FLAGS.console_port,
    emulator_setup=False,  # Emulator setup is handled separately, not needed here
    adb_path=FLAGS.adb_path,
  )
  env_op = EnvOperation(raw_env)
  
  # Load banks from data directory
  # In test mode, we must load existing RPAs to test them
  # In normal mode, we don't load (always generate new RPAs)
  project_root = os.path.dirname(os.path.abspath(__file__))
  rpa_bank_path = os.path.join(project_root, 'data', 'rpa_bank.json')
  data_path = os.path.join(project_root, 'data')
  
  rpa_bank = RPABank(
    file_name=rpa_bank_path,
    load_local_bank=FLAGS.test_rpa_mode,  # Only load in test mode
    start_timestamp=current_time  # Use same timestamp as log folder
  )
  react_traj_bank = ReactTrajBank(
    save_path=data_path,  # Use base path to enable config-based separation
    load_local_bank=FLAGS.use_react_trajs_bank,
    start_timestamp=current_time  # Use same timestamp as log folder
  )
  
  if FLAGS.test_rpa_mode:
    FLAGS.tasks = list(rpa_bank.rpa_dict.keys())
  
  ## registry tasks
  if FLAGS.tasks:
    if 'subset' in FLAGS.tasks:
      FLAGS.tasks = TASKS_SUBSET
    elif 'rest' in FLAGS.tasks:
      FLAGS.tasks = REST_TASKS
  task_registry = registry.TaskRegistry()
  task_suite = suite_utils.create_suite(
    task_registry.get_registry(family=FLAGS.suite_family),
    n_task_combinations=max(FLAGS.num_tasks_to_explore, FLAGS.to_test_tasks[-1]) + 1,
    seed=FLAGS.task_random_seed,
    tasks=FLAGS.tasks,
    use_identical_params=FLAGS.fixed_task_seed,
  )
  task_suite.suite_family = FLAGS.suite_family
  
  ## create agent
  rpa_agent = get_rpa_agent(env_op)
  # Action translation is coupled with GUI agent action space, so let Agent_RPA know
  # which gui-agent is selected (react_star / droidrun / askui / ...).
  if hasattr(rpa_agent, "set_gui_agent_type"):
    rpa_agent.set_gui_agent_type(FLAGS.gui_agent_type)
  if FLAGS.agent_name == 'gui-agent': FLAGS.run_react_test_tasks = True
  
  print(f'Starting eval with agent {FLAGS.agent_name}')
  
  # Create GUI Agent for exploration phase (pluggable)
  gui_agent = create_gui_agent(FLAGS.gui_agent_type, rpa_agent)
  
  import json
  # Load task templates from configs directory
  project_root = os.path.dirname(os.path.abspath(__file__))
  config_path = os.path.join(project_root, 'configs', 'androidworld_task_templates.json')
  with open(config_path, 'r', encoding='utf-8') as f:
    data = json.load(f)
  task_templates = {item['task_name']: item['task_template'] for item in data}
  
  # Common parameters for both runners
  common_params = {
    'task_suite': task_suite,
    'env_op': env_op,
    'react_traj_bank': react_traj_bank,
    'task_templates': task_templates,
    'gui_agent': gui_agent,
    'agent': rpa_agent,
  }
  
  # Choose runner and execute based on agent_name
  if FLAGS.agent_name == 'gui-agent':
    # Pure exploration mode - use simplified runner
    from autorpa import run_tasks_gui_agent as run_tasks
    run_tasks.run(**common_params)
  else:
    # Full AutoRPA mode - exploration + building + verification
    from autorpa import run_tasks_rpa as run_tasks
    run_tasks.run(
      **common_params,
      rpa_bank=rpa_bank
    )
  
  print(f'Finished running agent {FLAGS.agent_name} on {FLAGS.suite_family} family.')
  
  spend_time = time.time() - start_time
  hours = math.floor(spend_time / 3600)
  minutes = math.floor((spend_time - hours * 3600) / 60)
  seconds = int(spend_time - hours * 3600 - minutes * 60)
  print(f"Take {hours}hours {minutes}minutes {seconds}seconds.")
  raw_env.close()


def main(argv: Sequence[str]) -> None:
  del argv
    # Get the current time and generate a filename
  current_time = datetime.datetime.now().strftime("%Y-%m-%d_%H-%M-%S")
  set_up_configs(current_time)
  _main(current_time)


if __name__ == '__main__':
  app.run(main)
