"""
Utility functions for React* agent.

Independent utility functions that don't depend on external frameworks.
"""

import json
import os
from typing import List, Dict, Any, Optional

import numpy as np
from PIL import Image
from openai.types.completion_usage import CompletionUsage

# Optional imports
try:
    import cv2
    HAS_CV2 = True
except ImportError:
    HAS_CV2 = False

try:
    import pandas as pd
    HAS_PANDAS = True
except ImportError:
    HAS_PANDAS = False

try:
    from absl.flags import FLAGS
    HAS_FLAGS = True
except ImportError:
    HAS_FLAGS = False


def parse_ui_content(ui_content_str: str) -> List[Dict[str, Any]]:
    """
    Parse UI content string to list of UI elements.
    
    Args:
        ui_content_str: String representation of UI elements
        
    Returns:
        List of UI element dictionaries
    """
    try:
        # Try to parse as JSON
        if ui_content_str.strip().startswith('['):
            return json.loads(ui_content_str)
        
        # Otherwise, parse line by line
        elements = []
        lines = ui_content_str.split('\n')
        
        for line in lines:
            line = line.strip()
            if not line:
                continue
            
            # Try to extract structured information
            element = {"raw_text": line}
            
            # Try to parse as JSON line
            try:
                if line.startswith('{'):
                    element = json.loads(line)
            except:
                pass
            
            elements.append(element)
        
        return elements
    except Exception as e:
        print(f"Warning: Failed to parse UI content: {e}")
        return []


def format_action_history(action_history: List[str]) -> str:
    """
    Format action history for prompting.
    
    Args:
        action_history: List of action strings
        
    Returns:
        Formatted string
    """
    if not action_history:
        return "No previous actions."
    
    formatted = []
    for idx, action in enumerate(action_history, 1):
        formatted.append(f"Step {idx}:\n{action}\n")
    
    return "\n".join(formatted)


def print_with_color(message: Any, color: str) -> None:
    """
    Prints a message to the console with the specified color.
    
    Args:
        message: The message to print. It will be converted to a string if not already.
        color: The color to use for the message. Supported colors are 'red', 'green', 
               'yellow', 'blue', 'magenta', 'cyan', 'white', 'light_gray', 'dark_gray', 
               'light_red', and 'light_green'.
    """
    color_codes = {
        'red': '\033[91m',
        'green': '\033[92m',
        'yellow': '\033[93m',
        'blue': '\033[94m',
        'magenta': '\033[95m',
        'cyan': '\033[96m',
        'white': '\033[37m',
        'light_gray': '\033[37m',
        'dark_gray': '\033[90m',
        'light_red': '\033[91;1m',
        'light_green': '\033[92;1m',
    }
    reset_code = '\033[0m'
    color_code = color_codes.get(color, reset_code)
    print(f"{color_code}{message}{reset_code}")


def write_to_file(file_path: str, file_name: str, content: Any) -> None:
    """
    Write content to a file.
    
    Args:
        file_path: Directory path
        file_name: File name
        content: Content to write
    """
    os.makedirs(file_path, exist_ok=True)
    full_path = os.path.join(file_path, file_name)
    with open(full_path, 'w', encoding="utf-8") as file:
        file.write(str(content))
        file.flush()


def store_image(image_data, image_name: str, file_path: str) -> str:
    """
    Store an image to disk.
    
    Args:
        image_data: Image as numpy ndarray (matches agent_utils.py signature)
        image_name: File name
        file_path: Directory path
        
    Returns:
        Full path to saved image
    """
    os.makedirs(file_path, exist_ok=True)
    image = Image.fromarray(np.uint8(image_data))
    image_path = os.path.join(file_path, image_name)
    image.save(image_path)
    return image_path


def add_screenshot_label(screenshot: np.ndarray, label: str) -> None:
    """
    Add a text label to the right bottom of the screenshot.
    
    Args:
        screenshot: The screenshot as a numpy ndarray (modified in place)
        label: The text label to add, just a single word
    """
    if not HAS_CV2:
        # If cv2 is not available, skip adding label
        return
    
    height, width, _ = screenshot.shape
    screenshot[height - 30: height, width - 150: width, :] = (255, 255, 255)
    cv2.putText(
        screenshot,
        label,
        (width - 120, height - 5),
        cv2.FONT_HERSHEY_SIMPLEX,
        1,
        (0, 0, 0),
        thickness=2,
    )


def extract_action_type(action_code: str) -> str:
    """
    Extract action type from action code.
    
    Args:
        action_code: Action code string
        
    Returns:
        Action type
    """
    action_code_lower = action_code.lower()
    
    action_types = [
        ('click', 'click'),
        ('input_text', 'type'),
        ('type', 'type'),
        ('swipe', 'swipe'),
        ('open_app', 'open_app'),
        ('go_back', 'navigate_back'),
        ('go_home', 'navigate_home'),
        ('wait', 'wait'),
        ('answer', 'answer'),
        ('stop', 'stop'),
        ('shell', 'shell'),
    ]
    
    for keyword, action_type in action_types:
        if keyword in action_code_lower:
            return action_type
    
    return 'unknown'


def extract_action_parameters(action_code: str) -> Dict[str, Any]:
    """
    Extract parameters from action code.
    Supports both index-based and coordinate-based actions.
    
    Args:
        action_code: Action code string
        
    Returns:
        Dictionary of parameters
    """
    import re
    
    params = {}
    
    # Extract text parameter
    text_match = re.search(r'["\']([^"\']+)["\']', action_code)
    if text_match and ('input_text' in action_code or 'answer' in action_code):
        params['text'] = text_match.group(1)
    
    # Extract coordinates for coordinate-based actions
    # Pattern: env_op.click(x, y) or env_op.swipe(start_x, start_y, end_x, end_y)
    coord_pattern = r'\((\d+),\s*(\d+)\)'
    coord_matches = list(re.finditer(coord_pattern, action_code))
    
    if 'click' in action_code.lower() or 'long_press' in action_code.lower():
        # click(x, y) or long_press(x, y)
        if coord_matches:
            params['x'] = int(coord_matches[0].group(1))
            params['y'] = int(coord_matches[0].group(2))
    elif 'swipe' in action_code.lower():
        # Check for coordinate-based swipe: swipe(start_x, start_y, end_x, end_y)
        if len(coord_matches) >= 2:
            # Coordinate-based swipe
            params['start_x'] = int(coord_matches[0].group(1))
            params['start_y'] = int(coord_matches[0].group(2))
            params['end_x'] = int(coord_matches[1].group(1))
            params['end_y'] = int(coord_matches[1].group(2))
        else:
            # Legacy direction-based swipe
            direction_match = re.search(r'["\']([^"\']+)["\']', action_code)
            if direction_match:
                params['direction'] = direction_match.group(1)
    elif 'drag_and_drop' in action_code.lower():
        # Pattern: drag_and_drop(start_index, end_index) or drag_and_drop(start_x, start_y, end_x, end_y)
        if len(coord_matches) >= 2:
            # Coordinate-based drag_and_drop: drag_and_drop(start_x, start_y, end_x, end_y)
            params['start_x'] = int(coord_matches[0].group(1))
            params['start_y'] = int(coord_matches[0].group(2))
            params['end_x'] = int(coord_matches[1].group(1))
            params['end_y'] = int(coord_matches[1].group(2))
        elif len(coord_matches) == 0:
            # Index-based drag_and_drop: drag_and_drop(start_index, end_index)
            index_match = re.search(r'drag_and_drop\(\s*(\d+)\s*,\s*(\d+)', action_code)
            if index_match:
                params['start_index'] = int(index_match.group(1))
                params['end_index'] = int(index_match.group(2))
    elif 'input_text' in action_code.lower():
        # input_text(text, x, y, clear_text) or input_text(text, index, clear_text)
        # First check for coordinates
        if coord_matches and len(coord_matches) >= 1:
            # Check if the second parameter is a coordinate (not index)
            # Pattern: input_text("text", x, y, ...)
            # We need to find all numbers after the text parameter
            numbers = re.findall(r'\d+', action_code)
            if len(numbers) >= 2:
                # Assume first number after text is x, second is y
                # This is a heuristic - may need refinement
                try:
                    # Try to parse as coordinate-based
                    # Look for pattern: input_text("text", x, y
                    after_text = action_code.split('"', 2)[-1] if '"' in action_code else action_code
                    coord_nums = re.findall(r'\d+', after_text)
                    if len(coord_nums) >= 2:
                        params['x'] = int(coord_nums[0])
                        params['y'] = int(coord_nums[1])
                except:
                    pass
    
    # Extract index parameter (for index-based actions)
    if 'index' not in params and 'x' not in params:
        # Only extract index if we haven't already extracted coordinates
        index_match = re.search(r'\((\d+)\)', action_code)
        if index_match:
            params['index'] = int(index_match.group(1))
    
    # Extract clear_text parameter for input_text
    if 'input_text' in action_code.lower():
        if 'clear_text=False' in action_code or 'clear_text=false' in action_code:
            params['clear_text'] = False
        elif 'clear_text=True' in action_code or 'clear_text=true' in action_code:
            params['clear_text'] = True
        # Default is True if not specified
    
    # Extract shell command parameter
    if 'shell' in action_code.lower():
        # Pattern: shell('command') or shell("command")
        shell_match = re.search(r'shell\(["\'](.+?)["\']\)', action_code, re.DOTALL)
        if shell_match:
            params['command'] = shell_match.group(1)
    
    # Extract seconds parameter for wait action
    if 'wait' in action_code.lower():
        # Pattern: wait(seconds) or wait(2.5) or env_op.wait(seconds=1.0)
        wait_match = re.search(r'wait\([^)]*?(?:seconds\s*=\s*)?([\d.]+)', action_code)
        if wait_match:
            params['seconds'] = float(wait_match.group(1))
    
    return params


def record_cost_tokens(record_token: Any) -> None:
    """
    Record token usage for cost tracking.
    
    Args:
        record_token: Token record object (should have file_path, task_type, etc.)
    """
    # Ensure the file_path exists
    os.makedirs(record_token.file_path, exist_ok=True)
    
    # File name and full path
    file_name = 'step_tokens.csv'
    full_file_path = os.path.join(record_token.file_path, file_name)
    
    # Initialize the table. If the file does not exist, create it
    if not os.path.exists(full_file_path):
        columns = ['Task Type', 'Task Num', 'Attempt', 'Stage', 'Step', 'Agent', 'Input', 'Output', 'Total', 'Cached', "LLM"]
        table = pd.DataFrame(columns=columns)
        table.to_csv(full_file_path, index=False)
    else:
        # If the file exists, load the table
        table = pd.read_csv(full_file_path)
    
    if isinstance(record_token.step_tokens, CompletionUsage):
        input_tokens = record_token.step_tokens.prompt_tokens
        output_tokens = record_token.step_tokens.completion_tokens
        total_tokens = record_token.step_tokens.total_tokens
        cached_tokens = record_token.step_tokens.prompt_tokens_details.cached_tokens if record_token.step_tokens.prompt_tokens_details else 0
    else:
        input_tokens = record_token.step_tokens.input_tokens
        output_tokens = record_token.step_tokens.output_tokens
        total_tokens = input_tokens + output_tokens
        cached_tokens = record_token.step_tokens.cache_creation_input_tokens + record_token.step_tokens.cache_read_input_tokens

    # Add a new row as a DataFrame
    new_row = pd.DataFrame([{
        'Task Type': record_token.task_type,
        'Task Num': record_token.task_num,
        'Attempt': str(FLAGS.cur_attempt_cnt),
        # 'Round': record_token.round,
        'Stage': record_token.stage,
        'Step': record_token.step,
        'Agent': record_token.agent,
        'Input': input_tokens,
        'Output': output_tokens,
        'Total': total_tokens,
        'Cached': cached_tokens,
        'LLM': record_token.llm,
    }])
    
    # Use pd.concat to combine the old table and the new row
    table = pd.concat([table, new_row], ignore_index=True)
    
    # Save the updated table to the file
    table.to_csv(full_file_path, index=False)

