from __future__ import annotations

import datetime
import hashlib
import json
import logging
import os
import random
import re
import shlex
import subprocess
import time
import traceback
from dataclasses import dataclass, field
from pathlib import Path, PurePath
from typing import Any

import gymnasium as gym
import yaml
from ghapi.all import GhApi
from git import Repo
from simple_parsing.helpers.serialization.serializable import FrozenSerializable
from swebench.harness.constants import MAP_REPO_VERSION_TO_SPECS
from swebench.harness.utils import get_environment_yml, get_requirements

import docker
import docker.errors
import docker.models.containers
from sweagent import REPO_ROOT
from sweagent.agent.interactive_commands import (
    INTERACTIVE_SESSIONS_CONFIG,
    InteractiveSession,
    InteractiveSessionConfig,
    get_interactive_commands,
    get_interactive_session,
)
from sweagent.environment.utils import (
    PROCESS_DONE_MARKER_END,
    PROCESS_DONE_MARKER_START,
    InvalidGithubURL,
    NoOutputTimeoutError,
    PatchFormatter,
    attach_network_interface_to_container,
    copy_anything_to_container,
    copy_file_to_container,
    format_trajectory_markdown,
    get_container,
    get_docker_compose,
    get_gh_issue_data,
    get_instances,
    image_exists,
    parse_gh_issue_url,
    read_with_timeout,
    read_with_timeout_experimental,
    terminate_docker_compose,
)
from sweagent.types import AgentInfo
from sweagent.utils.config import keys_config
from sweagent.utils.log import default_logger, get_logger
from sweagent.environment.flag_exceptions import EXCEPTION_FLAGS

LONG_TIMEOUT = float(keys_config.get("SWE_AGENT_ENV_LONG_TIMEOUT", 60))
AGENT_ACTION_TIMEOUT = float(keys_config.get("SWE_AGENT_ACTION_TIMEOUT", 30))  # Changed from 60 seconds to 30 seconds
AGENT_ACTION_NO_OUTPUT_TIMEOUT = float(keys_config.get("SWE_AGENT_ACTION_NO_OUTPUT_TIMEOUT", 15))
PATH_TO_REQS = "/root/requirements.txt"
PATH_TO_ENV_YML = "/root/environment.yml"


@dataclass(frozen=True)
class EnvironmentArguments(FrozenSerializable):
    """Configure data sources and setup instructions for the environment in which we solve the tasks."""

    # Source of issue statement/problem statement. To run over a batch of issues: Path to a data file
    # (`json`, `jsonl`) or directory. To run over single issue: github issue url or path to markdown file
    # with problem statement or problem statement as text prefixed with `text://`.
    data_path: str
    # Name of the docker image to use for the environment. Defaults to sweagent/swe-agent:latest
    image_name: str = "sweagent/swe-agent:latest"
    # When running over SWE-bench issues: Specify the split to use.
    split: str = "dev"
    # Specify a branch name or a commit hash to checkout before running the task.
    # Only used when running over a single problem statement/issue.
    base_commit: str | None = None
    # Use a persistent container with this name. After every task, the container will be paused, but not removed.
    # This is useful for speedup when running multiple tasks from the same repositories in a row, as the repositories
    # will have already been cloned and the conda environments will have been installed.
    container_name: str | None = None
    # Try to install the environment before running the task.
    install_environment: bool = True
    # No effect, kept for backwards compatibility.
    timeout: int | None = None
    # Enable environment logger.
    verbose: bool = False
    # Do not use attempt to use a repository mirror from https://github.com/swe-bench.
    no_mirror: bool = False
    # Cache task images to speed up task initialization. This means that the environment will be saved as a
    # docker image for every repository, base commit, and setup combination. This uses quite a bit of disk space
    # but speeds up task initialization significantly when running over multiple issues from the same repository
    # (or using different models for the same issues).
    cache_task_images: bool = False
    # Custom environment setup. Currently only used when data_path points to a single issue.
    # This needs to be either a string pointing to a yaml file (with yaml, yml file extension)
    # or a shell script (with sh extension).
    # See https://princeton-nlp.github.io/SWE-agent/usage/cl_tutorial#environment-setup
    environment_setup: str | None = None
    # Only used when running on single issue. Path to local repository or github repository.
    repo_path: str = ""
    # Interactive command configuration
    interactive_sessions_config: dict[str, InteractiveSessionConfig] = field(
        default_factory=lambda: INTERACTIVE_SESSIONS_CONFIG
    )
    # Container mounts - additional folders to mount into the environment (useful for caching)
    container_mounts: list[str] = field(default_factory=list)
    # CTF mode flag
    ctf: bool = True
    # Counter to track request count
    request_counter: int = 0
    # Model name
    model_name: str = "unknown"
    # Problem name
    problem_name: str = ""

    def __post_init__(self):
        if self.timeout is not None:
            default_logger.warning("The 'timeout' argument is deprecated and has no effect.")
        if self.cache_task_images and self.container_name:
            msg = (
                "Not allowed to use persistent container with caching task images "
                "(probably doesn't make sense and takes excessive space)."
            )
            raise ValueError(msg)
        if self.container_name is not None and self.container_name.strip() == "":
            msg = "Set container_name to None if you don't want to use a persistent container."
            raise ValueError(msg)


class EnvHook:
    """Hook to be used in `SWEEnv`.

    Subclass this class, add functionality and add it with `SWEEEnv.add_hook(hook)`.
    This allows to inject custom functionality at different stages of the environment
    lifecycle, in particular to connect SWE-agent to a new interface (like a GUI).
    """

    def on_init(self) -> None:
        """Gets called when the hook is added"""

    def on_copy_repo_started(self, *, repo_type: str, repo_path: str) -> None:
        """Gets called when the repository is being cloned to the container

        Args:
            repo_type: Type of repository. Either 'local' or 'github'
            repo_path: Path to the repository
        """

    def on_install_env_started(self) -> None:
        """Called when we start installing the environment"""

    def on_close(self):
        """Called when the environment is closed"""


class SWEEnv(gym.Env):
    """Gym environment for SWE-bench. This class should handle all communication with the docker container."""

    name = "swe_main"
    # This prefix will be prepended to the image name when caching task images
    cached_image_prefix = "swe-agent-task-env-"

    def __init__(self, args: EnvironmentArguments):
        """Initialize environment with arguments."""
        t0 = time.perf_counter()  # Initialization start time
        self.args = args
        self.install_environment = args.install_environment
        
        # System logger
        self.logger = get_logger("SWEEnv")
        self.logger.setLevel(logging.DEBUG)
        
        # Agent logger setup
        self.agent_logger = logging.getLogger("agent_communication")
        self.agent_logger.setLevel(logging.INFO)
        
        # Add special handler to agent logger
        agent_handler = logging.StreamHandler()
        agent_formatter = logging.Formatter('\n🤖 %(message)s\n')  # More visible format
        agent_handler.setFormatter(agent_formatter)
        
        # Add file handler
        log_dir = Path("agent_logs")
        log_dir.mkdir(exist_ok=True)
        current_time = datetime.datetime.now().strftime("%Y%m%d_%H%M%S")
        
        # Get problem name (use problem_name if available, otherwise empty string)
        problem_name = getattr(self.args, 'problem_name', '') or ''
        if problem_name:
            # Remove characters that cannot be used in filenames from problem name
            safe_problem_name = "".join(c for c in problem_name if c.isalnum() or c in ('-', '_')).rstrip()
            base_filename = f"{self.args.model_name}_{safe_problem_name}_agent_communication"
        else:
            base_filename = f"{self.args.model_name}_agent_communication"
        
        # If file already exists, add number to create new one
        counter = 1
        log_file = log_dir / f"{base_filename}_{counter}.log"
        while log_file.exists():
            log_file = log_dir / f"{base_filename}_{counter}.log"
            counter += 1
        
        file_handler = logging.FileHandler(log_file)
        file_formatter = logging.Formatter('%(asctime)s - %(message)s')
        file_handler.setFormatter(file_formatter)
        
        # Handler setup
        self.agent_logger.handlers = [agent_handler, file_handler]
        
        # Add attribute to store Agent reference
        self.current_agent = None
        
        self.persistent = args.container_name is not None
        self.container_mounts = args.container_mounts
        self.returncode: None | int = None
        self.image_name = args.image_name
        self.ctf = args.ctf

        #: The commit hash of the swe-agent repository
        self.commit_sha = None
        try:
            repo = Repo(REPO_ROOT, search_parent_directories=True)
            self.commit_sha = repo.head.object.hexsha
        except KeyboardInterrupt:
            raise
        except Exception as e:
            self.logger.exception("Failed to get commit hash for this repo: %s", str(e))

        self._github_token: str = keys_config.get("GITHUB_TOKEN", "")  # type: ignore

        # Load Task Instances
        self.data_path = self.args.data_path
        if not self.data_path:
            # No challenge information
            self.data = []
            self.challenge = None
        else:
            # Use existing JSON file
            self.data = get_instances(
                self.data_path,
                self.args.base_commit,
                self.args.split,
                token=self._github_token,
                repo_path=self.args.repo_path,
            )
            self.challenge = None

        #: Instance we're currently processing. Gets set in self.reset.
        self.record: dict[str, Any] | None = None
        self.logger.info(f"Loaded dataset from {self.data_path}")

        # Initialize container
        self.container: subprocess.Popen | None = None
        self.container_obj = None
        self.container_name = None
        self.docker_compose: Path | None = None
        self._reset_container()

        self.interactive_session: InteractiveSession | None = None

        self.idx = 0
        self.clean_multi_line_functions = lambda x: x
        self.hooks: list[EnvHook] = []

        # Add request counter as class attribute
        self.request_counter = 0

        # Add CTF mode attributes
        self.done = False  # Challenge completion status
        self.submission = None  # Submitted content
        self.submission_valid = False  # Submission validity
        self.total_reward = 0  # Total reward

        # Interactive sessions configuration.
        self.interactive_sessions: dict[str, InteractiveSession] = {}
        self.interactive_sessions_config = args.interactive_sessions_config
        
        # Container mounts
        self.container_mounts = args.container_mounts

        self._image_name = args.image_name
        
        # Skip repo cloning for CTF mode if needed
        if args.ctf or not args.data_path:
            self.ctf = True
            self.query = args.data_path
        else:
            self.ctf = False
            file_path = Path(args.data_path)
            # We assume web-based paths (e.g. GitHub URLs) are not local.
            is_local = file_path.exists() and file_path.is_file()
            if is_local:
                file_content = file_path.read_text()
            elif args.data_path.startswith("text://"):
                file_content = args.data_path.replace("text://", "")
                is_local = True
            else:
                file_content = ""
            if is_local:
                logger.info("Loading content from local")
                try:
                    self.data = self._prepare_data(file_content)
                except Exception as e:
                    logger.exception("Error loading data from local file")
                    msg = "Preparing data failed"
                    raise RuntimeError(msg) from e

        # Note: Some of the below can't be executed in the constructor because we haven't
        # parsed the docker-compose path yet.
        self.repo = None
        try:
            self._reset_container()
        except RuntimeError as e:
            logger.exception("Failed to initialize container")
            self.container = None
            raise e

        # Log initialization completion time
        self.logger.debug("Environment initialization took %.2f seconds", time.perf_counter() - t0)

    def _get_cached_task_image_name(self) -> str:
        assert self.record is not None
        inputs: list[str] = [
            self.record["repo"],
            self.record["base_commit"],
            self.args.environment_setup or "no_setup",
        ]
        tag = hashlib.sha256("".join(inputs).encode()).hexdigest()[:50]
        return f"{self.cached_image_prefix}{tag}"

    def add_hook(self, hook: EnvHook):
        """Add `EnvHook` to the environment.

        This allows to inject custom functionality at different stages of the environment
        lifecycle, in particular to connect SWE-agent to a new interface (like a GUI).
        """
        hook.on_init()
        self.hooks.append(hook)

    @property
    def _repo_name(self) -> str:
        """Name of the local copy of the repository"""
        assert self.record is not None
        return self.record["repo"].replace("/", "__").replace(" ", "-").replace("'", "")

    def _copy_repo(self):
        """Copy repository to container."""
        
        if self.args.ctf:  # Check CTF mode
            # Create ctf_challenge directory
            self.communicate("mkdir -p /ctf_challenge")
            return
            '''
            challenge_dir = Path(self.record["challenge"]["file_path"]).parent
            for file_name in self.record["challenge"].get("files", []):
                file_path = challenge_dir / file_name
                if file_path.exists():
                    self.logger.debug(f"Copying challenge file {file_path} to container")
                    copy_anything_to_container(
                        self.container_obj,
                        str(file_path),
                        "/ctf_challenge/" + file_name,  # Copy inside ctf_challenge directory
                    )
                else:
                    self.logger.warning(f"Challenge file not found: {file_path}")
            return  # Exit here in CTF mode
            '''

        # Existing non-CTF logic
        if not self.record.get("repo"):
            return
        
        # ... existing code ...

    def reset(self, index: int | None = None, apply_test_patch: bool = False) -> tuple[str | None, dict]:
        """
        Function to reset container between each task instance.

        * Clones instance's repository
        * Cleans repository of prior modifications
        * Resets environment variables
        * Check out base commit

        Args:
            index: index of task instance to reset to

        Returns:
            observation: output from container
            info: additional information (e.g. debugging information)
        """
        info = {}
        info["commit_sha"] = self.commit_sha

        # Get task instance
        self.idx = index if index is not None else self.idx
        self.record = self.data[self.idx]
        self.idx += 1

        # Set query, gold command
        self.base_commit = self.record["base_commit"]
        self.query = self.record["problem_statement"]
        self.challenge = self.record.get("challenge")
        self.reward = None

        ### Reset Container ###
        self._init_docker_compose()

        if self.args.cache_task_images:
            cached_image = self._get_cached_task_image_name()
            if image_exists(cached_image):
                self.logger.info(f"Restore environment from cached image {cached_image}")
                self.close()  # stop current container
                self._init_container(cached_image=cached_image)
                self.communicate("export $(xargs </.env)")
                envs = self.communicate("env")
                self.logger.debug(f"Environment variables restored from the image:\n{envs}\n")
                if apply_test_patch:
                    self._apply_test_patch()
                return None, info
            else:
                self.logger.info(f"Cached image {cached_image} not found, rebuilding task environment...")

        # Init docker network
        self._init_docker_network()

        # Clone repository if not already cloned
        self.communicate(input="cd /")
        folders = self.communicate(input="ls").split("\n")
        if self._repo_name not in folders:
            self._copy_repo()

        self._reset_repository()
        self._reset_environment_variables()

        # Set up environment
        self.communicate_with_handling(
            "source /root/miniconda3/etc/profile.d/conda.sh",
            error_msg="Failed to source conda",
        )

        system = self.communicate("uname -s").strip().lower()
        arch = self.communicate("uname -m").strip().lower()
        if system == "linux" and arch == "x86_64":
            self.communicate_with_handling(
                "apt update; apt install build-essential -y",
                error_msg="Failed to install build-essential",
                timeout_duration=LONG_TIMEOUT,
            )

        # Call install environment helper function if specified
        if self.install_environment:
            self.install_env()
        # Install mypy for linting purposes
        self.communicate_with_handling("pip install flake8", error_msg="Failed to install flake8 (lint library)")

        if self.args.cache_task_images:
            envs = self.communicate("env")
            self.logger.debug(f"Environment variables to save:\n{envs}\n")
            self.communicate("env >> /.env")
            assert self.container_obj is not None  # mypy
            self.container_obj.commit(cached_image)
            self.logger.info(f"Container with environment {self.container_obj.id} cached as image {cached_image}")

        if apply_test_patch:
            self._apply_test_patch()
        # Write any metadata to info if necessary
        return None, info

    def _reset_repository(self) -> None:
        """Clean repository of any modifications + Checkout base commit"""
        startup_commands = [
            "echo -n > /root/files_to_edit.txt",
        ]
        
        if not self.args.ctf:  # Only execute git commands when not in CTF mode
            startup_commands.extend([
                f"cd /{self._repo_name}",
                "export ROOT=$(pwd -P)",
                "git status",
                "git restore .",
                f"git reset --hard {self.base_commit}",
                "git clean -fdxq",
            ])
        else:  # Move to ctf_challenge directory in CTF mode
            startup_commands.extend([
                "cd /ctf_challenge",
                "export ROOT=$(pwd -P)",
            ])
        
        self.communicate_with_handling(
            input=" && ".join(startup_commands),
            error_msg="Failed to clean repository",
        )

    def _reset_environment_variables(self) -> None:
        """Reset environment variables (`CURRENT_FILE`) etc. within container"""
        cmd = [
            'export CURRENT_FILE=""',
            "export CURRENT_LINE=0",
            "export SEARCH_RESULTS=()",
            "export SEARCH_FILES=()",
            "export SEARCH_INDEX=0",
        ]
        self.communicate_with_handling(
            input=" && ".join(cmd),
            error_msg="Failed to reset environment variables",
        )

    def reset_for_new_attempt(
        self,
    ) -> None:
        """Compared to `reset`, which prepares the container for a new instance,
        this prepares the container for taking another shot at the same instance.
        """
        self._reset_repository()
        self._reset_environment_variables()

    def _apply_test_patch(self):
        """
        Apply test patch for oracle setting
        """
        assert self.record is not None
        path_to_patch = "test.patch"
        with open(path_to_patch, "w") as f:
            f.write(self.record["test_patch"])
        subprocess.run(
            f"docker cp {path_to_patch} {self.container_name}:/root/test.patch",
            shell=True,
            check=False,
        )
        self.communicate_with_handling(
            input="git apply /root/test.patch",
            error_msg="Failed to apply test patch correctly",
        )
        os.remove(path_to_patch)

    def _get_edited_files_with_context(self, patch: str) -> dict[str, str]:
        """Get the edited files with context from the patch"""
        pf = PatchFormatter(patch, read_method=self.read_file) if patch else None
        out = {}
        for context_length in [30, 50, 70]:
            value = "Empty. No edited files found."
            if pf is not None:
                value = pf.get_files_str(original=False, context_length=context_length)
            out[f"edited_files{context_length}"] = value
        return out

    def _terminate_interactive_session(self, session_name: str):
        """
        Terminates an interactive session.
        """
        if session_name not in self.interactive_sessions:
            return
        session = self.interactive_sessions[session_name]
        session.terminate()
        del self.interactive_sessions[session_name]

    def is_interactive_command(self, action: str) -> bool:
        """
        Check if the given action is an interactive command.
        
        Args:
            action: The command to check
            
        Returns:
            True if the action is an interactive command, False otherwise
        """
        # Command is not a string, return False
        if not isinstance(action, str):
            return False
            
        # Normalize command
        normalized_action = action.strip()
        
        # Check command pattern
        # Example: "start_session session_name" or "terminate_session session_name"
        if normalized_action.startswith("start_session "):
            return True
        if normalized_action.startswith("terminate_session "):
            return True
        if normalized_action.startswith("send_to_session "):
            return True
            
        return False

    def _handle_interactive_commands(self, observation: str) -> str:
        """Handle interactive commands in the environment, essentially substituting dummy
        output for the actual output of the interactive commands.

        Args:
            observation: Output from running the interactive command wrappers in the
                environment. They will returns some dummy output that will be caught and then
                we will run the actual commands in the interactive session and return the
                actual output.

        Returns:
            observation: The observation shown to the model. If no interactive commands
                are detected, this is the same as the input observation.
                Else, only the output from the interactive commands is returned.
        """
        session_name, interactive_commands = get_interactive_commands(observation, logger=self.logger)
        if session_name is None:
            return observation
        if (
            session_name is not None
            and self.interactive_session is not None
            and self.interactive_session.name != session_name
        ):
            return self.interactive_session._get_only_one_interactive_error_message_observation()

        observation = ""
        for command in interactive_commands:
            if command == "START":
                # Start the session if previous session does not exist
                if self.interactive_session is not None:
                    return self.interactive_session._get_only_one_interactive_error_message_observation()
                assert self.container_name is not None
                _observation, self.interactive_session = get_interactive_session(
                    ctr_name=self.container_name,
                    ctr_obj=self.container_obj,
                    cwd="/" + self._repo_name,
                    session_name=session_name,
                    config=self.args.interactive_sessions_config[session_name],
                    logger=self.logger,
                )
                observation += _observation
            elif command == "STOP":
                if self.interactive_session is None:
                    observation = f"Interactive session {session_name!r} is not running, so it cannot be stopped!"
                else:
                    if self.interactive_session.session_process.poll() is None:
                        self.logger.warning("Session did not quit successfully, terminating.")
                        self.interactive_session.session_process.terminate()
                    observation = f"Interactive session {session_name!r} stopped successfully"
                    self.interactive_session = None
            else:
                if self.interactive_session is None:
                    self.logger.warning("Tried to run interactive commands without starting session")
                    start_command = self.args.interactive_sessions_config[session_name].start_command
                    observation = f"Interactive session {session_name!r} is not running! please start it first using `{start_command}`"
                elif self.interactive_session and self.interactive_session.session_process.poll() is not None:
                    start_command = self.args.interactive_sessions_config[session_name].start_command
                    observation = f"Interactive session {session_name!r} was unexpectedly closed! Please start it again using `{start_command}`"
                    self._terminate_interactive_session(session_name=session_name)
                else:
                    _observation, terminate = self.interactive_session.communicate_with_handling(
                        command,
                        timeout_duration=AGENT_ACTION_TIMEOUT,
                        no_output_timeout_duration=AGENT_ACTION_NO_OUTPUT_TIMEOUT,
                    )
                    observation += _observation
                    if terminate:
                        self._terminate_interactive_session(session_name=session_name)
                    observation += "\n"
        return observation

    def step(self, action: str) -> tuple[str | None, int, bool, AgentInfo]:
        """Take a step in the environment.

        Args:
            action: The command to run.

        Returns:
            tuple of (observation, reward, done, info)
        """
        try:
            # Agent action logging - add separator
            self.agent_logger.info("="*50)
            try:
                # Sanitize action to prevent markup errors
                sanitized_action = str(action).replace('[', '\\[').replace(']', '\\]')
                self.agent_logger.info(f"💬 Agent Action:\n{sanitized_action}")
            except Exception as e:
                # Fallback logging if sanitization fails
                self.agent_logger.warning("Failed to log action due to markup error: %s", str(e))
                self.agent_logger.info("💬 Agent Action: [Action logging failed due to special characters]")
            
            # Log agent's complete response information (including thought process)
            if self.current_agent and hasattr(self.current_agent, 'history') and self.current_agent.history:
                try:
                    # Find assistant response from agent's recent history for logging
                    recent_history = self.current_agent.history
                    if recent_history and len(recent_history) > 0:
                        # Find most recent assistant response
                        for item in reversed(recent_history):
                            if item.get("role") == "assistant":
                                thought = item.get("thought", "")
                                action = item.get("action", "")
                                content = item.get("content", "")
                                
                                full_response = f"💭 THOUGHT:\n{thought}\n\n🎬 ACTION:\n{action}\n\n📝 RAW OUTPUT:\n{content}"
                                try:
                                    # Sanitize full response to prevent markup errors
                                    sanitized_full_response = str(full_response).replace('[', '\\[').replace(']', '\\]')
                                    self.agent_logger.info(f"🧠 Agent Full Response:\n{sanitized_full_response}")
                                except Exception as e:
                                    # Fallback logging if sanitization fails
                                    self.agent_logger.warning("Failed to log full response due to markup error: %s", str(e))
                                    self.agent_logger.info("🧠 Agent Full Response: [Full response logging failed due to special characters]")
                                break
                        else:
                            # If assistant response not found
                            self.agent_logger.info("📝 Agent Response Info: No recent assistant response found")
                    else:
                        self.agent_logger.info("📝 Agent Response Info: No history available")
                except Exception as e:
                    self.agent_logger.warning(f"Failed to get agent full response: {e}")
            else:
                # If no agent reference
                self.agent_logger.info("📝 Agent Response Info: No agent reference available")
            
            # Success message pattern check function
            def check_success_message(text: str) -> bool:
                import json
                import re
                
                if text is None or not isinstance(text, str):
                    return False
                    
                try:
                    # 1. Complete JSON response case
                    json_data = json.loads(text.strip())
                    if (isinstance(json_data, dict) and 
                        json_data.get("success") is True and 
                        isinstance(json_data.get("message"), str) and 
                        "[CORRECT]" in json_data.get("message", "")):
                        self.agent_logger.info("✅ Success message found: %s", json_data)
                        return True
                except json.JSONDecodeError:
                    pass
                    
                # 2. JSON format string included in response case
                json_pattern = r'{"success"\s*:\s*true\s*,\s*"message"\s*:\s*"\[CORRECT\][^"]*"}'
                json_matches = re.search(json_pattern, text)
                
                if json_matches:
                    self.agent_logger.info("✅ Success message found: %s", json_matches.group(0))
                    return True
                    
                # 3. Special case: clear success message
                exact_pattern = r'\[CORRECT\].*?(success)'
                if re.search(exact_pattern, text, re.IGNORECASE):
                    self.agent_logger.info("✅ Clear success pattern found")
                    return True
                    
                return False
                
            # Return None if already completed
            if self.done:
                self.agent_logger.info("🔄 Already completed")
                return None, 0, True, {"status": "done"}
                
            # Handle special exit commands
            if isinstance(action, str) and action.strip() in {
                "exit_cost", "exit_error", "exit_context", "exit_format", "exit_api", "exit_forfeit"
            }:
                self.agent_logger.info(f"🛑 Exit command detected: {action}")
                import sys
                from rich.console import Console
                from rich.panel import Panel
                
                console = Console()
                exit_message = Panel.fit(
                    f"🛑 Exit command detected: {action}. Terminating program.",
                    title="EXIT",
                    border_style="yellow"
                )
                console.print(exit_message)
                
                # Clean up environment more thoroughly
                try:
                    self.logger.info("🔄 Beginning environment shutdown for exit command...")
                    
                    # Interactive sessions finish
                    if hasattr(self, 'interactive_session') and self.interactive_session is not None:
                        try:
                            self._terminate_interactive_session(self.interactive_session.name)
                            self.logger.info("✅ Interactive session terminated")
                        except Exception as e:
                            self.logger.warning(f"Failed to terminate interactive session: {e}")
                    
                    # Container finish
                    if self.container is not None:
                        try:
                            self.communicate(input="exit", timeout_duration=10)
                            self.logger.info("✅ Container exit command sent")
                        except Exception as e:
                            self.logger.warning(f"Failed to send exit command to container: {e}")
                        
                        try:
                            # Container force finish
                            self.container.terminate()
                            self.container.wait(timeout=10)
                            self.logger.info("✅ Container terminated")
                        except Exception as e:
                            self.logger.warning(f"Failed to terminate container: {e}")
                            try:
                                self.container.kill()
                                self.logger.info("✅ Container killed")
                            except Exception as kill_error:
                                self.logger.warning(f"Failed to kill container: {kill_error}")
                    
                    # Docker compose finish
                    if self.docker_compose is not None:
                        try:
                            terminate_docker_compose(self.docker_compose)
                            self.logger.info("✅ Docker compose terminated")
                        except Exception as e:
                            self.logger.warning(f"Failed to terminate docker compose: {e}")
                    
                    self.logger.info("✅ Environment shutdown completed")
                    
                except Exception as e:
                    self.logger.error(f"Error during environment shutdown: {e}")
                
                # Return exit status
                agent_info: AgentInfo = {
                    "status": "exit",
                    "exit_status": action,
                    "submission": self.submission,
                    "submission_valid": self.submission_valid
                }
                
                # Raise SystemExit exception so that run.py can handle it appropriately
                raise SystemExit(0)
                
            # Execute command
            observation = None
            if self.is_interactive_command(action):
                observation = self._handle_interactive_commands(action)
                '''
                elif action.startswith("submit"):
                    if self.done:
                        self.agent_logger.info("🔄 Already completed. Not resubmitting.")
                        return None, 0, True, {"status": "already_done"}
                    
                    self.submission = self.get_submission(action)
                    self.submission_valid = self.validate_submission(self.submission or "")
                    
                    if self.submission_valid:
                        self.agent_logger.info("✅ Submission successful!")
                        self.total_reward += 1
                        self.done = True
                        observation = "Submission valid!"
                        return observation, 1, True, {"status": "success"}
                    else:
                        self.agent_logger.error("❌ Invalid submission or extraction pattern")
                        observation = "Invalid submission. No patch could be extracted."
                '''
            else:
                try:
                    # Special handling for edit commands
                    timeout_duration = 60  # Change default timeout to 60 seconds
                    no_output_timeout_duration = 60  # Define no_output_timeout_duration
                    
                    if action.strip().startswith("edit"):
                        timeout_duration = 60  # Edit commands use 60 second timeout
                        no_output_timeout_duration = 60
                        self.logger.info("Edit command detected in step method, using extended timeout")
                        
                        # Process edit command line by line
                        lines = action.split('\n')
                        if len(lines) > 1:
                            # Convert edit command to here-document syntax
                            self.logger.info(f"Processing multi-line edit command with {len(lines)} lines")
                            
                            # Extract edit command from first line
                            first_line = lines[0]
                            if first_line.startswith("edit "):
                                # Add here-document syntax to edit command
                                edit_cmd = first_line + " << end_of_edit"
                                
                                # Collect remaining lines (excluding end_of_edit)
                                content_lines = []
                                for line in lines[1:]:
                                    if line.strip() == "end_of_edit":
                                        break
                                    content_lines.append(line)
                                
                                # Compose full command
                                full_command = edit_cmd + "\n" + "\n".join(content_lines) + "\nend_of_edit"
                                
                                self.logger.info(f"Converted edit command to here-document format")
                                
                                # Send full command at once
                                try:
                                    observation = self.communicate_with_handling(
                                        full_command, "Error executing edit command", 
                                        timeout_duration=timeout_duration,
                                        redact_command_trace="AUTH_TOKEN" in action
                                    )
                                except Exception as e:
                                    self.logger.warning(f"Edit command failed: {e}")
                                    # Attempt container recovery
                                    try:
                                        self.logger.info("Attempting container recovery after edit command failure...")
                                        if self._check_and_recover_container():
                                            self.logger.info("Container recovered, retrying edit command...")
                                            observation = self.communicate_with_handling(
                                                full_command, "Error executing edit command (retry)", 
                                                timeout_duration=timeout_duration,
                                                redact_command_trace="AUTH_TOKEN" in action
                                            )
                                        else:
                                            observation = f"Edit command failed and container recovery failed: {e}"
                                    except Exception as recovery_error:
                                        self.logger.error(f"Container recovery failed: {recovery_error}")
                                        observation = f"Edit command failed: {e}"
                                
                                # Return error messages as-is even if command returns error
                                if self.returncode != 0:
                                    self.logger.warning(f"Error executing the edit command: {observation}")
                                    return f"Error executing the edit command: {observation}", 0, False, {"status": "error"}
                                
                                return observation, 0, False, {"status": "success"}
                            else:
                                # Use existing method if not edit command
                                if "end_of_edit" not in action:
                                    action = action + "\nend_of_edit"
                                    self.logger.info("Automatically added 'end_of_edit' to multi-line edit command")
                                
                                # Send full command at once
                                try:
                                    observation = self.communicate_with_handling(
                                        action, "Error executing edit command", 
                                        timeout_duration=timeout_duration,
                                        redact_command_trace="AUTH_TOKEN" in action
                                    )
                                except Exception as e:
                                    self.logger.warning(f"Edit command failed: {e}")
                                    observation = f"Edit command failed: {e}"
                                
                                # Return error messages as-is even if command returns error
                                if self.returncode != 0:
                                    self.logger.warning(f"Error executing the edit command: {observation}")
                                    return f"Error executing the edit command: {observation}", 0, False, {"status": "error"}
                                
                                return observation, 0, False, {"status": "success"}
                        else:
                            # Use existing method for single-line edit commands
                            if "end_of_edit" not in action:
                                action = action + "\nend_of_edit"
                                self.logger.info("Automatically added 'end_of_edit' to single-line edit command in step method")
                    
                    try:
                        observation = self.communicate_with_handling(
                            action, "Error executing the command", 
                            timeout_duration=timeout_duration,
                            redact_command_trace="AUTH_TOKEN" in action
                        )
                    except Exception as e:
                        self.logger.error(f"Unexpected error in step method during command execution: {e}")
                        self.logger.error(traceback.format_exc())
                        
                        # Check if this is a timeout error, bash script error, unicode error, or file not found error
                        is_timeout_error = isinstance(e, (TimeoutError, NoOutputTimeoutError)) or "TIMEOUT" in str(e)
                        is_bash_error = "here-document" in str(e) or "EOF" in str(e) or "bash:" in str(e)
                        is_unicode_error = isinstance(e, UnicodeError) or "non-unicode" in str(e) or "unicode" in str(e)
                        is_file_not_found = "No such file or directory" in str(e) or "Errno 2" in str(e) or "can't open file" in str(e)
                        
                        # Attempt container recovery - handle different error types appropriately
                        try:
                            if self.container and self.container.poll() is not None:
                                self.logger.warning("Container has exited due to error, attempting recovery...")
                                try:
                                    self.container.stdin.write("echo 'container_exit_recovery'\n")
                                    self.container.stdin.flush()
                                    time.sleep(0.1)
                                except Exception:
                                    self.logger.warning("Failed to recover from container exit, may need restart")
                            elif is_timeout_error:
                                # For timeout errors, don't restart if container is still alive
                                self.logger.info("Container is still alive after timeout, continuing without restart...")
                                # Try to restore shell prompt by sending a simple command
                                try:
                                    self.container.stdin.write("echo 'timeout_recovery'\n")
                                    self.container.stdin.flush()
                                    time.sleep(0.1)
                                except Exception:
                                    self.logger.warning("Failed to restore shell prompt after timeout")
                            elif is_bash_error:
                                # For bash script errors, try to recover without container restart
                                self.logger.warning("Bash script error detected, attempting recovery without container restart...")
                                try:
                                    self.container.stdin.write("echo 'bash_error_recovery'\n")
                                    self.container.stdin.flush()
                                    time.sleep(0.1)
                                except Exception:
                                    self.logger.warning("Failed to recover from bash error, container may need restart")
                            elif is_unicode_error:
                                # For unicode errors, try to recover without container restart
                                self.logger.warning("Unicode error detected, attempting recovery without container restart...")
                                try:
                                    self.container.stdin.write("echo 'unicode_error_recovery'\n")
                                    self.container.stdin.flush()
                                    time.sleep(0.1)
                                except Exception:
                                    self.logger.warning("Failed to recover from unicode error, container may need restart")
                            elif is_file_not_found:
                                # For file not found errors, try to recover without container restart
                                self.logger.warning("File not found error detected, attempting recovery without container restart...")
                                try:
                                    self.container.stdin.write("echo 'file_not_found_recovery'\n")
                                    self.container.stdin.flush()
                                    time.sleep(0.1)
                                except Exception:
                                    self.logger.warning("Failed to recover from file not found error, container may need restart")
                            else:
                                # For other errors, try to recover without container restart
                                self.logger.warning("Container error detected, attempting recovery without container restart...")
                                try:
                                    self.container.stdin.write("echo 'general_error_recovery'\n")
                                    self.container.stdin.flush()
                                    time.sleep(0.1)
                                except Exception:
                                    self.logger.warning("Failed to recover from general error, container may need restart")
                        except Exception as recovery_error:
                            self.logger.error(f"Container recovery failed: {recovery_error}")
                        
                        # Return appropriate error message
                        if is_timeout_error:
                            timeout_type = "no_output" if isinstance(e, NoOutputTimeoutError) else "total"
                            observation = f"TIMEOUT: {timeout_type.upper()} TIMEOUT OCCURRED - PLEASE TRY A DIFFERENT APPROACH OR SHORTER COMMAND"
                        elif is_bash_error:
                            observation = f"BASH SCRIPT ERROR: {str(e)}. Attempting recovery without container restart. Please try again."
                        elif is_unicode_error:
                            observation = f"UNICODE ERROR: {str(e)}. Attempting recovery without container restart. Please try again."
                        elif is_file_not_found:
                            observation = f"FILE NOT FOUND ERROR: {str(e)}. Attempting recovery without container restart. Please try again."
                        else:
                            # Return clear error message for other exceptions
                            error_message = f"ERROR: UNEXPECTED ERROR OCCURRED - {str(e)}"
                            error_message += "\nPLEASE TRY A DIFFERENT APPROACH"
                            observation = error_message
                except Exception as e:
                    # Handle unexpected errors
                    self.logger.error(f"Unexpected error in step method: {e}")
                    self.logger.error(traceback.format_exc())
                    
                    # Check if this is a timeout error, bash script error, unicode error, or file not found error
                    is_timeout_error = isinstance(e, (TimeoutError, NoOutputTimeoutError)) or "TIMEOUT" in str(e)
                    is_bash_error = "here-document" in str(e) or "EOF" in str(e) or "bash:" in str(e)
                    is_unicode_error = isinstance(e, UnicodeError) or "non-unicode" in str(e) or "unicode" in str(e)
                    is_file_not_found = "No such file or directory" in str(e) or "Errno 2" in str(e) or "can't open file" in str(e)
                    
                    # Attempt container recovery - only restart if container has actually exited or it's not a timeout
                    try:
                        if self.container and self.container.poll() is not None:
                            self.logger.warning("Container has exited due to error, attempting recovery...")
                            try:
                                self.container.stdin.write("echo 'container_exit_recovery'\n")
                                self.container.stdin.flush()
                                time.sleep(0.1)
                            except Exception:
                                self.logger.warning("Failed to recover from container exit, may need restart")
                        elif is_timeout_error:
                            # For timeout errors, don't restart if container is still alive
                            self.logger.info("Container is still alive after timeout, continuing without restart...")
                            # Try to restore shell prompt by sending a simple command
                            try:
                                self.container.stdin.write("echo 'timeout_recovery'\n")
                                self.container.stdin.flush()
                                time.sleep(0.1)
                            except Exception:
                                self.logger.warning("Failed to restore shell prompt after timeout")
                        elif is_bash_error or is_unicode_error or is_file_not_found:
                            # For bash script, unicode, or file not found errors, try to recover without container restart
                            if is_bash_error:
                                error_type = "Bash script"
                                recovery_cmd = "echo 'bash_error_recovery'\n"
                            elif is_unicode_error:
                                error_type = "Unicode"
                                recovery_cmd = "echo 'unicode_error_recovery'\n"
                            else:
                                error_type = "File not found"
                                recovery_cmd = "echo 'file_not_found_recovery'\n"
                            self.logger.warning(f"{error_type} error detected, attempting recovery without container restart...")
                            try:
                                self.container.stdin.write(recovery_cmd)
                                self.container.stdin.flush()
                                time.sleep(0.1)
                            except Exception:
                                self.logger.warning(f"Failed to recover from {error_type.lower()} error, container may need restart")
                        else:
                            # For other errors, try to recover without container restart
                            self.logger.warning("Container error detected, attempting recovery without container restart...")
                            try:
                                self.container.stdin.write("echo 'general_error_recovery'\n")
                                self.container.stdin.flush()
                                time.sleep(0.1)
                            except Exception:
                                self.logger.warning("Failed to recover from general error, container may need restart")
                    except Exception as recovery_error:
                        self.logger.error(f"Container recovery failed: {recovery_error}")
                    
                    # Return appropriate error message
                    if is_timeout_error:
                        timeout_type = "no_output" if isinstance(e, NoOutputTimeoutError) else "total"
                        observation = f"TIMEOUT: {timeout_type.upper()} TIMEOUT OCCURRED - PLEASE TRY A DIFFERENT APPROACH OR SHORTER COMMAND"
                    elif is_bash_error:
                        observation = f"BASH SCRIPT ERROR: {str(e)}. Attempting recovery without container restart. Please try again."
                    elif is_unicode_error:
                        observation = f"UNICODE ERROR: {str(e)}. Attempting recovery without container restart. Please try again."
                    elif is_file_not_found:
                        observation = f"FILE NOT FOUND ERROR: {str(e)}. Attempting recovery without container restart. Please try again."
                    else:
                        observation = f"Unexpected error occurred: {str(e)}. Attempting recovery without container restart. Please try again."
                    
                    agent_info: AgentInfo = {
                        "status": "error",
                        "submission": self.submission,
                        "submission_valid": self.submission_valid,
                        "error": str(e)
                    }
                    
                    return observation, 0, False, agent_info
                
                # Check if success message exists
                if observation and check_success_message(observation):
                    self.agent_logger.info("🎉 Found the answer! Exiting program.")
                    import sys
                    from rich.console import Console
                    from rich.panel import Panel
                    
                    console = Console()
                    success_message = Panel.fit(
                        "🎉��🎉 Found the answer! Exit the program. 🎉🎉🎉",
                        title="SUCCESS",
                        border_style="green"
                    )
                    console.print(success_message)
                    self.close()
                    sys.exit(0)
            
            # Agent response logging - add separator
            if observation:
                self.agent_logger.info("-"*50)
                try:
                    # Sanitize observation to prevent markup errors
                    sanitized_observation = str(observation).replace('[', '\\[').replace(']', '\\]')
                    self.agent_logger.info(f"🤖 Agent Response:\n{sanitized_observation}")
                except Exception as e:
                    # Fallback logging if sanitization fails
                    self.agent_logger.warning("Failed to log observation due to markup error: %s", str(e))
                    self.agent_logger.info("🤖 Agent Response: [Observation logging failed due to special characters]")
                self.agent_logger.info("="*50 + "\n")
            
            # Compose Agent info
            agent_info: AgentInfo = {
                "status": "running",
                "submission": self.submission,
                "submission_valid": self.submission_valid,
            }
            
            return observation, 0, False, agent_info
            
        except Exception as e:
            # Handle unexpected errors
            self.logger.error(f"Unexpected error in step method: {e}")
            self.logger.error(traceback.format_exc())
            
            # Check if this is a timeout error
            is_timeout_error = isinstance(e, (TimeoutError, NoOutputTimeoutError)) or "TIMEOUT" in str(e)
            
            # Attempt container recovery - only restart if container has actually exited or it's not a timeout
            try:
                if self.container and self.container.poll() is not None:
                    self.logger.warning("Container has exited due to error, attempting restart...")
                    self.reset_container()
                elif not is_timeout_error:
                    # Force restart if container is alive but unresponsive (only for non-timeout errors)
                    self.logger.warning("Container is unresponsive due to error, forcing restart...")
                    self.reset_container()
                else:
                    # For timeout errors, don't restart if container is still alive
                    self.logger.info("Container is still alive after timeout, continuing without restart...")
                    # Try to restore shell prompt by sending a simple command
                    try:
                        self.container.stdin.write("echo 'timeout_recovery'\n")
                        self.container.stdin.flush()
                        time.sleep(0.1)
                    except Exception:
                        self.logger.warning("Failed to restore shell prompt after timeout")
            except Exception as recovery_error:
                self.logger.error(f"Container recovery failed: {recovery_error}")
            
            # Return appropriate error message
            if is_timeout_error:
                timeout_type = "no_output" if isinstance(e, NoOutputTimeoutError) else "total"
                observation = f"TIMEOUT: {timeout_type.upper()} TIMEOUT OCCURRED - PLEASE TRY A DIFFERENT APPROACH OR SHORTER COMMAND"
            else:
                observation = f"Unexpected error occurred: {str(e)}. Container has been restarted. Please try again."
            
            agent_info: AgentInfo = {
                "status": "error",
                "submission": self.submission,
                "submission_valid": self.submission_valid,
                "error": str(e)
            }
            
            return observation, 0, False, agent_info

    def close(self) -> None:
        """Close the environment and clean up resources."""
        self.logger.info("Beginning environment shutdown...")
        
        try:
            # Terminate interactive sessions
            if hasattr(self, 'interactive_session') and self.interactive_session is not None:
                try:
                    self._terminate_interactive_session(self.interactive_session.name)
                    self.logger.info("✅ Interactive session terminated")
                except Exception as e:
                    self.logger.warning(f"Failed to terminate interactive session: {e}")
            
            # Terminate container
            if self.container is not None:
                try:
                    # First execute exit command inside container
                    self.communicate(input="exit", timeout_duration=10)
                    self.logger.info("✅ Container exit command sent")
                except Exception as e:
                    self.logger.warning(f"Failed to send exit command to container: {e}")
                
                try:
                    # Force terminate container
                    self.container.terminate()
                    self.container.wait(timeout=10)
                    self.logger.info("✅ Container terminated")
                except Exception as e:
                    self.logger.warning(f"Failed to terminate container: {e}")
                    try:
                        self.container.kill()
                        self.logger.info("✅ Container killed")
                    except Exception as kill_error:
                        self.logger.warning(f"Failed to kill container: {kill_error}")
            
            # Terminate Docker compose
            if self.docker_compose is not None:
                try:
                    terminate_docker_compose(self.docker_compose)
                    self.logger.info("✅ Docker compose terminated")
                except Exception as e:
                    self.logger.warning(f"Failed to terminate docker compose: {e}")
                    
        except Exception as e:
            self.logger.warning(f"Errors when exiting container\n{traceback.format_exc()}")
        finally:
            # Final cleanup
            if self.container is not None:
                try:
                    if self.container.poll() is None:
                        self.container.terminate()
                        self.container.wait(timeout=5)
                except Exception:
                    pass
                    
            if self.docker_compose is not None:
                try:
                    terminate_docker_compose(self.docker_compose)
                except Exception:
                    pass
                    
            self.logger.info("Environment shutdown complete")

    # MARK: Helper functions #

    def _backup_ctf_data(self) -> str | None:
        """Backup CTF challenges data before container reset"""
        if not self.ctf or self.container_obj is None or self.container_name is None:
            return None
            
        try:
            # Create backup directory on host
            backup_dir = f"/tmp/ctf_backup_{int(time.time())}"
            os.makedirs(backup_dir, exist_ok=True)
            
            # Copy important directories from container to host
            self.logger.info(f"🔄 Backing up important data to {backup_dir}")
            
            import subprocess
            
            # List of important directories to backup
            important_dirs = [
                "/ctf_challenges",
            ]
            
            backup_success = False
            for dir_path in important_dirs:
                try:
                    # Check if directory exists in container
                    check_result = subprocess.run([
                        "docker", "exec", self.container_name, "test", "-d", dir_path
                    ], capture_output=True, text=True)
                    
                    if check_result.returncode == 0:
                        # Directory exists, backup it
                        result = subprocess.run([
                            "docker", "cp", f"{self.container_name}:{dir_path}", backup_dir
                        ], capture_output=True, text=True)
                        
                        if result.returncode == 0:
                            self.logger.info(f"✅ Backed up {dir_path}")
                            backup_success = True
                        else:
                            self.logger.warning(f"⚠️ Failed to backup {dir_path}: {result.stderr}")
                    else:
                        self.logger.debug(f"📁 Directory {dir_path} does not exist, skipping")
                        
                except Exception as dir_error:
                    self.logger.warning(f"⚠️ Error backing up {dir_path}: {dir_error}")
            
            if backup_success:
                self.logger.info(f"✅ Important data backed up successfully to {backup_dir}")
                return backup_dir
            else:
                self.logger.warning("⚠️ No data was successfully backed up")
                return None
                
        except Exception as e:
            self.logger.error(f"❌ Error backing up data: {e}")
            return None

    def _restore_ctf_data(self, backup_dir: str | None) -> None:
        """Restore important data after container reset"""
        if not self.ctf or backup_dir is None or self.container_obj is None or self.container_name is None:
            return
            
        try:
            self.logger.info(f"🔄 Restoring important data from {backup_dir}")
            
            import subprocess
            
            # List of important directories to restore
            important_dirs = [
                "ctf_challenges",
            ]
            
            restore_success = False
            for dir_name in important_dirs:
                backup_path = os.path.join(backup_dir, dir_name)
                if os.path.exists(backup_path):
                    try:
                        # Determine the target path in container
                        if dir_name == "ctf_challenges":
                            target_path = "/"
                            
                        result = subprocess.run([
                            "docker", "cp", backup_path, f"{self.container_name}:{target_path}"
                        ], capture_output=True, text=True)
                        
                        if result.returncode == 0:
                            self.logger.info(f"✅ Restored {dir_name}")
                            restore_success = True
                        else:
                            self.logger.warning(f"⚠️ Failed to restore {dir_name}: {result.stderr}")
                            
                    except Exception as dir_error:
                        self.logger.warning(f"⚠️ Error restoring {dir_name}: {dir_error}")
                else:
                    self.logger.debug(f"📁 Backup for {dir_name} not found, skipping")
            
            if restore_success:
                self.logger.info("✅ Important data restored successfully")
                
                # Set proper permissions for restored files
                try:
                    for dir_name in important_dirs:
                        if dir_name == "ctf_challenges":
                            target_path = "/ctf_challenges"
                            
                        # Set permissions recursively
                        subprocess.run([
                            "docker", "exec", self.container_name, "chmod", "-R", "755", target_path
                        ], capture_output=True, text=True)
                        
                        # Set ownership to root
                        subprocess.run([
                            "docker", "exec", self.container_name, "chown", "-R", "root:root", target_path
                        ], capture_output=True, text=True)
                        
                except Exception as perm_error:
                    self.logger.warning(f"⚠️ Failed to set permissions: {perm_error}")
                
                # Verify critical directories exist
                try:
                    critical_dirs = ["/ctf_challenges"]
                    for critical_dir in critical_dirs:
                        check_result = subprocess.run([
                            "docker", "exec", self.container_name, "test", "-d", critical_dir
                        ], capture_output=True, text=True)
                        
                        if check_result.returncode == 0:
                            self.logger.info(f"✅ Verified {critical_dir} exists")
                        else:
                            self.logger.warning(f"⚠️ Critical directory {critical_dir} not found after restore")
                            
                except Exception as verify_error:
                    self.logger.warning(f"⚠️ Failed to verify restored directories: {verify_error}")
                
                # Clean up backup directory
                try:
                    import shutil
                    shutil.rmtree(backup_dir)
                    self.logger.info(f"🧹 Cleaned up backup directory {backup_dir}")
                except Exception as cleanup_error:
                    self.logger.warning(f"⚠️ Failed to clean up backup directory: {cleanup_error}")
            else:
                self.logger.warning("⚠️ No data was successfully restored")
                
        except Exception as e:
            self.logger.error(f"❌ Error restoring data: {e}")

    def _reset_container(self) -> None:
        # Backup CTF data before container termination
        backup_dir = self._backup_ctf_data()
        
        if self.container is not None:
            try:
                self.container.terminate()
            except KeyboardInterrupt:
                raise
            except:
                self.logger.warning("Failed to terminate container", exc_info=True)
            else:
                self.logger.debug("Terminated container")
        if self.docker_compose is not None:
            try:
                terminate_docker_compose(self.docker_compose)
            except KeyboardInterrupt:
                raise
            except:
                self.logger.warning("Failed to terminate docker compose", exc_info=True)
            else:
                self.logger.debug("Terminated docker compose")
        
        # Initialize new container
        self._init_container()
        self._init_scripts()
        
        # Restore CTF data after container initialization
        self._restore_ctf_data(backup_dir)

    def reset_container(self) -> None:
        self.close()
        self.container = None
        self.container_obj = None
        self._reset_container()

    @staticmethod
    def _get_container_name(image_name: str) -> str:
        """Return name of container"""
        process_id = str(os.getpid())
        current_time = str(datetime.datetime.now())
        unique_string = current_time + process_id
        hash_object = hashlib.sha256(unique_string.encode())
        image_name_sanitized = image_name.replace("/", "-")
        image_name_sanitized = image_name_sanitized.replace(":", "-")
        return f"{image_name_sanitized}-{hash_object.hexdigest()[:10]}"

    # ctf
    def _init_docker_network(self) -> None:
        """
        Add the "ctfnet" network interface for all the containers used for CTF challenges
        """
        assert self.container_name is not None
        if self.challenge is not None:
            attach_network_interface_to_container(self.container_name)

    # ctf
    def _init_docker_compose(self) -> None:
        """
        Handles docker compose initialization for challenge with docker compose file.
        """
        if self.challenge is not None and self.challenge.get("docker_compose") is not None:
            self.docker_compose = get_docker_compose(self.challenge["docker_compose"])
            self.logger.info("🌱 Initialized docker compose for challenge")

    def _init_container(self, cached_image: str | None = None) -> None:
        """
        Handles container initialization. Defines container name and creates it.
        If cached_image is provided, it will use that image name instead of the default.
        """
        image_name = self.image_name
        if cached_image is not None:
            image_name = cached_image
            self.logger.info(f"Using cached image: {image_name}")
        if self.persistent:
            assert self.container_name is not None
        else:
            # Make sure that we get a new container name just in case removing didn't work.
            # Might be a fix for https://github.com/swe-agent/SWE-agent/issues/451
            self.container_name = self._get_container_name(image_name)
        
        # Try up to 3 times
        max_attempts = 3
        for attempt in range(max_attempts):
            try:
                self.container, self.parent_pids = get_container(
                    self.container_name, image_name, persistent=self.persistent, container_mounts=self.container_mounts
                )
                break
            except (BlockingIOError, OSError) as e:
                if attempt < max_attempts - 1:
                    self.logger.warning(f"IO Error on attempt {attempt+1}/{max_attempts}, retrying: {e}")
                    time.sleep(2 * (attempt + 1))  # Wait progressively longer before retry
                else:
                    self.logger.error(f"Failed to initialize container after {max_attempts} attempts: {e}")
                    raise RuntimeError(f"Container initialization failed: {e}") from e
        
        try:
            client = docker.from_env(timeout=60)
        except docker.errors.DockerException as e:
            if "Error while fetching server API version" in str(e):
                msg = "Docker is not running. Please start Docker and try again."
            else:
                msg = "Unknown docker exception occurred. Are you sure docker is running?"
            raise RuntimeError(msg) from e
        t0 = time.time()
        self.container_obj = None
        while time.time() - t0 < 60:
            try:
                self.container_obj = client.containers.get(self.container_name)
            except docker.errors.NotFound:
                self.logger.debug("Couldn't find container. Let's wait and retry.")
                time.sleep(1)
            else:
                break
        else:
            print(f"{self.persistent=}")
            available_containers = client.containers.list(all=True)
            available_containers_info = json.dumps([str(c.attrs) for c in available_containers], indent=2)
            print(available_containers_info)
            msg = "Failed to get container object."
            raise RuntimeError(msg)
        self.logger.info("🌱 Environment Initialized")

    def _init_scripts(self):
        """
        Initialize custom commands within container
        """
        self.communicate_with_handling(
            "source /root/.bashrc",
            error_msg="Failed to source .bashrc",
        )
        self.communicate_with_handling(
            "mkdir -p /root/commands",
            error_msg="Failed to create commands directory",
        )
        self.communicate_with_handling(
            "touch /root/commands/__init__.py",
            error_msg="Failed to create __init__.py",
        )
        self.communicate_with_handling(
            "export PATH=$PATH:/root/commands",
            error_msg="Failed to add commands directory to PATH",
        )

    def _communicate_experimental(
        self,
        input: str,
        timeout_duration: int | float = 30,  # Changed to 30 seconds
        no_output_timeout_duration: int | float | None = None,  # Allow None for no_output_timeout_duration
    ) -> str:
        """Experimental version of `_communicate`"""
        assert self.container is not None
        # Sleep to ensure that the exit code is in the last line
        # See https://github.com/swe-agent/SWE-agent/issues/595
        command_suffix = (
            f'EXITSTATUS="$?"; sleep 0.01; echo {PROCESS_DONE_MARKER_START}$EXITSTATUS{PROCESS_DONE_MARKER_END}\n'
        )
        try:
            self.returncode = None
            cmd = input if input.endswith("\n") else input + "\n"
            cmd += command_suffix
            os.write(self.container.stdin.fileno(), cmd.encode())  # type: ignore
            time.sleep(0.03)
            self.container.stdin.flush()  # type: ignore
        except BrokenPipeError:
            traceback.print_exc()
            self.logger.error("Failed to communicate with container. Check docker logs for more information.")
            msg = "Failed to communicate with container"
            raise RuntimeError(msg)

        try:
            buffer, exit_code = read_with_timeout_experimental(
                self.container, timeout_duration, no_output_timeout_duration
            )
        except (BlockingIOError, OSError) as e:
            self.logger.error(f"IO Error when reading from container: {e}")
            msg = f"Failed to read from container: {e}"
            raise RuntimeError(msg)
        except (TimeoutError, NoOutputTimeoutError) as e:
            # Terminate only the command when timeout occurs and return clear message
            timeout_type = "no_output" if isinstance(e, NoOutputTimeoutError) else "total"
            self.logger.warning(f"Command {timeout_type} timed out after {timeout_duration} seconds. Attempting to terminate command only...")
            
            try:
                # Terminate only the current command (prevent entire process termination)
                if self.container and self.container.poll() is None:
                    # Send SIGINT (Ctrl+C) signal to terminate command
                    self.container.send_signal(2)  # SIGINT = 2
                    time.sleep(0.5)
                    
                    # Try SIGTERM if still running
                    if self.container.poll() is None:
                        self.container.send_signal(15)  # SIGTERM = 15
                        time.sleep(1)
                    
                    # Finally try SIGKILL if necessary
                    if self.container.poll() is None:
                        self.logger.warning("Force killing command due to timeout")
                        self.container.send_signal(9)  # SIGKILL = 9
                        time.sleep(0.5)
                
                # Read remaining output
                try:
                    remaining_output = read_with_timeout_experimental(
                        self.container, 5, 2
                    )
                    buffer = remaining_output[0]
                    exit_code = remaining_output[1]
                except Exception:
                    buffer = f"\n[COMMAND {timeout_type.upper()} TIMED OUT AFTER {timeout_duration} SECONDS AND WAS TERMINATED]\n"
                    exit_code = "143"  # SIGTERM exit code
                    
            except Exception as interrupt_error:
                self.logger.error(f"Failed to interrupt command: {interrupt_error}")
                buffer = f"\n[COMMAND {timeout_type.upper()} TIMED OUT AFTER {timeout_duration} SECONDS - INTERRUPT FAILED]\n"
                exit_code = "143"
            
            # Check container status after timeout - only restart if container has actually exited
            try:
                if self.container.poll() is not None:
                    self.logger.warning("Container has exited after timeout, attempting recovery...")
                    try:
                        self.container.stdin.write("echo 'timeout_exit_recovery'\n")
                        self.container.stdin.flush()
                        time.sleep(0.1)
                    except Exception:
                        self.logger.warning("Failed to recover from timeout exit, may need restart")
                else:
                    # Continue using if container is still alive - no restart needed
                    self.logger.info("Container is still alive after timeout, continuing without restart...")
                    # Try to restore shell prompt by sending a simple command
                    try:
                        self.container.stdin.write("echo 'timeout_recovery'\n")
                        self.container.stdin.flush()
                        time.sleep(0.1)
                    except Exception:
                        self.logger.warning("Failed to restore shell prompt after timeout")
            except Exception as recovery_error:
                self.logger.error(f"Container recovery after timeout failed: {recovery_error}")
                
            # Send clear TIMEOUT message to AGENT
            timeout_message = f"TIMEOUT: {timeout_type.upper()} TIMEOUT OCCURRED AFTER {timeout_duration} SECONDS"
            if timeout_type == "no_output":
                timeout_message += " - NO OUTPUT WAS PRODUCED"
            else:
                timeout_message += " - COMMAND WAS RUNNING TOO LONG"
            
            timeout_message += "\nPLEASE TRY A DIFFERENT APPROACH OR USE A SHORTER COMMAND"
            
            if buffer and buffer.strip():
                timeout_message += f"\n\nPartial output before timeout:\n{buffer}"
            
            self.logger.info(f"Returning timeout message to agent: {timeout_message}")
            buffer = timeout_message
            exit_code = "143"  # SIGTERM exit code
        except Exception as e:
            # Handle all other exceptions - prevent program termination
            self.logger.error(f"Unexpected error in _communicate_experimental: {e}")
            self.logger.error(traceback.format_exc())
            
            # Attempt container recovery
            try:
                if self.container and self.container.poll() is not None:
                    self.logger.warning("Container has exited due to error, attempting recovery...")
                    try:
                        self.container.stdin.write("echo 'communicate_exit_recovery'\n")
                        self.container.stdin.flush()
                        time.sleep(0.1)
                    except Exception:
                        self.logger.warning("Failed to recover from communicate exit, may need restart")
                else:
                    # Try to recover without container restart
                    self.logger.warning("Container is unresponsive due to error, attempting recovery...")
                    try:
                        self.container.stdin.write("echo 'communicate_unresponsive_recovery'\n")
                        self.container.stdin.flush()
                        time.sleep(0.1)
                    except Exception:
                        self.logger.warning("Failed to recover from communicate unresponsive, may need restart")
            except Exception as recovery_error:
                self.logger.error(f"Container recovery failed: {recovery_error}")
            
            # Send clear error message to agent
            error_message = f"ERROR: UNEXPECTED ERROR OCCURRED - {str(e)}"
            error_message += "\nPLEASE TRY A DIFFERENT APPROACH"
            
            self.logger.info(f"Returning error message to agent: {error_message}")
            buffer = error_message
            exit_code = "1"  # General error exit code

        if not exit_code.isdigit():
            msg = f"Failed to get exit code. Output:\n---\n{buffer}\n---"
            raise RuntimeError(msg)
        self.returncode = int(exit_code)
        return buffer

    def _communicate(
        self,
        input: str,
        timeout_duration: int | float = 30,
        no_output_timeout_duration: int | float | None = None,
        *,
        set_last_action: bool = False,
        redact_command_trace: bool = False,
    ) -> str:
        """Runs command in container and returns output

        Args:
            input: command to run in container
            timeout_duration: duration to wait for output
            no_output_timeout_duration: duration to wait when the process stopped produce any output
        """
        assert self.container is not None
        communicate_method = keys_config.get(
            "SWE_AGENT_COMMUNICATE_METHOD", default="end-marker", choices=["end-marker", "processes"]
        )
        if communicate_method == "end-marker":
            return self._communicate_experimental(input, timeout_duration, no_output_timeout_duration)
        try:
            self.returncode = None
            cmd = input if input.endswith("\n") else input + "\n"
            os.write(self.container.stdin.fileno(), cmd.encode())  # type: ignore
            time.sleep(0.1)
            self.container.stdin.flush()  # type: ignore
        except BrokenPipeError:
            traceback.print_exc()
            self.logger.error("Failed to communicate with container. Check docker logs for more information.")
            msg = "Failed to communicate with container"
            raise RuntimeError(msg)
        try:
            buffer = read_with_timeout(self.container, self.get_pids, timeout_duration)
            self.container.stdin.write("echo $?\n")  # type: ignore
            time.sleep(0.1)
            self.container.stdin.flush()  # type: ignore
            exit_code = read_with_timeout(self.container, self.get_pids, 5).strip()
        except Exception as e:
            self.logger.error(f"Read with timeout failed on input:\n---\n{input}\n---")
            # Only raise exception for non-timeout exceptions
            if not isinstance(e, (TimeoutError, NoOutputTimeoutError)):
                # Prevent program termination for unexpected exceptions
                self.logger.error(f"Unexpected error in _communicate: {e}")
                self.logger.error(traceback.format_exc())
                
                # Attempt container recovery
                try:
                    if self.container and self.container.poll() is not None:
                        self.logger.warning("Container has exited due to error, restarting...")
                        self.reset_container()
                    else:
                        # Force restart if container is alive but unresponsive
                        self.logger.warning("Container is unresponsive due to error, forcing restart...")
                        self.reset_container()
                except Exception as recovery_error:
                    self.logger.error(f"Container recovery failed: {recovery_error}")
                
                # Send clear error message to agent
                error_message = f"ERROR: UNEXPECTED ERROR OCCURRED - {str(e)}"
                error_message += "\nPLEASE TRY A DIFFERENT APPROACH"
                
                self.logger.info(f"Returning error message to agent: {error_message}")
                buffer = error_message
                exit_code = "1"  # General error exit code
                return buffer
                
            # Terminate only the command when timeout occurs and return clear message
            timeout_type = "no_output" if isinstance(e, NoOutputTimeoutError) else "total"
            
            # Attempt to terminate only the timed out command
            try:
                if self.container and self.container.poll() is None:
                    # Send SIGINT (Ctrl+C) signal to terminate command
                    self.container.send_signal(2)  # SIGINT = 2
                    time.sleep(0.5)
                    
                    # Try SIGTERM if still running
                    if self.container.poll() is None:
                        self.container.send_signal(15)  # SIGTERM = 15
                        time.sleep(1)
                    
                    # Finally try SIGKILL if necessary
                    if self.container.poll() is None:
                        self.logger.warning("Force killing command due to timeout")
                        self.container.send_signal(9)  # SIGKILL = 9
                        time.sleep(0.5)
                
                # Read remaining output
                try:
                    remaining_output = read_with_timeout(self.container, self.get_pids, 5)
                    buffer = remaining_output
                except Exception:
                    buffer = ""
                    
            except Exception as interrupt_error:
                self.logger.warning(f"Failed to interrupt timed out command: {interrupt_error}")
                buffer = ""
            
            # Send clear TIMEOUT message to AGENT
            timeout_message = f"TIMEOUT: {timeout_type.upper()} TIMEOUT OCCURRED AFTER {timeout_duration} SECONDS"
            if timeout_type == "no_output":
                timeout_message += " - NO OUTPUT WAS PRODUCED"
            else:
                timeout_message += " - COMMAND WAS RUNNING TOO LONG"
            
            timeout_message += "\nPLEASE TRY A DIFFERENT APPROACH OR USE A SHORTER COMMAND"
            
            if buffer and buffer.strip():
                timeout_message += f"\n\nPartial output before timeout:\n{buffer}"
            
            self.logger.info(f"Returning timeout message to agent: {timeout_message}")
            buffer = timeout_message
            exit_code = "143"  # SIGTERM exit code
        if not exit_code.isdigit():
            msg = f"Failed to get exit code. Output:\n---\n{buffer}\n---"
            raise RuntimeError(msg)
        self.returncode = int(exit_code)
        return buffer

    def _check_syntax(self, input: str) -> tuple[str, bool]:
        """
        Check syntax of command.

        Returns:
            output: Output of the command
            success: whether the exit code was 0
        """
        output = self._communicate(f"/bin/bash -n <<'EOF'\n{input}\nEOF\n")
        return output, self.returncode == 0

    def communicate(
        self,
        input: str,
        timeout_duration: int | float = 30,
        no_output_timeout_duration: int | float | None = None,
        *,
        set_last_action: bool = False,
        redact_command_trace: bool = False,
    ) -> str:
        """
        Sends input to container and returns output

        Args:
            input: input to send to container
            timeout_duration: duration to wait for output
            set_last_action: whether to set the LAST_ACTION environment variable
            redact_command_trace: Whether to redact the command that is being run when logging
                it to trace level
        Returns:
            output: output from container
        """
        assert self.container is not None

        # Special handling for edit commands
        is_edit_command = input.strip().startswith("edit")
        if is_edit_command:
            # Use appropriate timeout for edit commands
            timeout_duration = max(timeout_duration, 30)  # Change minimum to 30 seconds
            no_output_timeout_duration = max(no_output_timeout_duration or timeout_duration, 15)
            self.logger.info(f"Edit command detected in communicate, using extended timeout: {timeout_duration} seconds")
            
            # Add end_of_edit if not present
            if "end_of_edit" not in input:
                input = input + "\nend_of_edit"
                self.logger.info("Automatically added 'end_of_edit' to edit command")
            
            # Process entire edit command at once
            self.logger.info(f"Processing edit command with extended timeout")

        # Add timeout options to curl commands
        if "curl" in input and "http://host.docker.internal" in input:
            input = input.replace("curl", "curl --connect-timeout 10 --max-time 60")

        if no_output_timeout_duration is None:
            no_output_timeout_duration = timeout_duration

        if input.strip() != "exit":
            # Log input command
            self.logger.info("🔄 Agent Command: %s", input)

            if redact_command_trace:
                self.logger.log(logging.TRACE, "Input:\nREDACTED")  # type: ignore
            else:
                self.logger.log(logging.TRACE, "Input:\n%s", input)  # type: ignore
            output, valid = self._check_syntax(input)
            if not valid:
                self.logger.warning("❌ Syntax Error: %s", output)
                return output  # shows syntax errors
            output = self._communicate(
                input,
                timeout_duration=timeout_duration,
                no_output_timeout_duration=no_output_timeout_duration,
            )
            # Log output result - sanitize output to prevent markup errors
            try:
                # Sanitize output to prevent Rich markup errors
                sanitized_output = str(output).replace('[', '\\[').replace(']', '\\]')
                self.logger.info("📝 Agent Response:\n%s", sanitized_output)
                self.logger.log(logging.TRACE, "Output:\n%s", sanitized_output)  # type: ignore
            except Exception as e:
                # Fallback logging if sanitization fails
                self.logger.warning("Failed to log output due to markup error: %s", str(e))
                self.logger.info("📝 Agent Response: [Output logging failed due to special characters]")
                self.logger.log(logging.TRACE, "Output: [Output logging failed due to special characters]")  # type: ignore
            self.communicate_output = output
            if set_last_action:
                # Cannot merge this with last command, because of multiline command
                # handling.
                last_action_string = shlex.quote(input.strip())
                input = f"export LAST_ACTION={last_action_string}"
                self._communicate(input, timeout_duration=5, no_output_timeout_duration=5)
            return output
        else:
            self.container.terminate()
            self.returncode = 0
            self.communicate_output = ""
            return ""

    def _check_and_recover_container(self) -> bool:
        try:
            if self.container is None:
                self.logger.warning("Container is None, reinitializing...")
                try:
                    self._init_container()
                    return True
                except Exception as e:
                    self.logger.error(f"Failed to initialize container: {e}")
                    return False
                
            if self.container.poll() is not None:
                self.logger.warning("Container has exited, attempting recovery...")
                try:
                    self.container.stdin.write("echo 'check_recover_exit_recovery'\n")
                    self.container.stdin.flush()
                    time.sleep(0.1)
                    return True
                except Exception as e:
                    self.logger.error(f"Failed to recover from container exit: {e}")
                    return False
                
                    # Check if container is alive
            try:
                # Check container response with simple command (use shorter timeout)
                test_output = self._communicate("echo 'test'", timeout_duration=3, no_output_timeout_duration=3)
                if "test" in test_output:
                    return True
                else:
                    self.logger.warning("Container is not responding properly, attempting recovery...")
                    try:
                        self.container.stdin.write("echo 'check_recover_unresponsive_recovery'\n")
                        self.container.stdin.flush()
                        time.sleep(0.1)
                        return True
                    except Exception as e:
                        self.logger.error(f"Failed to recover from container unresponsive: {e}")
                        return False
            except Exception as e:
                self.logger.warning(f"Container health check failed: {e}, attempting recovery...")
                try:
                    self.container.stdin.write("echo 'check_recover_health_failed_recovery'\n")
                    self.container.stdin.flush()
                    time.sleep(0.1)
                    return True
                except Exception as recovery_error:
                    self.logger.error(f"Failed to recover from container health check: {recovery_error}")
                    return False
                
        except Exception as e:
            self.logger.error(f"Container recovery failed: {e}")
            return False

    def _safe_communicate(self, input: str, timeout_duration: int | float = 30, no_output_timeout_duration: int | float = None, *, redact_command_trace: bool = False) -> str:
        try:
                    # Set no_output_timeout_duration to timeout_duration if None
            if no_output_timeout_duration is None:
                no_output_timeout_duration = timeout_duration
                
            # Special handling for edit commands
            is_edit_command = input.strip().startswith("edit")
            if is_edit_command:
                # Use appropriate timeout for edit commands
                timeout_duration = max(timeout_duration, 30)  # Change minimum to 30 seconds
                no_output_timeout_duration = max(no_output_timeout_duration, 15)
                self.logger.info(f"Edit command detected in _safe_communicate, using extended timeout: {timeout_duration} seconds")
                
                # Add end_of_edit if not present
                if "end_of_edit" not in input:
                    input = input + "\nend_of_edit"
                    self.logger.info("Automatically added 'end_of_edit' to edit command in _safe_communicate")
                
                # Process entire edit command at once
                self.logger.info(f"Processing edit command with extended timeout in _safe_communicate")
            
            # Check and recover container status
            if not self._check_and_recover_container():
                return f"Error: Container recovery failed. Please try again."
            
            # Call communicate method
            return self.communicate(
                input, 
                timeout_duration=timeout_duration,
                no_output_timeout_duration=no_output_timeout_duration,
                redact_command_trace=redact_command_trace
            )
            
        except Exception as e:
            self.logger.error(f"Unexpected error in _safe_communicate: {e}")
            self.logger.error(traceback.format_exc())
            
            # Check if this is a timeout error
            is_timeout_error = isinstance(e, (TimeoutError, NoOutputTimeoutError)) or "TIMEOUT" in str(e)
            
            # Attempt container recovery - only restart if container has actually exited or it's not a timeout
            try:
                if self.container and self.container.poll() is not None:
                    self.logger.warning("Container has exited due to error, restarting...")
                    self.reset_container()
                elif not is_timeout_error:
                    # Force restart if container is alive but unresponsive (only for non-timeout errors)
                    self.logger.warning("Container is unresponsive due to error, forcing restart...")
                    self.reset_container()
                else:
                    # For timeout errors, don't restart if container is still alive
                    self.logger.info("Container is still alive after timeout, continuing without restart...")
                    # Try to restore shell prompt by sending a simple command
                    try:
                        self.container.stdin.write("echo 'timeout_recovery'\n")
                        self.container.stdin.flush()
                        time.sleep(0.1)
                    except Exception:
                        self.logger.warning("Failed to restore shell prompt after timeout")
            except Exception as recovery_error:
                self.logger.error(f"Container recovery failed: {recovery_error}")
            
            # Send clear error message to agent
            if is_timeout_error:
                timeout_type = "no_output" if isinstance(e, NoOutputTimeoutError) else "total"
                error_message = f"TIMEOUT: {timeout_type.upper()} TIMEOUT OCCURRED - PLEASE TRY A DIFFERENT APPROACH OR SHORTER COMMAND"
            else:
                error_message = f"ERROR: UNEXPECTED ERROR OCCURRED - {str(e)}"
                error_message += "\nPLEASE TRY A DIFFERENT APPROACH"
            
            self.logger.info(f"Returning error message to agent: {error_message}")
            return error_message

    def communicate_with_handling(
        self, input: str, error_msg: str, timeout_duration: int | float = 30, *, redact_command_trace: bool = False
    ) -> str:
        """
        Returns error messages as-is without terminating the program when errors occur.
        This allows the LLM to see error messages and solve problems on its own.
        """
        max_retries = 3  # Reduce retry count (prevent entire process termination)
        retry_delay = 1  # Initial retry wait time (seconds)
        
        # Special handling for edit commands
        is_edit_command = input.strip().startswith("edit")
        if is_edit_command:
            # Use appropriate timeout for edit commands
            timeout_duration = max(timeout_duration, 30)  # Change minimum to 30 seconds
            self.logger.info(f"Edit command detected, using extended timeout: {timeout_duration} seconds")
            
            # Add end_of_edit if not present
            if "end_of_edit" not in input:
                input = input + "\nend_of_edit"
                self.logger.info("Automatically added 'end_of_edit' to edit command in communicate_with_handling")
            
            # Process entire edit command at once
            self.logger.info(f"Processing edit command with extended timeout in communicate_with_handling")
        
        for attempt in range(max_retries):
            try:
                # Use safe communication method
                output = self._safe_communicate(input, timeout_duration=timeout_duration, redact_command_trace=redact_command_trace)
                
                # Return error messages as-is even if command returns error
                if self.returncode != 0:
                    self.logger.warning(f"{error_msg}: {output}")
                    return f"{error_msg}: {output}"
                    
                return output
                
            except TimeoutError as e:
                # Terminate only the command when timeout occurs and send clear message to AGENT
                timeout_type = "no_output" if isinstance(e, NoOutputTimeoutError) else "total"
                timeout_duration_used = timeout_duration
                
                self.logger.warning(f"Command timeout ({timeout_type}) after {timeout_duration_used} seconds: {input}")
                
                # Attempt to terminate only the timed out command (prevent entire process termination)
                try:
                    # Terminate only the current command
                    if self.container and self.container.poll() is None:
                        # Send SIGINT (Ctrl+C) signal to terminate command
                        self.container.send_signal(2)  # SIGINT = 2
                        time.sleep(0.5)
                        
                        # Try SIGTERM if still running
                        if self.container.poll() is None:
                            self.container.send_signal(15)  # SIGTERM = 15
                            time.sleep(1)
                        
                        # Finally try SIGKILL if necessary
                        if self.container.poll() is None:
                            self.logger.warning("Force killing command due to timeout")
                            self.container.send_signal(9)  # SIGKILL = 9
                            time.sleep(0.5)
                    
                    # Read remaining output
                    try:
                        remaining_output = read_with_timeout_experimental(
                            self.container, 5, 2
                        )
                        output = remaining_output[0]
                    except Exception:
                        output = ""
                        
                except Exception as interrupt_error:
                    self.logger.warning(f"Failed to interrupt timed out command: {interrupt_error}")
                    output = ""
                
                # Send clear TIMEOUT message to AGENT
                timeout_message = f"TIMEOUT: {timeout_type.upper()} TIMEOUT OCCURRED AFTER {timeout_duration_used} SECONDS"
                if timeout_type == "no_output":
                    timeout_message += " - NO OUTPUT WAS PRODUCED"
                else:
                    timeout_message += " - COMMAND WAS RUNNING TOO LONG"
                
                timeout_message += f"\nCOMMAND: {input}"
                timeout_message += "\nPLEASE TRY A DIFFERENT APPROACH OR USE A SHORTER COMMAND"
                
                if output:
                    timeout_message += f"\n\nPartial output before timeout:\n{output}"
                
                self.logger.info(f"Returning timeout message to agent: {timeout_message}")
                
                # Check container status after timeout - only restart if container has actually exited
                try:
                    if self.container.poll() is not None:
                        self.logger.warning("Container has exited after timeout, restarting...")
                        self.reset_container()
                    else:
                        # Continue using if container is still alive - no restart needed
                        self.logger.info("Container is still alive after timeout, continuing without restart...")
                        # Try to restore shell prompt by sending a simple command
                        try:
                            self.container.stdin.write("echo 'timeout_recovery'\n")
                            self.container.stdin.flush()
                            time.sleep(0.1)
                        except Exception:
                            self.logger.warning("Failed to restore shell prompt after timeout")
                except Exception as recovery_error:
                    self.logger.error(f"Container recovery after timeout failed: {recovery_error}")
                
                return timeout_message
                        
            except RuntimeError as e:
                # Handle runtime errors
                if attempt < max_retries - 1:
                    self.logger.warning(f"{error_msg}: Runtime error on attempt {attempt + 1}/{max_retries}. Retrying in {retry_delay} seconds... {e}")
                    time.sleep(retry_delay)
                    retry_delay *= 2
                    
                    try:
                        if "reset_after_exception" in str(e):
                            self.container.stdin.write("echo 'reset_container_recovery'\n")
                            self.container.stdin.flush()
                            time.sleep(0.1)
                        else:
                            # Attempt container recovery
                            if self.container and self.container.poll() is not None:
                                self.logger.warning("Container has exited due to error, attempting recovery...")
                                try:
                                    self.container.stdin.write("echo 'reset_container_exit_recovery'\n")
                                    self.container.stdin.flush()
                                    time.sleep(0.1)
                                except Exception:
                                    self.logger.warning("Failed to recover from reset_container exit, may need restart")
                            else:
                                # Try to recover without container restart
                                self.logger.warning("Container is unresponsive due to error, attempting recovery...")
                                try:
                                    self.container.stdin.write("echo 'reset_container_unresponsive_recovery'\n")
                                    self.container.stdin.flush()
                                    time.sleep(0.1)
                                except Exception:
                                    self.logger.warning("Failed to recover from reset_container unresponsive, may need restart")
                    except Exception as reset_error:
                        self.logger.warning(f"Container reset failed: {reset_error}")
                    
                    continue
                else:
                    # Failed even on last attempt
                    self.logger.warning(f"{error_msg}: Runtime error after {max_retries} attempts. {e}")
                    error_message = str(e)
                    cause = getattr(e, "__cause__", None)
                    if cause is not None:
                        error_message += f" caused by {cause}"
                        
                    # Check if container reset is needed
                    reset_after_exception = "reset_after_exception" in error_message
                    output = f"{error_msg}: {error_message}"
                    
                    if reset_after_exception:
                        self.reset_container()
                        
                    return output
                    
            except Exception as e:
                if attempt < max_retries - 1:
                    self.logger.warning(f"{error_msg}: Unexpected error on attempt {attempt + 1}/{max_retries}. Retrying in {retry_delay} seconds... {e}")
                    time.sleep(retry_delay)
                    retry_delay *= 2
                    
                    # Attempt container recovery
                    try:
                        if self.container and self.container.poll() is not None:
                            self.logger.warning("Container has exited due to error, restarting...")
                            self.reset_container()
                        else:
                            # Force restart if container is alive but unresponsive
                            self.logger.warning("Container is unresponsive due to error, forcing restart...")
                            self.reset_container()
                    except Exception as recovery_error:
                        self.logger.warning(f"Container recovery failed: {recovery_error}")
                    
                    continue
                else:
                    # Failed even on last attempt
                    self.logger.warning(f"{error_msg}: Unexpected error after {max_retries} attempts. {e}")
                    self.logger.error(traceback.format_exc())
                    
                    # Return special message for timeout cases
                    if isinstance(e, (TimeoutError, NoOutputTimeoutError)):
                        timeout_type = "no_output" if isinstance(e, NoOutputTimeoutError) else "total"
                        return f"TIMEOUT: {timeout_type.upper()} TIMEOUT OCCURRED - PLEASE TRY A DIFFERENT APPROACH OR SHORTER COMMAND"
                    
                    # Return clear error message for other exceptions
                    error_message = f"ERROR: UNEXPECTED ERROR OCCURRED - {str(e)}"
                    error_message += "\nPLEASE TRY A DIFFERENT APPROACH"
                    
                    self.logger.info(f"Returning error message to agent: {error_message}")
                    return error_message

    def get_available_actions(self) -> list[str]:
        """
        Returns list of available actions in current environment state

        Currently not in use.
        """
        return []

    def get_pids(self, all_pids: bool = False) -> list[tuple[str, str]]:
        """
        Gets list of processes running inside docker container

        Args:
            all_pids: whether to return all pids, or whether to exclude ps
                and parent PIDs

        Returns:
            list of PIDs
        """
        assert self.container_obj is not None
        pids = self.container_obj.exec_run("ps -eo pid,comm,ppid --no-headers").output.decode().split("\n")
        pids = [x.split() for x in pids if x]
        if not all_pids:
            # Get just the PIDs of processes that are descendants of parent_pids and not others
            pids = [
                (x[0], x[1])
                for x in pids
                if x[1] != "ps"
                and x[0] not in self.parent_pids
                and x[1] != getattr(self.interactive_session, "name", None)
                and x[2] in self.parent_pids
            ]
        return pids

    # ctf
    def validate_submission(self, submission: str) -> bool:
        """
        Function to validate submission value for CTF challenge.
        
        Args:
            submission: Extracted submission value
            
        Returns:
            Validates if it follows the defined flag format
        """
        submission = submission.strip()
        
        # Check exception flag list
        if submission in EXCEPTION_FLAGS:
            self.logger.warning(f"Exception flag detected: {submission}")
            return False

        return True

    def get_submission(self, output: str) -> str | None:
        """
        Function for extracting diff patch submission at the end of an episode.

        Args:
            output: `submit` observation

        Returns:
            submission: diff patch submission
        """
        pattern = r"\<\<SUBMISSION\|\|(.*)\|\|SUBMISSION\>\>"
        match = re.search(pattern, output, re.DOTALL)
        if match is None:
            return None
        return match.group(1)

    def run_shell_script(self, script_path: Path, *, location: str) -> None:
        """Run custom script supplied by user at `script_path`

        Args:
            script_path: path to script file
            location: location of script file 'host' or 'container'
        """
        if location == "host":
            return self._run_shell_script_host(script_path)
        elif location == "container":
            raise NotImplementedError
        msg = f"Invalid 'location': {location}"
        raise ValueError(msg)

    def _run_shell_script_host(self, script_path: Path) -> None:
        """Run shell script file (located on host) in container"""
        if not script_path.is_file():
            msg = f"Script not found at {script_path}"
            raise FileNotFoundError(msg)
        shell_commands = Path(script_path).read_text().splitlines(keepends=True)
        for i, cmd in enumerate(shell_commands):
            self.communicate_with_handling(
                cmd,
                error_msg=f"Failed to execute line {i}.",
                timeout_duration=LONG_TIMEOUT,
            )

    def _get_install_configs(self) -> dict | None:
        """Return config for environment setup"""
        assert self.record is not None  # mypy
        if (
            self.record["problem_statement_source"] != "swe-bench" or self.record["repo_type"] == "local"
        ) and self.args.environment_setup is None:
            self.logger.warning(
                "install_environment is set to True, but the data path is a GitHub URL "
                "without an environment config file (environment_config key/flag). "
                "Skipping conda environment installation.",
            )
            return None
        if self.args.environment_setup is not None:
            assert isinstance(self.args.environment_setup, (str, os.PathLike))
            if Path(self.args.environment_setup).suffix in [".yml", ".yaml"]:
                try:
                    return yaml.safe_load(Path(self.args.environment_setup).read_text())
                except Exception as e:
                    msg = "Environment config file needs to be a yaml file"
                    raise ValueError(msg) from e
            elif Path(self.args.environment_setup).suffix == ".sh":
                return {
                    "shell_script_path": self.args.environment_setup,
                }
            else:
                msg = "Environment config file needs to be a yaml file or shell script"
                raise ValueError(msg)
        else:
            try:
                return MAP_REPO_VERSION_TO_SPECS[self.record["repo"]][str(self.record["version"])]
            except KeyError as e:
                msg = (
                    "Tried to look up install configs in swe-bench, but failed. "
                    "You can set a custom environment config with the environment_config key/flag."
                )
                raise ValueError(msg) from e

    def _conda_environment_exists(self, env_name: str) -> bool:
        env_check = self.communicate(f"conda env list | grep {env_name}", timeout_duration=LONG_TIMEOUT)
        return env_check.strip() != ""

    def install_env(self) -> None:
        """
        Creates conda environment and installs third party dependencies to allow code execution
        """
        t0 = time.perf_counter()
        for hook in self.hooks:
            hook.on_install_env_started()
        install_configs = self._get_install_configs()
        if not install_configs:
            return
        if "shell_script_path" in install_configs:
            assert len(install_configs) == 1
            self.run_shell_script(Path(install_configs["shell_script_path"]), location="host")
            return
        assert self.record is not None  # mypy
        # Create environment if does not exist yet
        env_name = f"{self._repo_name}__{self.record['version']}"
        if not self._conda_environment_exists(env_name):
            self.logger.info(f"{env_name} conda env not found, creating...")
            packages = install_configs.get("packages", "")
            if packages == "requirements.txt":
                # Create conda environment
                self.communicate_with_handling(
                    f"conda create -n {env_name} python={install_configs['python']} -y",
                    error_msg="Failed to create conda environment",
                    timeout_duration=LONG_TIMEOUT,
                )
                self.logger.debug("Created conda environment")
                # Write reqs to requirements.txt in docker container
                content_reqs = get_requirements(self.record)
                copy_file_to_container(self.container_obj, content_reqs, PATH_TO_REQS)
                # Create conda environment + install reqs
                self.communicate_with_handling(
                    f"conda activate {env_name}",
                    error_msg="Failed to activate conda environment",
                )
                self.communicate_with_handling(
                    f"pip install -r {PATH_TO_REQS}",
                    error_msg="Failed to install requirements.txt",
                    timeout_duration=LONG_TIMEOUT,
                )
                self.logger.debug("Installed requirements from requirements.txt")
                self.communicate(f"rm {PATH_TO_REQS}")
            elif packages == "environment.yml":
                # Write environment.yml to file
                content_env_yml = get_environment_yml(self.record, env_name)
                # Hotfix for
                if not install_configs.get("no_use_env"):
                    content_env_yml += f'\n  - python={install_configs["python"]}\n'
                copy_file_to_container(self.container_obj, content_env_yml, PATH_TO_ENV_YML)
                if install_configs.get("no_use_env"):
                    # Create conda environment
                    self.communicate_with_handling(
                        f"conda create -c conda-forge -n {env_name} python={install_configs['python']} -y",
                        error_msg="Failed to create conda environment",
                        timeout_duration=LONG_TIMEOUT,
                    )
                    self.logger.debug("Created conda environment")
                    # Install packages
                    self.communicate_with_handling(
                        f"conda env update -f {PATH_TO_ENV_YML}",
                        error_msg="Failed to install environment.yml",
                        timeout_duration=LONG_TIMEOUT,
                    )
                    self.logger.debug("Installed packages from environment.yml")
                else:
                    # Create environment + install packages
                    self.communicate_with_handling(
                        f"conda env create --file {PATH_TO_ENV_YML}",
                        error_msg="Failed to create conda environment with environment.yml",
                        timeout_duration=LONG_TIMEOUT,
                    )
                    self.logger.debug("Created conda environment with environment.yml")
                self.communicate(f"rm {PATH_TO_ENV_YML}")
            else:
                python_env = f"python{install_configs['python']}"
                if self._conda_environment_exists(python_env):
                    self.communicate_with_handling(
                        f"conda create --name {env_name} --clone {python_env}",
                        error_msg="Failed to clone conda environment",
                        timeout_duration=LONG_TIMEOUT,
                    )
                    self.logger.debug("Cloned python conda environment")
                else:
                    self.logger.debug(f"Could not find {python_env}, creating new environment")
                    self.communicate_with_handling(
                        f"conda create -n {env_name} python={install_configs['python']} -y",
                        error_msg="Failed to create conda environment",
                        timeout_duration=LONG_TIMEOUT,
                    )
                self.communicate_with_handling(
                    f"conda activate {env_name}",
                    error_msg="Failed to activate conda environment",
                )
                if packages.strip():
                    self.communicate_with_handling(
                        f"conda install {packages} -y",
                        error_msg="Failed to install packages",
                        timeout_duration=LONG_TIMEOUT,
                    )
                    self.logger.debug("Installed conda packages")
            # Install extra pip packages if specified
            if install_configs.get("pip_packages"):
                self.communicate_with_handling(
                    f"source activate {env_name} && pip install {' '.join(install_configs['pip_packages'])}",
                    error_msg="Failed to install pip packages",
                    timeout_duration=LONG_TIMEOUT,
                )
                self.logger.debug("Installed extra pip dependencies")

        # Activate environment
        self.communicate_with_handling(f"conda activate {env_name}", error_msg="Failed to activate conda environment")

        # Install repo at base commit
        if install_configs.get("pre_install"):
            self.logger.info("Running pre-install commands...")
            for pre_install_cmd in install_configs["pre_install"]:
                self.communicate_with_handling(
                    pre_install_cmd,
                    error_msg="Pre-install commands failed to execute successfully",
                    timeout_duration=LONG_TIMEOUT,
                )
            self.logger.debug("Ran pre-install commands")
        self.logger.info(f"Installing {self._repo_name} at base commit...")
        if install_configs.get("install"):
            install_cmd = install_configs["install"]
            self.communicate_with_handling(
                install_cmd,
                error_msg="Install command failed to execute successfully",
                timeout_duration=LONG_TIMEOUT,
            )
            self.logger.debug("Ran install command")
        if install_configs.get("post_install"):
            self.logger.info("Running post-install commands...")
            for post_install_cmd in install_configs["post_install"]:
                self.communicate_with_handling(
                    post_install_cmd,
                    error_msg="Post-install commands failed to execute successfully",
                )
            self.logger.debug("Ran post-install commands")

        self.logger.info("Installation step took %.2f seconds", time.perf_counter() - t0)

    def add_commands(self, commands: list[dict]) -> None:
        """
        Adds custom commands to container
        """
        for command in commands:
            name = command["name"]
            contents = command["contents"]
            copy_file_to_container(self.container_obj, contents, f"/root/commands/{name}")
            if command["type"] == "source_file":
                self.communicate_with_handling(
                    f"source /root/commands/{name}",
                    error_msg=(
                        f"Failed to source {name}. If you meant to make a script,"
                        " start the file with a shebang (e.g. #!/usr/bin/env python)."
                    ),
                )
            elif command["type"] == "script":
                self.communicate_with_handling(
                    f"chmod +x /root/commands/{name}",
                    error_msg=f"Failed to chmod {name}",
                )
            elif command["type"] == "utility":
                # nothing to do for utility scripts
                pass
            else:
                msg = f"Invalid command type: {command['type']}"
                raise ValueError(msg)

        try:
            keys_path = Path(REPO_ROOT) / "keys.cfg"
            if keys_path.exists():
                with open(keys_path, "r") as f:
                    keys_content = f.read()
                copy_file_to_container(
                    self.container_obj,
                    keys_content, 
                    "/root/commands/keys.cfg"
                )
            else:
                self.logger.warning("can not found keys.cfg")
        except Exception as e:
            self.logger.warning(f"fail to copy keys.cfg : {str(e)}")

    def interrupt(self) -> str:
        """
        Send interrupt signal to container and exhaust stdout buffer with a communicate call
        """
        assert self.container is not None
        assert self.container_obj is not None
        pids = self.get_pids()
        for pid, _ in pids:
            # Sending signal several times ensures that the process is dead
            for _ in range(3):
                self.container_obj.exec_run(f"kill -9 {pid}")
        observation = ""
        try:
            observation += read_with_timeout(self.container, self.get_pids, 20)
        except TimeoutError:
            pass
        try:
            # This is a workaround because of bash behaviour
            # when sometimes we get the prints of Killed after we press some "Enter" in stdin
            self.communicate(input="echo 'interrupted'", timeout_duration=5)
            output = self.communicate(input="echo 'interrupted'", timeout_duration=5)
            assert output.strip().endswith("interrupted"), "container health check failed"
        except TimeoutError:
            msg = "Failed to interrupt container"
            raise RuntimeError(msg)
        return observation

    def open_pr(self, *, trajectory, _dry_run: bool = False) -> None:
        """Create PR to repository

        Args:
            trajectory: Trajectory of actions taken by the agent
            _dry_run: Whether to actually push anything or just simulate it
        """
        self.logger.info("Opening PR")
        # TODO: have better way of handling this
        # Adding random string suffix to avoid name conflicts if we had a previously failed run
        issue_url = self.args.data_path
        try:
            issue = get_gh_issue_data(issue_url, token=self._github_token)
        except InvalidGithubURL as e:
            msg = "Data path must be a github issue URL if --open_pr is set."
            raise ValueError(msg) from e
        branch_name = f"swe-agent-fix-#{issue.number}-" + str(random.random())[2:10]

        self.communicate_with_handling(
            input="rm -f model.patch",
            error_msg="Failed to remove model patch",
            timeout_duration=10,
        )
        self.communicate_with_handling(
            input=f"git checkout -b {branch_name}",
            error_msg="Failed to switch to new branch",
            timeout_duration=10,
        )
        self.communicate_with_handling(
            input="git add .",
            error_msg="Failed to add commits",
            timeout_duration=10,
        )
        dry_run_flag = "--allow-empty" if _dry_run else ""
        commit_msg = [
            shlex.quote("Fix: {issue.title}"),
            shlex.quote("Closes #{issue.number}"),
        ]
        self.communicate_with_handling(
            input=f"git commit -m {commit_msg[0]} -m  {commit_msg[1]} {dry_run_flag}",
            error_msg="Failed to commit changes",
            timeout_duration=10,
        )

        owner, repo, _ = parse_gh_issue_url(issue_url)
        # If `--repo_path` was specified with a different github URL, then the record will contain
        # the forking user
        assert self.record is not None
        if self.record["repo_type"] != "github":
            # We already validated that `--data_path` is a github issue URL
            # so this is the only case where we can reach here
            msg = "--repo_path must point to a github URL if --open_pr is set"
            raise ValueError(msg)
        forker, _ = self.record["repo"].split("/")
        head = branch_name
        remote = "origin"
        if forker != owner:
            head = f"{forker}:{branch_name}"
            token_prefix = ""
            if self._github_token:
                token_prefix = f"{self._github_token}@"
            fork_url = f"https://{token_prefix}github.com/{forker}/{repo}.git"
            self.logger.debug(f"Using fork: {fork_url}")
            self.communicate_with_handling(
                input=f"git remote add fork {fork_url}",
                error_msg="Failed to create new git remote",
                timeout_duration=10,
            )
            remote = "fork"
        dry_run_prefix = "echo " if _dry_run else ""
        self.communicate_with_handling(
            input=f"{dry_run_prefix} git push {remote} {branch_name}",
            error_msg=(
                "Failed to push branch to remote. Please check your token and permissions. "
                "You might want to push to a fork with the push_gh_repo_url option."
            ),
            timeout_duration=10,
        )
        body = (
            f"This is a PR opened by AI tool [SWE Agent](https://github.com/swe-agent/SWE-agent/) "
            f"to close [#{issue.number}]({issue_url}) ({issue.title}).\n\nCloses #{issue.number}."
        )
        body += "\n\n" + format_trajectory_markdown(trajectory)
        api = GhApi(token=self._github_token)
        if not _dry_run:
            pr_info = api.pulls.create(  # type: ignore
                owner=owner,
                repo=repo,
                title=f"SWE-agent[bot] PR to fix: {issue.title}",
                head=head,
                base="main",
                body=body,
                draft=True,
            )
            self.logger.info(
                f"🎉 PR created as a draft at {pr_info.html_url}. Please review it carefully, push "
                "any required changes onto the branch and then click "
                "'Ready for Review' to bring it to the attention of the maintainers.",
            )

    def read_file(self, path: str | PurePath) -> str:
        """Read file contents from container

        Args:
            path: Path to file relative to repository root

        Returns:
            file_contents: Contents of file as string
        """
        path_in_container = f"/{self._repo_name}/{path}"
        return self.communicate(f"cat {str(path_in_container)}")
