from __future__ import annotations

import copy
import json
import re
import time
import traceback
from collections import defaultdict
from dataclasses import dataclass
from pathlib import Path
from typing import Any, TypedDict

from simple_parsing.helpers.fields import field
from simple_parsing.helpers.flatten import FlattenedAccess
from simple_parsing.helpers.serialization.serializable import FrozenSerializable
from tenacity import RetryError

from sweagent.agent.commands import Command, ParseCommand
from sweagent.agent.history_processors import HistoryProcessor
from sweagent.agent.models import (
    APIStats,
    ContextWindowExceededError,
    CostLimitExceededError,
    ModelArguments,
    get_model,
)
from sweagent.agent.parsing import FormatError, ParseFunction
from sweagent.agent.summarizer import SummarizerConfig
from sweagent.environment.swe_env import SWEEnv
from sweagent.environment.utils import NoOutputTimeoutError
from sweagent.types import AgentInfo, History, HistoryItem, Trajectory, TrajectoryStep
from sweagent.utils.config import convert_paths_to_abspath
from sweagent.utils.log import get_logger


@dataclass(frozen=True)
class Subroutine(FrozenSerializable):
    name: str
    agent_file: str
    # one of "action", "observation", "response", "state", "thought"
    return_type: str = None  # type: ignore
    init_observation: str | None = None
    end_name: str | None = None
    signature: str | None = None
    docstring: str | None = None
    model: ModelArguments | None = None
    agent_args: Any | None = None


@dataclass(frozen=True)
class AgentConfig(FrozenSerializable):
    system_template: str
    instance_template: str
    next_step_template: str | None = None  # defaults to instance_template
    next_step_no_output_template: str | None = None  # defaults to next_step_template
    strategy_template: str | None = None
    demonstration_template: str | None = None
    # Paths to demonstrations. If path is not absolute, it is assumed to be
    # relative to the SWE_AGENT_CONFIG_ROOT (if set) or the SWE-agent repository root
    demonstrations: list[str | Path] = field(default_factory=list)
    put_demos_in_history: bool = False  # if True, add demonstration to history instead of as a single message
    # defaults to format_error_template in ParseFunction
    format_error_template: str = None  # type: ignore
    # Paths to command files. If path is not absolute, it is assumed to be
    # relative to the SWE_AGENT_CONFIG_ROOT (if set) or the SWE-agent repository root
    command_files: list[str | Path] = field(default_factory=list)
    env_variables: dict[str, str] = field(default_factory=dict)
    util_functions: list[str] = field(default_factory=list)
    submit_command: str = "submit"
    parse_function: str = "ThoughtActionParser"
    parse_command: str = "ParseCommandBash"
    history_processor: str = "DefaultHistoryProcessor"
    history_processor_args: dict[str, Any] = field(default_factory=dict)
    command_docs: str = None  # type: ignore
    summarizer_config: SummarizerConfig = field(default_factory=SummarizerConfig)
    blocklist_error_template: str = "Interactive operation '{name}' is not supported by this environment"
    blocklist: tuple[str, ...] = (
        "vim",
        "vi",
        "emacs",
        "nano",
        "nohup",
        "git",
        "gdb",
    )
    blocklist_standalone: tuple[str, ...] = (
        "python",
        "python3",
        "ipython",
        "bash",
        "sh",
        "exit",
        "/bin/bash",
        "/bin/sh",
        "nohup",
        "vi",
        "vim",
        "emacs",
        "nano",
        "su",
    )
    block_unless_regex: dict[str, str] = field(default_factory=dict)
    # Should extract environment state in a json readable form
    state_command: Command = Command(
        name="state",
        code="""state() {
            echo '{"working_dir": "'$(realpath --relative-to=$ROOT/.. $PWD)'"}';
        };""",
    )
    _commands: list[Command] = field(default_factory=list)
    _subroutines: dict[str, Subroutine] = field(default_factory=dict)
    subroutine_types: list[Subroutine] = field(default_factory=list)

    def __post_init__(self):
        object.__setattr__(self, "command_files", convert_paths_to_abspath(self.command_files))
        object.__setattr__(self, "demonstrations", convert_paths_to_abspath(self.demonstrations))

        if self.next_step_template is None:
            object.__setattr__(self, "next_step_template", self.instance_template)
        if self.next_step_no_output_template is None:
            object.__setattr__(self, "next_step_no_output_template", self.next_step_template)

        object.__setattr__(self, "parse_command", ParseCommand.get(self.parse_command))
        for file in self.command_files:
            commands = self.parse_command.parse_command_file(file)

            util_functions = [command for command in commands if command.name.startswith("_")]
            commands = [command for command in commands if not command.name.startswith("_")]

            object.__setattr__(self, "util_functions", self.util_functions + util_functions)
            object.__setattr__(self, "_commands", self._commands + commands)

        for subroutine in self.subroutine_types:
            if subroutine.name == "submit":
                msg = "Cannot use 'submit' as a subroutine name"
                raise ValueError(msg)
            agent_args = AgentArguments(
                model=subroutine.model,
                config_file=subroutine.agent_file,
            )
            object.__setattr__(subroutine, "agent_args", agent_args)
            object.__setattr__(self, "_subroutines", {**self._subroutines, subroutine.name: subroutine})

        multi_line_command_endings = {
            command.name: command.end_name
            for command in [*self._commands, *self._subroutines.values()]
            if command.end_name is not None
        }
        object.__setattr__(self, "multi_line_command_endings", multi_line_command_endings)
        object.__setattr__(
            self,
            "command_docs",
            self.parse_command.generate_command_docs(
                self._commands,
                self.subroutine_types,
                **self.env_variables,
            ),
        )
        object.__setattr__(self, "parse_function", ParseFunction.get(self.parse_function))
        if self.format_error_template is None:
            object.__setattr__(
                self,
                "format_error_template",
                self.parse_function.format_error_template,
            )
        object.__setattr__(
            self,
            "format_error_template",
            self.format_error_template.format(**self.__dict__),
        )
        for command in self._commands:
            if command.name == self.submit_command:
                object.__setattr__(self, "submit_command_end_name", command.end_name)
                break
        object.__setattr__(
            self,
            "history_processor",
            HistoryProcessor.get(self.history_processor, **self.history_processor_args),
        )
        if "WINDOW" in self.env_variables:
            window_size = self.env_variables["WINDOW"]
            if self.summarizer_config.window_length < int(window_size):
                msg = f"Summarizer window length is set to {self.summarizer_config.window_length} which is less than the window length {window_size}"
                raise ValueError(msg)
        object.__setattr__(
            self,
            "block_unless_regex",
            {"radare2": r"\b(?:radare2)\b.*\s+-c\s+.*", "r2": r"\b(?:radare2)\b.*\s+-c\s+.*"},
        )


@dataclass(frozen=True)
class AgentArguments(FlattenedAccess, FrozenSerializable):
    """Configure the agent's behaviour (templates, parse functions, blocklists, ...)."""

    model: ModelArguments = None

    # Policy can only be set via config yaml file from command line
    config_file: Path | None = None
    config: AgentConfig | None = field(default=None, cmd=False)

    def __post_init__(self):
        if self.config is None and self.config_file is not None:
            # If unassigned, we load the config from the file to store its contents with the overall arguments
            config = AgentConfig.load_yaml(self.config_file)
            object.__setattr__(self, "config", config)
        assert self.config is not None  # mypy
        for subroutine in getattr(self.config, "subroutines", {}).values():
            model_args = subroutine.model
            object.__setattr__(
                model_args,
                "per_instance_cost_limit",
                self.model.per_instance_cost_limit,
            )
            object.__setattr__(model_args, "total_cost_limit", self.model.total_cost_limit)


class AgentHook:
    def on_init(self, *, agent: Agent):
        """Note: Depending on the internals of `Agent` should be done with care,
        it's best to use this as little as possible.
        """

    def on_run_start(
        self,
    ): ...

    def on_step_start(self): ...

    def on_actions_generated(self, *, thought: str, action: str, output: str): ...

    def on_sub_action_started(self, *, sub_action: str): ...

    def on_sub_action_executed(self, *, obs: str, done: bool): ...

    def on_step_done(self, *, trajectory_step: TrajectoryStep, model_stats: APIStats): ...

    def on_run_done(self, *, trajectory: Trajectory, info: AgentInfo): ...

    def on_model_query(self, *, query: str, agent: str):
        """Actually query the model with the complete history."""

    def on_query_message_added(
        self,
        *,
        role: str,
        content: str,
        agent: str,
        is_demo: bool = False,
        thought: str = "",
        action: str = "",
    ): ...

    def on_setup_done(self): ...


class SubAction(TypedDict):
    agent: str
    action: str
    cmd_name: str | None
    args: str


class Agent:
    """Agent handles the behaviour of the model and how it interacts with the environment."""

    def __init__(self, name: str, args: AgentArguments):
        self.name = name
        # todo: currently only used to get the model name, so might remove this later
        self._args = args
        self.model = get_model(args.model, args.config._commands + args.config.subroutine_types)
        self.summarizer_model = get_model(
            args.config.summarizer_config.model if args.config.summarizer_config.model is not None else args.model
        )
        self.config = args.config
        assert self.config is not None  # mypy
        self.system_args = {
            "command_docs": self.config.command_docs,
            **self.config.env_variables,
        }
        self.instance_args = None
        self._parse_command_patterns()
        self.last_container_id = None
        self.hooks = []
        self.logger = get_logger("agent")
        # Requires instance, so is set in `setup` methods
        self._rloop = None

        # Set in run method
        self._env: SWEEnv | None = None
        self.traj_dir: None | Path = None

        #: Number of attempts to solve the issue when using a review loop
        self._i_attempt: int = 0

        #: The following three attributes collect the information about how the agent
        #: solved the problem.
        self._history_by_attempt: dict[int, list] = defaultdict(list)
        self._trajectory_by_attempt: dict[int, Trajectory] = defaultdict(list)
        self._info_by_attempt: dict[int, AgentInfo] = defaultdict(dict)

        #: Variables to be referenced in the templates that are forwarded from one
        #: solution attempt to the next
        self._forwarded_vars: dict[str, Any] = {}
        
        # Properties for error tracking
        self._consecutive_errors = 0
        self._max_consecutive_errors = 5  # Maximum consecutive error count

    @property
    def history(self) -> History:
        """History that is passed on to the model.
        Use `_append_history` to modify.
        """
        return self._history_by_attempt[self._i_attempt]

    @history.setter
    def history(self, value: History):
        self._history_by_attempt[self._i_attempt] = value

    @property
    def trajectory(self) -> Trajectory:
        """Trajectory of the agent for the current instance. In contrast to `history`,
        this is mostly for the informational value of how the agent interacted with
        the environment and is also what is being used when replaying the trajectory
        """
        return self._trajectory_by_attempt[self._i_attempt]

    @trajectory.setter
    def trajectory(self, value: Trajectory):
        self._trajectory_by_attempt[self._i_attempt] = value

    @property
    def info(self) -> AgentInfo:
        """Information about the agent's run"""
        return self._info_by_attempt[self._i_attempt]

    @info.setter
    def info(self, value: AgentInfo):
        self._info_by_attempt[self._i_attempt] = value

    @property
    def traj_path(self) -> Path | None:
        """Returns path to the trajectory.
        The path is reset for every new instance.
        """
        if self.traj_dir and self._env is not None:
            assert self._env.record
            return self.traj_dir / (self._env.record["instance_id"] + ".traj")
        return None

    def add_hook(self, hook: AgentHook) -> None:
        """Add hook to agent"""
        hook.on_init(agent=self)
        self.hooks.append(hook)

    def _append_history(self, item: HistoryItem) -> None:
        """Adds an item to the history."""
        for hook in self.hooks:
            hook.on_query_message_added(**item)
        self.history.append(item)

    # todo: klieret: Long term: Might make more sense to reinitialize the agent class for every instance instead of this
    def setup(self, instance_args: dict[str, Any], init_model_stats: APIStats | None = None) -> None:
        """Setup the agent for a new instance. This includes
        formatting the system message and adding demonstrations to the history.

        Args:
            instance_args: Arguments for the instance
        """
        assert self.config is not None  # mypy
        self.instance_args = instance_args

        self._i_attempt = 0
        self._history_by_attempt = defaultdict(list)
        self._trajectory_by_attempt = defaultdict(list)
        self._info_by_attempt = defaultdict(dict)  # type: ignore
        self._forwarded_vars = {}
        if self._rloop is not None:
            self._forwarded_vars = self._rloop.get_forwarded_vars()
        
        # Reset consecutive error counter
        self._consecutive_errors = 0

        self.setup_attempt(init_model_stats=init_model_stats)

        for hook in self.hooks:
            hook.on_setup_done()

    def setup_attempt(self, *, init_model_stats: APIStats | None = None) -> None:
        """Setup the agent for a new attempt. This includes resetting the model stats."""
        assert self.config is not None  # mypy
        if self._i_attempt > 0 and init_model_stats is not None:
            msg = (
                "We might be dealing with nested retries, where subroutines are mixed with retries. "
                "Currently, this messes up accounting with init_model_stats."
            )
            raise ValueError(msg)
        if self._i_attempt > 0:
            assert self._env is not None  # mypy
            self._env.reset_for_new_attempt()
        self.model.reset_stats(init_model_stats)
        # self.model = get_model(self._args.model, self.config._commands + self.config.subroutine_types)
        # fixme: This doesn't reset total cost
        system_msg = self.config.system_template.format(**self.system_args, **self.instance_args)
        self.logger.info(f"SYSTEM ({self.name})\n{system_msg}")
        self._append_history(HistoryItem({"role": "system", "content": system_msg, "agent": self.name}))
        if "history_to_messages" in dir(self.model):
            for demonstration_path in self.config.demonstrations:
                if self.config.demonstration_template is None and not self.config.put_demos_in_history:
                    msg = "Cannot use demonstrations without a demonstration template or put_demos_in_history=True"
                    raise ValueError(msg)

                # Load history
                self.logger.info(f"DEMONSTRATION: {demonstration_path}")
                demo_history = json.loads(Path(demonstration_path).read_text())["history"]
                demo_history = [
                    entry
                    for entry in demo_history
                    if ("agent" not in entry) or ("agent" in entry and entry["agent"] == self.name)
                ]

                if self.config.put_demos_in_history:
                    if self.config.demonstration_template is not None:
                        self.logger.warning("Demonstration template is ignored for put_demos_in_history=True")
                    # Add demonstration to history directly as separate messages
                    for entry in demo_history:
                        if entry["role"] != "system":
                            entry["is_demo"] = True
                            self._append_history(entry)
                else:
                    # Add demonstration as single message to history
                    demo_message = self.model.history_to_messages(
                        demo_history,
                        is_demonstration=True,
                    )
                    demonstration = self.config.demonstration_template.format(demonstration=demo_message)
                    self._append_history(
                        {
                            "agent": self.name,
                            "content": demonstration,
                            "is_demo": True,
                            "role": "user",
                        },
                    )

    @property
    def state_command(self) -> str:
        """Get bash command for extracting env. state"""
        assert self.config is not None  # mypy
        if hasattr(self.config, 'state_command') and self.config.state_command:
            return self.config.state_command.code
        else:
            # Provide default state command if state_command is not configured
            self.logger.warning("No state command configured, using default state command")
            return """state() {
                local working_dir="$PWD";
                local open_file="n/a";
                local interactive_session="${INTERACTIVE_SESSION:-n/a}";
                if [ ! -z $CURRENT_FILE ]; then
                    open_file=$(realpath $CURRENT_FILE);
                fi
                echo '{"open_file": "'$open_file'", "working_dir": "'$working_dir'", "interactive_session": "'$interactive_session'"}';
            };"""

    @property
    def local_history(self) -> list[dict[str, str]]:
        """Return the history of the agent since the last reset."""
        return self.config.history_processor([entry for entry in self.history if entry["agent"] == self.name])

    def _get_total_stats(self) -> APIStats:
        """Combine model stats of different attempts"""
        total_stats = APIStats()
        for stats in self._info_by_attempt.values():
            assert "model_stats" in stats  # mypy
            attempt_stats = APIStats(**stats["model_stats"])  # type: ignore
            total_stats += attempt_stats
        if self._rloop is not None:
            total_stats += self._rloop.model_stats
        return total_stats

    def save_trajectory(
        self,
    ) -> None:
        """Save the trajectory to disk.
        This includes the history, the environment state, and the model stats.
        """

        def get_attempt_data(attempt_idx: int) -> dict[str, Any]:
            """Get data saved for every attempt"""
            assert self._env is not None
            # The deepcopy here is important because else the
            # data["info"]["model_stats"] update will create havoc!
            return copy.deepcopy(
                {
                    "environment": self._env.name,
                    "trajectory": self._trajectory_by_attempt[attempt_idx],
                    "history": self._history_by_attempt[attempt_idx],
                    "info": self._info_by_attempt[attempt_idx],
                }
            )

        data = {
            **get_attempt_data(0),
        }

        assert self.traj_path is not None
        self.traj_path.write_text(json.dumps(data, indent=2))

    def _get_first_match(self, action: str, pattern_type: str) -> re.Match | None:
        """Return the first match of a command pattern in the action string."""
        assert self.config is not None  # mypy
        if pattern_type == "subroutine":
            patterns = {k: v for k, v in self.subroutine_patterns.items()}
        elif pattern_type == "multi_line":
            patterns = {
                k: v
                for k, v in self.command_patterns.items()
                if k in self.config.multi_line_command_endings or k == self.config.submit_command
            }
            patterns += {
                k: v for k, v in self.subroutine_patterns.items() if k in self.config.multi_line_command_endings
            }
        elif pattern_type == "multi_line_no_subroutines":
            patterns = {k: v for k, v in self.command_patterns.items() if k in self.config.multi_line_command_endings}
        else:
            msg = f"Unknown pattern type: {pattern_type}"
            raise ValueError(msg)
        matches = list()
        for _, pat in patterns.items():
            match = pat.search(action)
            if match:
                matches.append(match)
        if len(matches) == 0:
            return None
        matches = sorted(matches, key=lambda x: x.start())
        return matches[0]

    def _guard_multiline_input(self, action: str) -> str:
        """Split action by multiline commands, then append the first line in each multiline command with "<< '{end_name}'".
        Multiline commands (which are specified by an end_name) are commands that span multiple lines and are terminated by a specific end_name.

        Their multi-line argument is sent using a heredoc, which is a way to send a multi-line string to a command in bash.
        """
        parsed_action = list()
        rem_action = action
        while rem_action.strip():
            first_match = self._get_first_match(rem_action, "multi_line_no_subroutines")
            if first_match:
                pre_action = rem_action[: first_match.start()]
                match_action = rem_action[first_match.start() : first_match.end()]
                rem_action = rem_action[first_match.end() :]
                if pre_action.strip():
                    parsed_action.append(pre_action)
                if match_action.strip():
                    eof = first_match.group(3).strip()
                    if not match_action.split("\n")[0].strip().endswith(f"<< '{eof}'"):
                        guarded_command = match_action[first_match.start() :]
                        first_line = guarded_command.split("\n")[0]
                        guarded_command = guarded_command.replace(first_line, first_line + f" << '{eof}'", 1)
                        parsed_action.append(guarded_command)
                    else:
                        parsed_action.append(match_action)
            else:
                parsed_action.append(rem_action)
                rem_action = ""
        return "\n".join(parsed_action)

    def split_actions(self, action: str, pattern_type="subroutine") -> list[SubAction]:
        """Split an action into a list of actions in a greedy manner, each of which is a subroutine call or a single command."""
        parsed_action: list[SubAction] = list()
        rem_action = action
        while rem_action.strip():
            first_match = self._get_first_match(rem_action, pattern_type)
            if first_match:
                pre_action = rem_action[: first_match.start()]
                match_action = rem_action[first_match.start() : first_match.end()]
                rem_action = rem_action[first_match.end() :]
                if pre_action.strip():
                    parsed_action.append({"agent": self.name, "action": pre_action, "cmd_name": None, "args": ""})
                if match_action.strip():
                    if match_action.split()[0] == self.config.submit_command:
                        parsed_action.append(
                            SubAction(
                                {
                                    "agent": self.name,
                                    "action": match_action,
                                    "cmd_name": first_match.group(1),
                                    "args": "",
                                },
                            )
                        )  # submit command is not a subroutine
                    else:
                        parsed_action.append(
                            SubAction(
                                {
                                    "agent": first_match.group(1),
                                    "args": first_match.group(2),
                                    "action": match_action,
                                    "cmd_name": first_match.group(1),
                                },
                            )
                        )
            else:
                parsed_action.append(
                    SubAction({"agent": self.name, "action": rem_action, "cmd_name": None, "args": ""})
                )
                rem_action = ""
        return parsed_action

    def _parse_command_patterns(self) -> None:
        assert self.config is not None  # mypy
        self.command_patterns = dict()
        for command in self.config._commands:
            if command.end_name is not None:
                pat = re.compile(
                    rf"^\s*({command.name})\s*(.*?)^({command.end_name})\s*$",
                    re.DOTALL | re.MULTILINE,
                )
                self.command_patterns[command.name] = pat
            else:
                pat = re.compile(rf"^\s*({command.name})\s*(.*?)$", re.MULTILINE)
                self.command_patterns[command.name] = pat
        self.subroutine_patterns = dict()
        for _, subroutine in self.config._subroutines.items():
            if subroutine.end_name is None:
                pat = re.compile(rf"^\s*({subroutine.name})\s*(.*?)$", re.MULTILINE)
                self.subroutine_patterns[subroutine.name,] = pat
            else:
                pat = re.compile(
                    rf"^\s*({subroutine.name})\s*(.*?)^({subroutine.end_name})\s*$",
                    re.DOTALL | re.MULTILINE,
                )
                self.subroutine_patterns[subroutine.name] = pat
        if hasattr(self.config, "submit_command_end_name"):
            submit_pat = re.compile(
                rf"^\s*({self.config.submit_command})\s*(.*?)^({self.config.submit_command_end_name})\s*$",
                re.DOTALL | re.MULTILINE,
            )
        else:
            submit_pat = re.compile(rf"^\s*({self.config.submit_command})(\s*)$", re.MULTILINE)  # group 2 is nothing
        self.subroutine_patterns[self.config.submit_command] = submit_pat
        self.command_patterns[self.config.submit_command] = submit_pat

    def forward(self, observation: str | None, available_actions: list[str], state: str) -> tuple[str, str, str]:
        """Forwards the model

        Args:
            observation: Observation
            available_actions: Currently not used
            state:

        Returns:
            thought: model reasoning
            action: action that the model proposes
            output: raw model output (not output of the action)
        """
        thought, action, output = self.forward_with_error_check(observation, state)

        self._append_history(
            {
                "role": "assistant",
                "content": output,
                "thought": thought,
                "action": action,
                "agent": self.name,
            },
        )

        try:
            # Sanitize thought and action to prevent Rich markup errors
            sanitized_thought = str(thought).replace('[', '\\[').replace(']', '\\]')
            sanitized_action = str(action).replace('[', '\\[').replace(']', '\\]')
            self.logger.info(f"💭 THOUGHT ({self.name})\n{sanitized_thought}")
            self.logger.info(f"🎬 ACTION ({self.name})\n{sanitized_action}")
        except Exception as e:
            # Fallback logging if sanitization fails
            self.logger.warning("Failed to log thought/action due to markup error: %s", str(e))
            self.logger.info(f"💭 THOUGHT ({self.name}): [Thought logging failed due to special characters]")
            self.logger.info(f"🎬 ACTION ({self.name}): [Action logging failed due to special characters]")

        return thought, action, output

    def forward_model(self, observation: str | None, state: str) -> str:
        """Query the model with the current state and observation with the appropriate template.

        Returns:
            output: raw model output (not output of the command)
        """
        assert self.config is not None  # mypy
        try:
            state_vars = json.loads(state)
        except json.JSONDecodeError as e:
            # Use default values if state is not valid JSON
            self.logger.warning(f"State '{state}' is not valid JSON. Using default state. Error: {e}")
            state_vars = {
                "current_directory": "/root",
                "working_dir": "/root",
                "open_file": "n/a",
                "interactive_session": "n/a",
                "available_commands": [],
                "environment": "default"
            }
        except Exception as e:
            # Use default values for other exceptions as well
            self.logger.warning(f"Unexpected error parsing state '{state}': {e}")
            state_vars = {
                "current_directory": "/root", 
                "working_dir": "/root",
                "open_file": "n/a",
                "interactive_session": "n/a",
                "available_commands": [],
                "environment": "default"
            }

        templates: list[str] = []
        # Determine observation template based on what prior observation was
        if self.history[-1]["role"] == "system" or self.history[-1].get("is_demo", False):
            # Show instance template if prev. obs. was initial system message
            templates = [self.config.instance_template]
            if self.config.strategy_template is not None:
                templates.append(self.config.strategy_template)
        elif observation is None or observation.strip() == "":
            # Show no output template if observation content was empty
            templates = [self.config.next_step_no_output_template]
        else:
            # Show standard output template if there is observation content
            templates = [self.config.next_step_template]

        # Populate selected template(s) with information (e.g., issue, arguments, state)
        messages = []
        for template in templates:
            try:
                # Check if all required variables for template are available and provide defaults
                template_vars = {
                    **self.instance_args,
                    **self.system_args,
                    **state_vars,
                    "observation": (observation if observation is not None else ""),
                    **self._forwarded_vars,
                }
                
                # Check variables used in template and provide defaults for missing ones
                import string
                formatter = string.Formatter()
                template_vars_needed = [field_name for _, field_name, _, _ in formatter.parse(template) if field_name is not None]
                
                for var_name in template_vars_needed:
                    if var_name not in template_vars:
                        self.logger.warning(f"Template variable '{var_name}' not found, using default value")
                        if var_name == "open_file":
                            template_vars[var_name] = "n/a"
                        elif var_name == "working_dir":
                            template_vars[var_name] = "/root"
                        elif var_name == "interactive_session":
                            template_vars[var_name] = "n/a"
                        else:
                            template_vars[var_name] = "n/a"
                
                messages.append(template.format(**template_vars))
            except KeyError as e:
                # If there are still missing variables, replace with defaults
                self.logger.warning(f"Template formatting failed due to missing variable: {e}")
                # Remove or replace problematic parts in template with defaults
                safe_template = template.replace("{open_file}", "n/a").replace("{working_dir}", "/root").replace("{interactive_session}", "n/a")
                messages.append(safe_template.format(
                    **self.instance_args,
                    **self.system_args,
                    **state_vars,
                    observation=(observation if observation is not None else ""),
                    **self._forwarded_vars,
                ))

        message = "\n".join(messages)

        try:
            # Sanitize message to prevent Rich markup errors
            sanitized_message = str(message).replace('[', '\\[').replace(']', '\\]')
            self.logger.info(f"🤖 MODEL INPUT\n{sanitized_message}")
        except Exception as e:
            # Fallback logging if sanitization fails
            self.logger.warning("Failed to log model input due to markup error: %s", str(e))
            self.logger.info("🤖 MODEL INPUT: [Model input logging failed due to special characters]")
        self._append_history({"role": "user", "content": message, "agent": self.name})

        for hook in self.hooks:
            hook.on_model_query(query=self.local_history, agent=self.name)
        return self.model.query(self.local_history)

    def retry_after_format_fail(self, output: str) -> str:
        """Ask the model to correct (without committing to persistent history) after a malformatted model output"""
        format_error_template = self.config.format_error_template

        try:
            # Sanitize output and format_error_template to prevent Rich markup errors
            sanitized_output = str(output).replace('[', '\\[').replace(']', '\\]')
            sanitized_format_error = str(format_error_template).replace('[', '\\[').replace(']', '\\]')
            self.logger.warning(f"MALFORMED OUTPUT\n{sanitized_output}")
            self.logger.warning(f"FORMAT ERROR\n{sanitized_format_error}")
        except Exception as e:
            # Fallback logging if sanitization fails
            self.logger.warning("Failed to log malformed output due to markup error: %s", str(e))
            self.logger.warning("MALFORMED OUTPUT: [Output logging failed due to special characters]")
            self.logger.warning("FORMAT ERROR: [Format error logging failed due to special characters]")

        temp_history = self.local_history + [
            {"role": "assistant", "content": output, "agent": self.name},
            {"role": "user", "content": format_error_template, "agent": self.name},
        ]
        return self.model.query(temp_history)

    def retry_after_blocklist_fail(self, output: str, action: str) -> str:
        """Ask the model to correct (without committing to persistent history) after a disallowed command"""
        name = action.strip().split()[0]
        blocklist_error_message = self.config.blocklist_error_template.format(name=name)

        try:
            # Sanitize output and blocklist_error_message to prevent Rich markup errors
            sanitized_output = str(output).replace('[', '\\[').replace(']', '\\]')
            sanitized_blocklist_error = str(blocklist_error_message).replace('[', '\\[').replace(']', '\\]')
            self.logger.warning(f"BLOCKLISTED OUTPUT\n{sanitized_output}")
            self.logger.warning(f"BLOCKLIST ERROR\n{sanitized_blocklist_error}")
        except Exception as e:
            # Fallback logging if sanitization fails
            self.logger.warning("Failed to log blocklisted output due to markup error: %s", str(e))
            self.logger.warning("BLOCKLISTED OUTPUT: [Output logging failed due to special characters]")
            self.logger.warning("BLOCKLIST ERROR: [Blocklist error logging failed due to special characters]")

        temp_history = self.local_history + [
            {"role": "assistant", "content": output, "agent": self.name},
            {"role": "user", "content": blocklist_error_message, "agent": self.name},
        ]
        return self.model.query(temp_history)

    def should_block_action(self, action: str) -> bool:
        """Check if the command should be blocked."""
        names = action.strip().split()
        if len(names) == 0:
            return False
        name = names[0]
        if name in self.config.blocklist:
            return True
        if name in self.config.blocklist_standalone and name == action.strip():
            return True
        if name in self.config.block_unless_regex and not re.search(self.config.block_unless_regex[name], action):
            return True
        return False

    def check_format_and_requery(
        self,
        output: str,
    ) -> tuple[str, str, str]:
        """Query the model with the current state and observation with the appropriate template.

        Try to parse the output into a thought and action. Retry if the output is malformatted or the action is blocked.

        Returns:
            thought: model reasoning
            action: action that the model proposes
            output: raw model output
        """
        # Condition for handling outputs with no thought (just action)
        if self.model.args.model_name == "human":
            return "", output, output
        elif self.model.args.model_name == "human_thought":
            thought, action = ParseFunction.get("ThoughtActionParser")(
                output,
                self.config._commands + self.config.subroutine_types,
                strict=False,
            )
            return thought, action, output

        format_fails = blocklist_fails = 0

        while format_fails + blocklist_fails <= 2:
            try:
                thought, action = self.config.parse_function(
                    output,
                    self.config._commands + self.config.subroutine_types,
                    strict=False,
                )
            except KeyboardInterrupt:
                raise
            except FormatError:
                format_fails += 1
                output = self.retry_after_format_fail(output)
                continue
            if self.should_block_action(action):
                blocklist_fails += 1
                output = self.retry_after_blocklist_fail(output, action)
            else:
                return thought, action, output
        try:
            # Sanitize output to prevent Rich markup errors
            sanitized_output = str(output).replace('[', '\\[').replace(']', '\\]')
            self.logger.warning(f"Malformat limit reached: \n{sanitized_output}")
        except Exception as e:
            # Fallback logging if sanitization fails
            self.logger.warning("Failed to log malformat limit output due to markup error: %s", str(e))
            self.logger.warning("Malformat limit reached: [Output logging failed due to special characters]")
        return "Exit due to format error", "exit_format", output

    def forward_with_error_check(self, observation: str | None, state: str) -> tuple[str, str, str]:
        """Wrapper around `self.forward_model` that handles errors and retries
        due to format errors or blocked actions.

        Returns:
            thought: model reasoning
            action: action that the model proposes
            output: raw model output
        """
        try:
            return self.check_format_and_requery(self.forward_model(observation, state))
        except KeyboardInterrupt:
            raise
        except RuntimeError as e:
            self.logger.warning(f"Runtime error: {e}")
            return (
                f"Exit due to runtime error: {e}",
                "exit_error",
                f"exit due to runtime error: {e}",
            )
        except ContextWindowExceededError:
            self.logger.warning("Context window exceeded")
            return "Exit due to context window", "exit_context", "Exit due to context window"
        except CostLimitExceededError:
            self.logger.warning("Cost limit exceeded")
            return "Exit due to cost limit", "exit_cost", "Exit due to cost limit"
        except RetryError as e:
            self.logger.warning(f"Retry error: {e}")
            return (
                f"Exit due to retry error: {e}",
                "exit_api",
                f"exit due to retry error: {e}",
            )

    def init_environment_vars(self, env: SWEEnv):
        assert self.config is not None
        self.set_environment_vars(env, self.config.env_variables)

    def set_environment_vars(self, env: SWEEnv, env_variables: dict[str, Any]) -> None:
        """Sets environment variables in the container and for example makes sure
        that all the commands are available in the PATH on the container.
        """
        assert self.config is not None  # mypy
        commands_to_execute = (
            [self.config.state_command.code]
            +
            # [code for code in self.config.util_functions] +
            # [command.code for command in self.config._commands] +
            [f"{k}={v}" for k, v in env_variables.items()]
        )
        commands = "\n".join(commands_to_execute)
        try:
            output = env.communicate(commands)
            if env.returncode != 0:
                msg = f"Nonzero return code: {env.returncode}\nOutput: {output}"
                raise RuntimeError(msg)
        except KeyboardInterrupt:
            raise
        except Exception as e:
            self.logger.warning(f"Failed to set environment variables: {traceback.format_exc()}")
            raise e
        command_files = list()
        for file in self.config.command_files:
            datum = dict()
            with open(file) as f:
                contents = f.read()
            datum["contents"] = contents
            filename = Path(file).name
            if not contents.strip().startswith("#!"):
                if filename.endswith(".sh"):
                    # files are sourced, so they are not executable
                    datum["name"] = Path(file).name
                    datum["type"] = "source_file"
                elif filename.startswith("_"):
                    # files are sourced, so they are not executable
                    datum["name"] = Path(file).name
                    datum["type"] = "utility"
                else:
                    msg = (
                        f"Non-shell script file {file} does not start with shebang.\n"
                        "Either add a shebang (#!) or change the file extension to .sh if you want to source it.\n"
                        "You can override this behavior by adding an underscore to the file name (e.g. _utils.py)."
                    )
                    raise ValueError(msg)
            else:
                # scripts are made executable
                datum["name"] = Path(file).name.rsplit(".", 1)[0]
                datum["type"] = "script"
            command_files.append(datum)
        env.add_commands(command_files)

    def get_environment_vars(self, env: SWEEnv) -> dict[str, Any]:
        """Get environment variables inside of the container"""
        assert self.config is not None  # mypy
        env_vars = dict()
        for var in self.config.env_variables:
            env_vars[var] = env.communicate(f"echo ${var}").strip()
        return env_vars

    def call_subroutine(self, agent_name: str, sub_action: SubAction, env: SWEEnv):
        """Call subroutine"""
        assert self.config is not None  # mypy
        env_vars = self.get_environment_vars(env)
        cwd = env.communicate("pwd -P").strip()
        init_observation = self.config._subroutines[agent_name].init_observation
        if init_observation is not None:
            obs, _, _, _ = env.step(init_observation.format(args=sub_action["args"]))
        else:
            obs = None
        if env.returncode != 0:
            self._append_history(HistoryItem({"role": "user", "content": obs, "agent": agent_name}))
            msg = f"Nonzero return code: {env.returncode} for init_observation in {agent_name}.\n{obs}"
            raise RuntimeError(msg)
        return_type = self.config._subroutines[agent_name].return_type
        sub_agent = Agent(agent_name, self.config._subroutines[agent_name].agent_args)
        sub_agent_output = sub_agent.run(
            {"issue": sub_action["args"]},
            env,
            observation=obs,
            return_type=return_type,
            init_model_stats=self.model.stats,
        )
        self.history += sub_agent.history
        self.set_environment_vars(env, env_vars)
        env.communicate(f"cd {cwd}")
        self.model.stats.replace(sub_agent.model.stats)
        return sub_agent_output

    def _update_summarizer_stats(self, cost: APIStats):
        """Update stats for summarizer"""
        self.model.stats += cost
        if "summarizer" not in self.info:
            self.info["summarizer"] = {
                "model_stats": APIStats().to_dict(),
                "n_calls": 0,
            }
        total_cost = APIStats(**self.info["summarizer"]["model_stats"])
        total_cost += cost
        self.info["summarizer"]["model_stats"] = total_cost.to_dict()
        self.info["summarizer"]["n_calls"] += 1

    def _run_sub_action(self, sub_action: SubAction) -> tuple[str | None, bool]:
        """Execute a sub-action. If the sub-action is a command, execute it.
        If it is a subroutine, call the subroutine.

        Returns:
            observation: Observation
            done: Whether `submit` or another exit reason was called
        """
        assert self._env is not None
        assert self.config is not None
        if sub_action["agent"] == self.name or sub_action["cmd_name"] == self.config.submit_command:
            # Normal command, not a subroutine
            for hook in self.hooks:
                hook.on_sub_action_started(sub_action=sub_action)
            try:
                observation, _, done, _info = self._env.step(sub_action["action"])
                observation, additional_cost = self.config.summarizer_config.function(  # type: ignore
                    sub_action["action"], observation, self._env, self.summarizer_model
                )
                self._update_summarizer_stats(additional_cost)
                self.info.update(_info)
                for hook in self.hooks:
                    hook.on_sub_action_executed(obs=observation, done=done)
                if sub_action["cmd_name"] == self.config.submit_command:
                    done = True
            except Exception as e:
                # Prevent program termination in all exception scenarios
                self.logger.error(f"Unexpected error in _run_sub_action during env.step: {e}")
                self.logger.error(traceback.format_exc())
                
                # Attempt container recovery without restart
                try:
                    if self._env and hasattr(self._env, 'container') and self._env.container:
                        if self._env.container.poll() is not None:
                            self.logger.warning("Container has exited due to error, attempting restart...")
                            self._env.container.stdin.write("echo 'reset_container_recovery'\n")
                            self._env.container.stdin.flush()
                            time.sleep(0.1)
                        else:
                            # Try to recover without container restart
                            self.logger.warning("Container error detected, attempting recovery without container restart...")
                            try:
                                self._env.container.stdin.write("echo 'agent_error_recovery'\n")
                                self._env.container.stdin.flush()
                                time.sleep(0.1)
                            except Exception:
                                self.logger.warning("Failed to recover from agent error, container may need restart")
                except Exception as recovery_error:
                    self.logger.error(f"Container recovery failed: {recovery_error}")
                
                # Return special message for timeout cases
                if isinstance(e, (NoOutputTimeoutError, TimeoutError)):
                    timeout_type = "no_output" if isinstance(e, NoOutputTimeoutError) else "total"
                    observation = f"TIMEOUT: {timeout_type.upper()} TIMEOUT OCCURRED - PLEASE TRY A DIFFERENT APPROACH OR SHORTER COMMAND"
                    
                    # For timeout cases, don't restart container unless it has actually exited
                    try:
                        if self._env and hasattr(self._env, 'container') and self._env.container:
                            if self._env.container.poll() is not None:
                                self.logger.warning("Container has exited after timeout, restarting...")
                                self._env.container.stdin.write("echo 'reset_container_recovery'\n")
                                self._env.container.stdin.flush()
                                time.sleep(0.1)
                            else:
                                # Continue using if container is still alive - no restart needed
                                self.logger.info("Container is still alive after timeout, continuing without restart...")
                    except Exception as recovery_error:
                        self.logger.error(f"Container recovery after timeout failed: {recovery_error}")
                else:
                    # Return clear error message for other exceptions
                    error_message = f"ERROR: UNEXPECTED ERROR OCCURRED - {str(e)}"
                    error_message += "\nPLEASE TRY A DIFFERENT APPROACH"
                    observation = error_message
                    
                    # For non-timeout exceptions, attempt container recovery without restart
                    try:
                        if self._env and hasattr(self._env, 'container') and self._env.container:
                            if self._env.container.poll() is not None:
                                self.logger.warning("Container has exited due to error, attempting restart...")
                                self._env.container.stdin.write("echo 'reset_container_recovery'\n")
                                self._env.container.stdin.flush()
                                time.sleep(0.1)
                            else:
                                # Force restart if container is alive but unresponsive
                                self.logger.warning("Container is unresponsive due to error, forcing restart...")
                                self._env.container.stdin.write("echo 'reset_container_recovery'\n")
                                self._env.container.stdin.flush()
                                time.sleep(0.1)
                    except Exception as recovery_error:
                        self.logger.error(f"Container recovery failed: {recovery_error}")
                
                # Continue execution even after error occurs
                self.logger.warning(f"❌ Error occurred but continuing execution: {e}")
                done = False  # Set done to False to continue execution
        else:
            agent_name = sub_action["agent"]
            sub_agent_output = self.call_subroutine(agent_name, sub_action, self._env)
            observation = sub_agent_output
            assert isinstance(observation, str) or observation is None
            done = False
        return observation, done

    def _run_step(self, observation: str | None) -> tuple[str | None, bool]:
        """Run a step of the agent (forward, execute, and save).

        Returns:
            observation: Observation
            done: Whether `submit` or another exit reason was called
        """

        assert self.config is not None  # mypy
        assert self._env is not None

        for hook in self.hooks:
            hook.on_step_start()

        # fixme: This will probably fail if the state command is not set
        try:
            if self.state_command:
                state_definition = self.state_command
                state_result = self._env.communicate(state_definition)
                
                state = self._env.communicate("state")
                
                # Use default values if state is empty or has error
                if not state or state.strip() == "":
                    self.logger.warning("State command returned empty result, using default state")
                    state = json.dumps({
                        "current_directory": "/root",
                        "working_dir": "/root",
                        "open_file": "n/a",
                        "interactive_session": "n/a",
                        "available_commands": [],
                        "environment": "default"
                    })
            else:
                # Use default state if state_command is not configured
                self.logger.info("No state command configured, using default state")
                state = json.dumps({
                    "current_directory": "/root",
                    "working_dir": "/root",
                    "open_file": "n/a",
                    "interactive_session": "n/a",
                    "available_commands": [],
                    "environment": "default"
                })
        except Exception as e:
            # Use default values when state command execution fails
            self.logger.warning(f"Failed to get state from command '{self.state_command}': {e}")
            state = json.dumps({
                "current_directory": "/root",
                "working_dir": "/root",
                "open_file": "n/a",
                "interactive_session": "n/a",
                "available_commands": [],
                "environment": "default"
            })
        
        thought, action, output = self.forward(observation, self._env.get_available_actions(), state)
        for hook in self.hooks:
            hook.on_actions_generated(thought=thought, action=action, output=output)
        run_action: str = self._guard_multiline_input(action)

        # Loop over sub-actions (if any)
        done = False
        observations: list[str | None] = list()
        execution_t0 = time.perf_counter()
        for sub_action in self.split_actions(run_action):
            try:
                observation, done = self._run_sub_action(sub_action)
                # If the last sub-action is done, the observation is not
                # appended.
                if done:
                    break
                observations.append(observation)
            except Exception as e:
                # Prevent program termination in all exception scenarios
                self.logger.error(f"Unexpected error in _run_step during sub_action execution: {e}")
                self.logger.error(traceback.format_exc())
                
                # Attempt container recovery
                try:
                    if self._env and hasattr(self._env, 'container') and self._env.container:
                        if self._env.container.poll() is not None:
                            self.logger.warning("Container has exited due to error, attempting restart...")
                            self._env.container.stdin.write("echo 'reset_container_recovery'\n")
                            self._env.container.stdin.flush()
                            time.sleep(0.1)
                        else:
                            # Force restart if container is alive but unresponsive
                            self.logger.warning("Container is unresponsive due to error, forcing restart...")
                            self._env.container.stdin.write("echo 'reset_container_recovery'\n")
                            self._env.container.stdin.flush()
                            time.sleep(0.1)
                except Exception as recovery_error:
                    self.logger.error(f"Container recovery failed: {recovery_error}")
                
                # Return special message for timeout cases
                if isinstance(e, (NoOutputTimeoutError, TimeoutError)):
                    timeout_type = "no_output" if isinstance(e, NoOutputTimeoutError) else "total"
                    observation = f"TIMEOUT: {timeout_type.upper()} TIMEOUT OCCURRED - PLEASE TRY A DIFFERENT APPROACH OR SHORTER COMMAND"
                else:
                    # Return clear error message for other exceptions
                    error_message = f"ERROR: UNEXPECTED ERROR OCCURRED - {str(e)}"
                    error_message += "\nPLEASE TRY A DIFFERENT APPROACH"
                    observation = error_message
                
                # Continue execution even after error occurs
                self.logger.warning(f"❌ Error occurred but continuing execution: {e}")
                observations.append(observation)
                done = False  # Set done to False to continue execution
                break  # Don't proceed to next sub_action since error occurred in current sub_action
        observation = "\n".join([obs for obs in observations if obs is not None])
        execution_time = time.perf_counter() - execution_t0

        trajectory_step = TrajectoryStep(
            {
                "action": action,
                "observation": observation,
                "response": output,
                "state": state,
                "thought": thought,
                "execution_time": execution_time,
            },
        )
        self.trajectory.append(trajectory_step)
        model_stats: APIStats = self.model.stats
        self.info["model_stats"] = model_stats.to_dict()
        for hook in self.hooks:
            hook.on_step_done(trajectory_step=trajectory_step, model_stats=model_stats)
        return observation, done

    def run(
        self,
        setup_args: dict[str, Any],
        env: SWEEnv,
        observation: str | None = None,
        traj_dir: Path | None = None,
        return_type: str = "info_trajectory",
        init_model_stats: APIStats | None = None,
    ):
        """
        Run the agent on an environment.
        Return the final value of the specified return type.

        Args:
            setup_args: Arguments to pass to the agent's setup method.
            env: The environment to run the agent on.
            observation: Output from environment setup
            traj_dir: Directory to save the trajectory to
            return_type: Controls what to return.
                This should be left at `info_trajectory`, the
                other values are for internal usage with subroutines.
            init_model_stats: Initial model stats to use for the run.

        Returns:
            If return_type is "info", returns a tuple of
            the info dictionary and the trajectory (list of dictionaries).
        """
        assert env.record is not None
        assert env.container_obj is not None
        if env.container_obj.id != self.last_container_id:
            self.logger.info(f"Initializing agent settings for container {env.container_obj.id}")
            self.init_environment_vars(env)
            self.last_container_id = env.container_obj.id
        # Re-initialize primary
        self.setup(setup_args, init_model_stats)
        self.config.summarizer_config.function.setup(setup_args, self.config)

        # Save/reset some attributes
        self.trajectory = Trajectory()
        self._env = env
        env.current_agent = self
        self.info = AgentInfo()
        self.traj_dir = traj_dir

        self.logger.info("Trajectory will be saved to %s", self.traj_path)

        # Run action/observation loop
        for hook in self.hooks:
            hook.on_run_start()
        done = False
        while not done:
            try:
                observation, done = self._run_step(observation)
                self.save_trajectory()
                if done:
                    done = True
                # Reset consecutive error counter after successful execution
                self._consecutive_errors = 0
            except Exception as e:
                # Prevent program termination in all exception scenarios
                self.logger.error(f"Unexpected error in agent run loop: {e}")
                self.logger.error(traceback.format_exc())
                
                # Increment consecutive error counter
                self._consecutive_errors += 1
                self.logger.warning(f"Consecutive error count: {self._consecutive_errors}/{self._max_consecutive_errors}")
                
                # Stop execution to prevent infinite loop if too many consecutive errors
                if self._consecutive_errors >= self._max_consecutive_errors:
                    self.logger.error(f"Too many consecutive errors ({self._consecutive_errors}), stopping execution to prevent infinite loop")
                    observation = f"ERROR: TOO MANY CONSECUTIVE ERRORS ({self._consecutive_errors}) - STOPPING EXECUTION TO PREVENT INFINITE LOOP"
                    done = True
                    break
                
                # Attempt container recovery
                try:
                    if self._env and hasattr(self._env, 'container') and self._env.container:
                        if self._env.container.poll() is not None:
                            self.logger.warning("Container has exited due to error, attempting restart...")
                            self._env.container.stdin.write("echo 'reset_container_recovery'\n")
                            self._env.container.stdin.flush()
                            time.sleep(0.1)
                        else:
                            # Force restart if container is alive but unresponsive
                            self.logger.warning("Container is unresponsive due to error, forcing restart...")
                            self._env.container.stdin.write("echo 'reset_container_recovery'\n")
                            self._env.container.stdin.flush()
                            time.sleep(0.1)
                except Exception as recovery_error:
                    self.logger.error(f"Container recovery failed: {recovery_error}")
                
                # Return special message for timeout cases
                if isinstance(e, (NoOutputTimeoutError, TimeoutError)):
                    timeout_type = "no_output" if isinstance(e, NoOutputTimeoutError) else "total"
                    observation = f"TIMEOUT: {timeout_type.upper()} TIMEOUT OCCURRED - PLEASE TRY A DIFFERENT APPROACH OR SHORTER COMMAND"
                    
                    # For timeout cases, don't restart container unless it has actually exited
                    try:
                        if self._env and hasattr(self._env, 'container') and self._env.container:
                            if self._env.container.poll() is not None:
                                self.logger.warning("Container has exited after timeout, restarting...")
                                self._env.container.stdin.write("echo 'reset_container_recovery'\n")
                                self._env.container.stdin.flush()
                                time.sleep(0.1)
                            else:
                                # Continue using if container is still alive - no restart needed
                                self.logger.info("Container is still alive after timeout, continuing without restart...")
                    except Exception as recovery_error:
                        self.logger.error(f"Container recovery after timeout failed: {recovery_error}")
                else:
                    # Return clear error message for other exceptions
                    error_message = f"ERROR: UNEXPECTED ERROR OCCURRED - {str(e)}"
                    error_message += "\nPLEASE TRY A DIFFERENT APPROACH"
                    observation = error_message
                    
                    # For non-timeout exceptions, attempt container recovery
                    try:
                        if self._env and hasattr(self._env, 'container') and self._env.container:
                            if self._env.container.poll() is not None:
                                self.logger.warning("Container has exited due to error, attempting restart...")
                                self._env.container.stdin.write("echo 'reset_container_recovery'\n")
                                self._env.container.stdin.flush()
                                time.sleep(0.1)
                            else:
                                # Force restart if container is alive but unresponsive
                                self.logger.warning("Container is unresponsive due to error, forcing restart...")
                                self._env.container.stdin.write("echo 'reset_container_recovery'\n")
                                self._env.container.stdin.flush()
                                time.sleep(0.1)
                    except Exception as recovery_error:
                        self.logger.error(f"Container recovery failed: {recovery_error}")
                
                # Continue execution even after error occurs
                self.logger.warning(f"❌ Error occurred but continuing execution: {e}")
                done = False  # Set done to False to continue execution
                
        for hook in self.hooks:
            hook.on_run_done(trajectory=self.trajectory, info=self.info)

        self.logger.info("Trajectory saved to %s", self.traj_path)

        if return_type == "info":
            return self.info
        if return_type == "info_trajectory":
            return self.info, self.trajectory
        return self.trajectory[-1][return_type]
