from __future__ import annotations

import logging
import os
import argparse
import time

from sweagent import CONFIG_DIR
from sweagent.utils.log import add_file_handler, get_logger
from rich.logging import RichHandler

try:
    import rich
except ModuleNotFoundError as e:
    msg = (
        "You probably either forgot to install the dependencies "
        "or forgot to activate your conda or virtual environment."
    )
    raise RuntimeError(msg) from e
import json
import re
import subprocess
import traceback
import requests
from typing import Any

import rich.console
import rich.markdown
import rich.panel

try:
    from rich_argparse import RichHelpFormatter
except ImportError:
    msg = "Please install the rich_argparse package with `pip install rich_argparse`."
    raise ImportError(msg)
import datetime
from dataclasses import dataclass
from getpass import getuser
from pathlib import Path

import yaml
from rich.markdown import Markdown
from simple_parsing import parse
from simple_parsing.helpers.flatten import FlattenedAccess
from simple_parsing.helpers.serialization.serializable import FrozenSerializable

# Try to import swebench constants, with fallback values
try:
    from swebench.harness.constants import KEY_INSTANCE_ID, KEY_MODEL, KEY_PREDICTION
    SWEBENCH_AVAILABLE = True
except ImportError:
    # Fallback constants when swebench is not available
    SWEBENCH_AVAILABLE = False
    KEY_INSTANCE_ID = "instance_id"
    KEY_MODEL = "model"
    KEY_PREDICTION = "prediction"

from unidiff import PatchSet

from sweagent.agent.agents import Agent, AgentArguments
from sweagent.agent.models import ModelArguments
from sweagent.environment.swe_env import EnvironmentArguments, SWEEnv
from sweagent.environment.utils import (
    InvalidGithubURL,
    extract_flag_format,
    get_associated_commit_urls,
    get_data_path_name,
    get_gh_issue_data,
    parse_gh_issue_url,
)

__doc__: str = """ Run inference. Usage examples:

```bash
# Run over a github issue:
python run.py --model_name "gpt4" --data_path "https://github.com/pvlib/pvlib-python/issues/1603" --config_file "config/default_from_url.yaml"
# Apply a patch in a local repository to an issue specified as Markdown file and run a custom installer script in the container
python run.py --model_name "gpt4" --data_path "/path/to/my_issue.md" --repo_path "/path/to/my/local/repo" --environment_setup "/path/to/setup.sh" --config_file "config/default_from_url.yaml" --apply_patch_locally
# Solve a specific CTF challenge by name:
python run.py --model_name "gpt4.1" --problem_name "Web Exploitation Challenge"
```

**For more information**: https://princeton-nlp.github.io/SWE-agent/usage/cl_tutorial/
"""


logger = get_logger("swe-agent-run")
logging.getLogger("simple_parsing").setLevel(logging.WARNING)


@dataclass(frozen=True)
class ActionsArguments(FlattenedAccess, FrozenSerializable):
    """Run real-life actions (opening PRs, etc.) if we can solve the issue."""

    # Open a PR with the patch if we can solve the issue
    open_pr: bool = False
    # When working with local repository: Apply patch
    apply_patch_locally: bool = False
    # Option to be used with open_pr: Skip action if there are already commits claiming
    # to fix the issue. Please only set this to False if you are sure the commits are
    # not fixes or if this is your own repository!
    skip_if_commits_reference_issue: bool = True
    # OBSOLETE. Do not use, will raise error. Please specify --repo_path instead.
    push_gh_repo_url: str = ""

    def __post_init__(self):
        if self.push_gh_repo_url:
            msg = "push_gh_repo_url is obsolete. Use repo_path instead"
            raise ValueError(msg)


@dataclass(frozen=True)
class ScriptArguments(FlattenedAccess, FrozenSerializable):
    """Configure the control flow of the run.py script"""

    environment: EnvironmentArguments
    agent: AgentArguments
    actions: ActionsArguments
    # Only run instances that completely match this regex
    instance_filter: str = ".*"
    # Skip instances with existing trajectories
    skip_existing: bool = True
    # Suffix for the run name (used for example in trajectory directory naming)
    suffix: str = ""
    # Raise unhandled exceptions during the run (useful for debugging)
    raise_exceptions: bool = False
    # Dump the entire config to the log
    print_config: bool = True
    # Run the agent in CTF mode (SWE-agent: EnIGMA)
    ctf: bool = False
    # Name of the specific problem to solve
    problem_name: str = ""

    @property
    def run_name(self) -> str:
        """Generate a unique name for this run based on the arguments."""
        model_name = self.agent.model.model_name.replace(":", "-")
        data_stem = get_data_path_name(self.environment.data_path)
        assert self.agent.config_file is not None  # mypy
        config_stem = Path(self.agent.config_file).stem

        temp = self.agent.model.temperature
        top_p = self.agent.model.top_p

        per_instance_cost_limit = self.agent.model.per_instance_cost_limit
        install_env = self.environment.install_environment

        return (
            f"{model_name}__{data_stem}__{config_stem}__t-{temp:.2f}__p-{top_p:.2f}"
            + f"__c-{per_instance_cost_limit:.2f}__install-{int(install_env)}"
            + (f"__{self.suffix}" if self.suffix else "")
        )


class _ContinueLoop(Exception):
    """Used for internal control flow"""


class MainHook:
    """Hook structure for the web server or other addons to interface with"""

    @staticmethod
    def _is_promising_patch(info: dict[str, Any]) -> bool:
        """Do we actually believe that the patch will solve the issue?
        Or are we just submitting the last patch we generated before hitting an error?
        """
        # The exit status can also be `submitted (exit_cost)` etc.
        return info["exit_status"] == "submitted" and info.get("submission") is not None

    def on_init(self, *, args: ScriptArguments, agent: Agent, env: SWEEnv, traj_dir: Path):
        """Called when hook is initialized"""

    def on_start(self):
        """Called at the beginning of `Main.main`"""

    def on_end(self):
        """Called at the end of `Main.main`"""

    def on_instance_start(self, *, index: int, instance: dict[str, Any]):
        """Called at the beginning of each instance loop in `Main.run`"""

    def on_instance_skipped(
        self,
    ):
        """Called when an instance is skipped in `Main.run`"""

    def on_instance_completed(self, *, info, trajectory):
        """Called when an instance is completed in `Main.run`"""


class SaveApplyPatchHook(MainHook):
    """This hook saves patches to a separate directory and optionally applies them to a local repository."""

    def on_init(self, *, args: ScriptArguments, agent: Agent, env: SWEEnv, traj_dir: Path):
        self._traj_dir = traj_dir
        self._apply_patch_locally = args.actions.apply_patch_locally
        self._instance = None

    def on_instance_start(self, *, index: int, instance: dict[str, Any]):
        self._instance = instance

    def on_instance_completed(self, *, info, trajectory):
        assert self._instance is not None  # mypy
        instance_id = self._instance["instance_id"]
        patch_path = self._save_patch(instance_id, info)
        if patch_path:
            if not self._apply_patch_locally:
                return
            if not self._is_promising_patch(info):
                return
            assert self._instance  # mypy
            if self._instance["repo_type"] != "local":
                return
            local_dir = Path(self._instance["repo"])
            self._apply_patch(patch_path, local_dir)

    @staticmethod
    def _print_patch_message(patch_output_file: Path):
        console = rich.console.Console()
        msg = [
            "SWE-agent has produced a patch that it believes will solve the issue you submitted!",
            "Use the code snippet below to inspect or apply it!",
        ]
        panel = rich.panel.Panel.fit(
            "\n".join(msg),
            title="🎉 Submission successful 🎉",
        )
        console.print(panel)
        content = [
            "```bash",
            "# The patch has been saved to your local filesystem at:",
            f"PATCH_FILE_PATH='{patch_output_file.resolve()}'",
            "# Inspect it:",
            'cat "${PATCH_FILE_PATH}"',
            "# Apply it to a local repository:",
            "cd <your local repo root>",
            'git apply "${PATCH_FILE_PATH}"',
            "```",
        ]
        console.print(rich.markdown.Markdown("\n".join(content)))

    def _save_patch(self, instance_id: str, info) -> Path | None:
        """Create patch files that can be applied with `git am`.

        Returns:
            The path to the patch file, if it was saved. Otherwise, returns None.
        """
        patch_output_dir = self._traj_dir / "patches"
        patch_output_dir.mkdir(exist_ok=True, parents=True)
        patch_output_file = patch_output_dir / f"{instance_id}.patch"
        if info.get("submission") is None:
            logger.info("No patch to save.")
            return None
        model_patch = info["submission"]
        patch_output_file.write_text(model_patch)
        if self._is_promising_patch(info):
            # Only print big congratulations if we actually believe
            # the patch will solve the issue
            self._print_patch_message(patch_output_file)
        return patch_output_file

    def _apply_patch(self, patch_file: Path, local_dir: Path) -> None:
        """Apply a patch to a local directory."""

        assert local_dir.is_dir()
        assert patch_file.exists()
        # The resolve() is important, because we're gonna run the cmd
        # somewhere else
        cmd = ["git", "apply", str(patch_file.resolve())]
        try:
            subprocess.run(cmd, cwd=local_dir, check=True)
        except subprocess.CalledProcessError as e:
            logger.error(f"Failed to apply patch {patch_file} to {local_dir}: {e}")
            return
        logger.info(f"Applied patch {patch_file} to {local_dir}")


class OpenPRHook(MainHook):
    """This hook opens a PR if the issue is solved and the user has enabled the option."""

    def on_init(self, *, args: ScriptArguments, agent: Agent, env: SWEEnv, traj_dir: Path):
        self._env = env
        self._token: str = env._github_token
        self._data_path = args.environment.data_path
        self._open_pr = args.actions.open_pr
        self._skip_if_commits_reference_issue = args.actions.skip_if_commits_reference_issue

    def on_instance_completed(self, *, info, trajectory):
        if self._open_pr and self.should_open_pr(info):
            self._env.open_pr(trajectory=trajectory)

    def should_open_pr(self, info: dict[str, Any]) -> bool:
        """Does opening a PR make sense?"""
        if not info.get("submission"):
            logger.info("Not opening PR because no submission was made.")
            return False
        if info["exit_status"] != "submitted":
            logger.info("Not opening PR because exit status was %s and not submitted.", info["exit_status"])
            return False
        try:
            issue = get_gh_issue_data(self._data_path, token=self._token)
        except InvalidGithubURL:
            logger.info("Currently only GitHub is supported to open PRs to. Skipping PR creation.")
            return False
        if issue.state != "open":
            logger.info(f"Issue is not open (state={issue.state}. Skipping PR creation.")
            return False
        if issue.assignee:
            logger.info("Issue is already assigned. Skipping PR creation. Be nice :)")
            return False
        if issue.locked:
            logger.info("Issue is locked. Skipping PR creation.")
            return False
        org, repo, issue_number = parse_gh_issue_url(self._data_path)
        associated_commits = get_associated_commit_urls(org, repo, issue_number, token=self._token)
        if associated_commits:
            commit_url_strs = ", ".join(associated_commits)
            if self._skip_if_commits_reference_issue:
                logger.info(f"Issue already has associated commits (see {commit_url_strs}). Skipping PR creation.")
                return False
            else:
                logger.warning(
                    "Proceeding with PR creation even though there are already commits "
                    f"({commit_url_strs}) associated with the issue. Please only do this for your own repositories "
                    "or after verifying that the existing commits do not fix the issue.",
                )
        return True


class Main:
    def __init__(self, args: ScriptArguments):
        # Set up log directory
        self.traj_dir = Path("trajectories") / Path(getuser()) / args.run_name
        self.traj_dir.mkdir(parents=True, exist_ok=True)
        
        # Set up log file (including execution time)
        timestamp = datetime.datetime.now().strftime("%Y%m%d_%H%M%S")
        log_dir = self.traj_dir / "logs"
        log_dir.mkdir(exist_ok=True)
        log_path = log_dir / f"run_{timestamp}.log"
        
        # Remove existing handlers
        for handler in logger.handlers[:]:
            logger.removeHandler(handler)
            
        # Set up Rich handler with markup disabled to prevent markup errors
        rich_handler = RichHandler(
            show_time=True,
            show_path=True,
            rich_tracebacks=True,
            tracebacks_show_locals=True,
            log_time_format="%Y-%m-%d %H:%M:%S",
            markup=False  # Disable markup to prevent markup errors
        )
        rich_handler.setFormatter(logging.Formatter('%(message)s'))
        rich_handler.setLevel(logging.INFO)
        logger.addHandler(rich_handler)
        
        # Set up file handler
        file_handler = logging.FileHandler(log_path, mode='a', encoding='utf-8')
        file_formatter = logging.Formatter(
            '%(asctime)s - %(name)s - %(levelname)s - %(message)s',
            datefmt='%Y-%m-%d %H:%M:%S'
        )
        file_handler.setFormatter(file_formatter)
        file_handler.setLevel(logging.DEBUG)
        logger.addHandler(file_handler)
        
        # Set logger basic configuration
        logger.setLevel(logging.DEBUG)
        logger.propagate = False
        
        # Start log message
        logger.info("🚀 Program run")
        logger.info("📝 Log file: %s", log_path)
        
        # Log warning if swebench is not available
        if not SWEBENCH_AVAILABLE:
            logger.warning(
                "⚠️  swebench package is not available. Some features may be limited. "
                "Consider installing swebench with: pip install swebench>=2.0.0"
            )
        
        if args.print_config:
            logger.info("📙 Settings: %s", args.dumps_yaml())
            
        self.args = args
        
        # Initialize environment
        env_dict = {k: v for k, v in args.environment.__dict__.items()}
        env_dict['ctf'] = True
        env_args = EnvironmentArguments(**env_dict)
        self.env = SWEEnv(env_args)
        
        # Initialize agent
        self.agent = Agent("primary", args.agent)
        
        self._save_arguments()
        default_hooks = [
            SaveApplyPatchHook(),
            OpenPRHook(),
        ]
        self.hooks: list[MainHook] = []
        for hook in default_hooks:
            self.add_hook(hook)
            
        logger.info("init complete")

    def add_hook(self, hook: MainHook):
        hook.on_init(args=self.args, agent=self.agent, env=self.env, traj_dir=self.traj_dir)
        self.hooks.append(hook)

    def run(self, index: int) -> None:
        # Set initial data
        if not hasattr(self.env, 'data') or not self.env.data:
            # If problem_name is specified, set it as a request to solve that specific problem
            if self.args.problem_name:
                query = f"Solve the CTF challenge named '{self.args.problem_name}'."
                description = f"Find and solve the CTF challenge with the name '{self.args.problem_name}'. Communicate with the MCP server to retrieve challenge information and solve it."
                challenge_name = self.args.problem_name
                problem_name_instruction = f"SPECIFIC TASK: You are tasked with solving the CTF challenge named '{self.args.problem_name}'. Focus your efforts on finding and solving this specific challenge."
                specific_problem_request = f"SPECIFIC REQUEST: When you contact the MCP server, specifically ask for information about the challenge named '{self.args.problem_name}'. If the server provides a list of challenges, look for this specific one and focus on solving it."
            else:
                query = "Start a CTF challenge by communicating with the MCP server."
                description = "Communicate with the MCP server to retrieve and solve CTF challenge information."
                challenge_name = "Initial Challenge"
                problem_name_instruction = "GENERAL TASK: You are tasked with solving any available CTF challenge. Start by exploring what challenges are available."
                specific_problem_request = "GENERAL REQUEST: When you contact the MCP server, ask for information about available challenges and choose one to solve."
            
            self.env.data = [{
                "instance_id": "initial_challenge",
                "query": query,
                "problem_statement": description,
                "problem_statement_source": "local",
                "repo": "",
                "base_commit": "",
                "version": "",
                "test_patch": "",
                "test_metadata": {},
                "environment_setup": "",
                "repo_type": "local"
            }]
            index = 0

        # Reset environment
        instance_id = self.env.data[index]["instance_id"]
        for hook in self.hooks:
            hook.on_instance_start(index=index, instance=self.env.data[index])
        assert isinstance(instance_id, str)  # mypy
        if self.should_skip(instance_id):
            for hook in self.hooks:
                hook.on_instance_skipped()
            raise _ContinueLoop
        logger.info("▶️  Beginning task " + str(index))
        
        # Add log message if problem_name is specified
        if self.args.problem_name:
            logger.info(f"🎯 Target problem: {self.args.problem_name}")

        observation, info = self.env.reset(index)
        if info is None:
            raise _ContinueLoop

        # Get info, patch information
        issue = getattr(self.env, "query", None)
        files = []
        assert self.env.record is not None  # mypy
        if "patch" in self.env.record:
            files = "\n".join([f"- {x.path}" for x in PatchSet(self.env.record["patch"]).modified_files])
        # Get test files, F2P tests information
        test_files = []
        if "test_patch" in self.env.record:
            test_patch_obj = PatchSet(self.env.record["test_patch"])
            test_files = "\n".join([f"- {x.path}" for x in test_patch_obj.modified_files + test_patch_obj.added_files])
        tests = ""
        if "FAIL_endTO_PASS" in self.env.record:
            tests = "\n".join([f"- {x}" for x in self.env.record["FAIL_TO_PASS"]])

        # Set query based on problem_name
        if self.args.problem_name:
            query = f"Solve the CTF challenge named '{self.args.problem_name}'."
            description = f"Find and solve the CTF challenge with the name '{self.args.problem_name}'. Communicate with the MCP server to retrieve challenge information and solve it."
            challenge_name = self.args.problem_name
            problem_name_instruction = f"SPECIFIC TASK: You are tasked with solving the CTF challenge named '{self.args.problem_name}'. Focus your efforts on finding and solving this specific challenge."
            specific_problem_request = f"SPECIFIC REQUEST: When you contact the MCP server, specifically ask for information about the challenge named '{self.args.problem_name}'. If the server provides a list of challenges, look for this specific one and focus on solving it."
        else:
            query = "Start a CTF challenge by communicating with the MCP server."
            description = "Communicate with the MCP server to retrieve and solve CTF challenge information."
            challenge_name = "Initial Challenge"
            problem_name_instruction = "GENERAL TASK: You are tasked with solving any available CTF challenge. Start by exploring what challenges are available."
            specific_problem_request = "GENERAL REQUEST: When you contact the MCP server, ask for information about available challenges and choose one to solve."

        # Set up basic setup_args
        setup_args = {
            "issue": issue, 
            "files": files, 
            "test_files": test_files, 
            "tests": tests,
            "flag_format": "FLAG{...}",  # Set default flag format
            "name": challenge_name,
            "description": description,
            "category_friendly": "Miscellaneous",
            "points": 100,
            "box": None,
            "port": None,
            "server_description": None,
            "problem_name_instruction": problem_name_instruction,
            "specific_problem_request": specific_problem_request
        }
        
        # Add keys used in template
        setup_args["query"] = query
        setup_args['"query"'] = query  # Add key with quotes
        
        # Start asking the model (start with empty observation)
        info, trajectory = self.agent.run(
            setup_args=setup_args,
            env=self.env,
            observation="",  # Start with empty observation
            traj_dir=self.traj_dir,
            return_type="info_trajectory",
        )
        
        self._save_predictions(instance_id, info, self.env.challenge)
        for hook in self.hooks:
            hook.on_instance_completed(info=info, trajectory=trajectory)

    def main(self):
        for hook in self.hooks:
            hook.on_start()
            
        # Add default data if env.data is empty
        if not hasattr(self.env, 'data') or not self.env.data:
            logger.info("🔄 Setting initial data...")
            
            # Set query based on problem_name
            if self.args.problem_name:
                query = f"Solve the CTF challenge named '{self.args.problem_name}'."
                description = f"Find and solve the CTF challenge with the name '{self.args.problem_name}'. Communicate with the MCP server to retrieve challenge information and solve it."
                challenge_name = self.args.problem_name
                problem_name_instruction = f"SPECIFIC TASK: You are tasked with solving the CTF challenge named '{self.args.problem_name}'. Focus your efforts on finding and solving this specific challenge."
                specific_problem_request = f"SPECIFIC REQUEST: When you contact the MCP server, specifically ask for information about the challenge named '{self.args.problem_name}'. If the server provides a list of challenges, look for this specific one and focus on solving it."
            else:
                query = "Start a CTF challenge by communicating with the MCP server."
                description = "Communicate with the MCP server to retrieve and solve CTF challenge information."
                challenge_name = "Initial Challenge"
                problem_name_instruction = "GENERAL TASK: You are tasked with solving any available CTF challenge. Start by exploring what challenges are available."
                specific_problem_request = "GENERAL REQUEST: When you contact the MCP server, ask for information about available challenges and choose one to solve."
            
            self.env.data = [{
                "instance_id": "initial_challenge",
                "query": query,
                "problem_statement": description,
                "problem_statement_source": "local",
                "repo": "",
                "base_commit": "",
                "version": "",
                "test_patch": "",
                "test_metadata": {},
                "environment_setup": "",
                "repo_type": "local"
            }]
            
            # Set up record
            self.env.record = {
                "instance_id": "initial_challenge",
                "problem_statement": description,
                "problem_statement_source": "local",
                "repo": "",
                "base_commit": "",
                "version": "",
                "repo_type": "local",
                "challenge": {
                    "name": challenge_name,
                    "description": description,
                    "category": "misc",
                    "category_friendly": "Miscellaneous",
                    "points": 100,
                    "flag": "flag{placeholder}",
                    "file_path": "./",  # Set to current directory
                    "files": []
                }
            }
            
            # Set env.challenge
            self.env.challenge = self.env.record["challenge"]
            
            # Set install_environment to False to skip environment installation
            self.env.install_environment = False
            
            logger.info("✅ Initial data setup complete")
            
        # Run at least once
        if not self.env.data:
            logger.info("❗ No data but running once.")
            try:
                self.run(0)
            except _ContinueLoop:
                logger.info("⏭️ Skipping initial run.")
            except Exception as e:
                logger.warning(f"❌ Error occurred during initial run: {e}")
                logger.warning(traceback.format_exc())
                # Attempt container recovery without restart
                try:
                    if hasattr(self.env, 'container') and self.env.container:
                        if self.env.container.poll() is not None:
                            logger.info("🔄 Container has exited after error, restarting...")
                            self.env.container.stdin.write("echo 'reset_container_recovery'\n")
                            self.env.container.stdin.flush()
                            time.sleep(0.1)
                            logger.info("✅ Container recovery completed")
                        else:
                            # Try to recover without container restart
                            logger.info("🔄 Container error detected, attempting recovery without container restart...")
                            try:
                                self.env.container.stdin.write("echo 'run_error_recovery'\n")
                                self.env.container.stdin.flush()
                                time.sleep(0.1)
                                logger.info("✅ Container recovery without restart completed")
                            except Exception:
                                logger.warning("⚠️ Failed to recover from run error, container may need restart")
                    else:
                        logger.info("🔄 No container available for recovery")
                except Exception as recovery_error:
                    logger.error(f"❌ Container recovery failed: {recovery_error}")
                
                if self.args.raise_exceptions:
                    self.env.close()
                    raise e
                
                # Continue execution
                logger.info("🔄 Continuing execution despite initial run error...")
        else:
            # Run normally with data
            for index in range(len(self.env.data)):
                try:
                    self.run(index)
                except _ContinueLoop:
                    continue
                except KeyboardInterrupt:
                    logger.info("The program was terminated by the user.")
                    self.env.close()
                    break
                except SystemExit:
                    logger.critical("❌ Exiting because SystemExit was called")
                    # Prevent duplicate close() calls as it may have already been called
                    try:
                        if hasattr(self.env, 'container') and self.env.container is not None:
                            if self.env.container.poll() is None:
                                logger.info("🔄 Ensuring container is properly terminated...")
                                self.env.close()
                        logger.info("✅ Container cleanup completed")
                    except Exception as cleanup_error:
                        logger.warning(f"Container cleanup error: {cleanup_error}")
                    raise
                except Exception as e:
                    logger.warning(f"❌ Exception occurred during execution: {e}")
                    logger.warning(traceback.format_exc())
                    
                    # Attempt container recovery without restart
                    try:
                        if hasattr(self.env, 'container') and self.env.container:
                            if self.env.container.poll() is not None:
                                logger.info("🔄 Container has exited after error, restarting...")
                                self.env.container.stdin.write("echo 'reset_container_recovery'\n")
                                self.env.container.stdin.flush()
                                time.sleep(0.1)
                                logger.info("✅ Container recovery completed")
                            else:
                                # Try to recover without container restart
                                logger.info("🔄 Container error detected, attempting recovery without container restart...")
                                try:
                                    self.env.container.stdin.write("echo 'run_error_recovery'\n")
                                    self.env.container.stdin.flush()
                                    time.sleep(0.1)
                                    logger.info("✅ Container recovery without restart completed")
                                except Exception:
                                    logger.warning("⚠️ Failed to recover from run error, container may need restart")
                        else:
                            logger.info("🔄 No container available for recovery")
                    except Exception as recovery_error:
                        logger.error(f"❌ Container recovery failed: {recovery_error}")
                    
                    if self.args.raise_exceptions:
                        self.env.close()
                        raise e
                    
                    if self.env.record:
                        logger.warning(f"❌ Failed on {self.env.record['instance_id']}: {e}")
                    else:
                        logger.warning("❌ Failed on unknown instance")
                    
                    # Continue execution
                    logger.info("🔄 Continuing execution despite error...")
                    continue
                    
        self.env.close()
        for hook in self.hooks:
            hook.on_end()

    def _save_arguments(self) -> None:
        """Save the arguments to a yaml file to the run's trajectory directory."""
        log_path = self.traj_dir / "args.yaml"

        if log_path.exists():
            try:
                other_args = self.args.load_yaml(log_path)
                if self.args.dumps_yaml() != other_args.dumps_yaml():  # check yaml equality instead of object equality
                    logger.warning("**************************************************")
                    logger.warning("Found existing args.yaml with different arguments!")
                    logger.warning("**************************************************")
            except Exception:
                logger.warning(f"Failed to load existing args.yaml: {traceback.format_exc()}")

        with log_path.open("w") as f:
            self.args.dump_yaml(f)

    def should_skip(self, instance_id: str) -> bool:
        """Check if we should skip this instance based on the instance filter and skip_existing flag."""
        # Skip instances that don't match the instance filter
        if re.match(self.args.instance_filter, instance_id) is None:
            logger.info(f"⏭️ Instance filter not matched. Skipping instance {instance_id}")
            return True

        # If flag is set to False, don't skip
        if not self.args.skip_existing:
            return False

        # Check if there's an existing trajectory for this instance
        base_path = self.traj_dir / instance_id
        counter = 1
        log_path = base_path.with_suffix(".traj")
        
        # If base file exists, try _2, _3 etc.
        while log_path.exists():
            content = log_path.read_text()
            if not content.strip():
                logger.warning("Found empty trajectory: %s. Removing.", log_path)
                log_path.unlink()
                break
                
            data = json.loads(content)
            exit_status = data["info"].get("exit_status", None)
            if exit_status == "early_exit" or exit_status is None:
                logger.warning(f"Found existing trajectory with no exit status: {log_path}. Removing.")
                log_path.unlink()
                break
                
            counter += 1
            log_path = base_path.with_name(f"{instance_id}_{counter}.traj")

        if counter > 1:
            logger.info(f"💾 Creating new trajectory with suffix _{counter-1}")
            
        return False

    def _save_predictions(self, instance_id: str, info, challenge: dict[str, str] | None):
        output_file = self.traj_dir / "all_preds.jsonl"
        model_patch = info["submission"] if "submission" in info else None
        datum = {
            KEY_MODEL: Path(self.traj_dir).name,
            KEY_INSTANCE_ID: instance_id,
            KEY_PREDICTION: model_patch,
        }
        if challenge is not None:
            challenge_datum = {
                "challenge_name": challenge["name"],
                "challenge_category": challenge["category"],
                "challenge_path": challenge["file_path"],
            }
            datum.update(challenge_datum)
        with open(output_file, "a+") as fp:
            print(json.dumps(datum), file=fp, flush=True)
        logger.info(f"Saved predictions to {output_file}")


def get_args(args=None) -> ScriptArguments:
    """Parse command line arguments and return a ScriptArguments object.

    Args:
        args: Optional list of arguments to parse. If not provided, uses sys.argv.
    """
    parser = argparse.ArgumentParser(description="Run SWE-agent with specified model")
    parser.add_argument("--model_name", type=str, help="Model name to use (e.g. gpt4.1, claude-sonnet-3.5)")
    parser.add_argument("--problem_name", type=str, help="Name of the specific problem to solve")
    
    parsed_args = parser.parse_args(args)
    
    defaults = ScriptArguments(
        suffix="",
        environment=EnvironmentArguments(
            image_name="sweagent/enigma:latest",  # Default image
            data_path="",  # Set to empty string
            split="dev",
            verbose=True,
            install_environment=True,
            cache_task_images=False,
            ctf=True,  # Enable CTF mode
            model_name=parsed_args.model_name,  # Add model name
            problem_name=parsed_args.problem_name if parsed_args.problem_name else "",  # Add problem name
        ),
        skip_existing=False,  # Don't skip existing results
        agent=AgentArguments(
            model=ModelArguments(
                model_name=parsed_args.model_name,  # Use model name from command line
                total_cost_limit=3,
                per_instance_cost_limit=3.0,  # Default cost limit
                temperature=0.8,
                top_p=0.95,
            ),
            config_file=CONFIG_DIR / "default_ctf.yaml",
        ),
        actions=ActionsArguments(open_pr=False, skip_if_commits_reference_issue=True),
        ctf=True,  # Enable CTF mode
        instance_filter=".*",  # Allow all instances
        problem_name=parsed_args.problem_name if parsed_args.problem_name else "",  # Set problem_name directly in constructor
    )

    # Nicer yaml dumping of multiline strings
    def multiline_representer(dumper, data):
        """configures yaml for dumping multiline strings
        Ref: https://stackoverflow.com/questions/8640959/how-can-i-control-what-scalar-form-pyyaml-uses-for-my-data
        """
        if data.count("\n") > 0:  # check for multiline string
            return dumper.represent_scalar("tag:yaml.org,2002:str", data, style="|")
        return dumper.represent_scalar("tag:yaml.org,2002:str", data)

    yaml.add_representer(str, multiline_representer)

    return defaults


def main(args: ScriptArguments):    
    main_instance = None
    try:
        # Create Main instance
        main_instance = Main(args)
        
        # Run main loop
        main_instance.main()
        
    except KeyboardInterrupt:
        logger.info("The program was terminated by the user.")
    except SystemExit:
        logger.info("System exit requested.")
        # Attempt container cleanup
        if main_instance and hasattr(main_instance, 'env'):
            try:
                logger.info("🔄 Ensuring environment cleanup on system exit...")
                main_instance.env.close()
                logger.info("✅ Environment cleanup completed")
            except Exception as cleanup_error:
                logger.warning(f"Environment cleanup error: {cleanup_error}")
        raise
    except Exception as e:
        logger.error(f"Critical error occurred during program execution: {str(e)}")
        logger.error(f"Traceback: {traceback.format_exc()}")
        
        # Attempt container recovery without restart
        if main_instance and hasattr(main_instance, 'env'):
            try:
                if hasattr(main_instance.env, 'container') and main_instance.env.container:
                    if main_instance.env.container.poll() is not None:
                        logger.info("🔄 Container has exited after error, restarting...")
                        main_instance.env.container.stdin.write("echo 'reset_container_recovery'\n")
                        main_instance.env.container.stdin.flush()
                        time.sleep(0.1)
                        logger.info("✅ Container recovery completed")
                    else:
                        # Try to recover without container restart
                        logger.info("🔄 Container error detected, attempting recovery without container restart...")
                        try:
                            main_instance.env.container.stdin.write("echo 'main_error_recovery'\n")
                            main_instance.env.container.stdin.flush()
                            time.sleep(0.1)
                            logger.info("✅ Container recovery without restart completed")
                        except Exception:
                            logger.warning("⚠️ Failed to recover from main error, container may need restart")
                else:
                    logger.info("🔄 No container available for recovery")
            except Exception as recovery_error:
                logger.error(f"Container recovery failed: {recovery_error}")
        
        # Continue program execution without re-raising the exception
        logger.info("Continuing program execution despite error...")
        
    finally:
        # Clean up environment
        if main_instance and hasattr(main_instance, 'env'):
            try:
                main_instance.env.close()
                logger.info("Environment closed successfully.")
            except Exception as close_error:
                logger.error(f"Failed to close environment: {close_error}")


if __name__ == "__main__":
    main(get_args())
