#!/usr/bin/env python3
import os
import re
import subprocess

# Import project modules
from src.llm import CustomModel
from src.logger import setup_logger
from src.memory import Memory


hf_model = os.getenv("AGENT_LLM_MODEL", "default_model")
run_id = os.getenv("RUN_ID", "default_run")

logger = setup_logger(
    __name__,
    level="INFO",
    log_subdir=hf_model,
    log_filename=f"run_{run_id}.log"
)

class Agent:
    """
    Agent class that serves as the central coordinator of the AI system.
    Processes user commands, interacts with the LLM, and executes system operations.
    """
    
    def __init__(self, hf_model=None, close_name=None):
        """
        Initialize the Agent with LLM connection.
        
        Args:
            hf_model (str, optional): Name of the Huggingface model
            close_name (str, optional): Name of the closed-source model
        """
        logger.info("Initializing Agent")
        
        # Initialize LLM interface
        try:
            self.llm = CustomModel(
                hf_model=hf_model,
                close_name=close_name
            )
            logger.info("LLM interface initialized successfully")
        except Exception as e:
            logger.error(f"Failed to initialize LLM interface: {str(e)}")
            raise

        # Agent final goal, specify by the user
        self.goal = None
        
        # past [state, command, output]s
        self.history = [] 
        
        # Agent state
        self.running = False

        # Agent specific state: [init, in_progress, finished]
        self.state = None

        # Agent output from the previous step
        self.last_output = None

        self.last_command = None

        # [{command: result}]
        self.memory = Memory(max_length=10000)
        
        logger.info("Agent initialization complete")

    def set_goal(self, goal):
        """
        Initialize agent with a user-defined goal.
        """
        logger.info(f"Got User Final Goal: {goal}")
        self.goal = goal
        self.state = "init"
        self.running = True
        self.history = []
        self.last_output = None
        self.command_history = []
    
    def start(self):
        """Start the agent"""
        logger.info("Starting Agent")
        self.running = True
        
    def stop(self):
        """Stop the agent"""
        logger.info("Stopping Agent")
        self.running = False
    
    def step(self, step_idx):
        """
        Execute a single decision-action cycle based on current goal, state, and last output.
        """
        if self.state == "finished":
            self.running = False
            return {"status": "finished", "message": "Goal already completed."}
        
        try:
            # First, simply try to interpret as "shell_command" the most common commands
            if self.goal.startswith("ls") or self.goal.startswith("cd ") or self.goal.startswith("pwd") or \
               self.goal.startswith("cat ") or self.goal.startswith("date") or self.goal.startswith("echo "):
                action = {"type": "shell_command", "command": self.goal}
                logger.debug(f"Direct shell command interpretation: {action}")
            else:
                # Generate system prompt with the command
                prompt = self.decide_cur_command(self.goal, self.state, self.command_history, self.memory)
                
                # Get response from LLM
                llm_response = self.llm.generate(
                    prompt=prompt,
                    max_tokens=4096,
                    temperature=0.7
                )
                
                logger.debug(f"LLM response: {llm_response}")
                
                # Parse LLM response to determine action
                action = self._parse_llm_response(llm_response)
                logger.debug(f"Parsed action: {action}")

            if action['type'] == "shell_command":
                self.command_history.append(action['command'])
            
            print(self.command_history)
            # Execute the determined action
            result = self._execute_action(action)

            logger.debug(f"Outputs of Current Command: {result}")
            self.memory.add(
                step = step_idx,
                command = action.get("command", "unknown"),
                result_dict = result
            )

            self.last_output = result
            self.state = self.update_state(result)
            if self.state == "finished":
                logger.info(f"Final goal has been achieved successfully!")
                self.running = False
                return {
                    "status": "finished", 
                    "action": action.get("type", "response"),
                    "result": result
                }
            else:
                logger.info(f"Continue to achieve the final goal")
                return {
                    "status": "in_progress", 
                    "action": action.get("type", "response"),
                    "result": result
                }
            
        except Exception as e:
            logger.error(f"Error processing goal '{self.goal}': {str(e)}")
            logger.info(f"Continue to achieve the final goal")
            return {
                "status": "error",
                "error": str(e)
            }
    def decide_cur_command(self, goal, state, command, memory):
        """
        Use the LLM to decide what command to run next, based on current context.
        """
        prompt = f'''
You are an autonomous agent helping to achieve a high-level command-line task.

Final Goal: "{goal}"
Current State: "{state}"
Command History: {command}
Execute History (Memory): {memory}

Your job is to decide what to do next based on your memory of previous actions and outcomes.

First, determine whether the final goal has already been completed based on the previous commands and their results.

- If yes, reply with:
ACTION: finished

- If not, proceed with the following reflection and reasoning steps:

(i) Explanation: What is your understanding of the current situation?
(ii) Gaps: What is missing or unknown that prevents goal completion?
(iii) Findings: What relevant information have you learned from the environment or previous command outputs?
(iv) Plan: Describe the next three steps needed to move toward the final goal.
(v) Action: What exact action will you take now?

If you decide to proceed with a shell command, respond with:
ACTION: shell
COMMAND: <the exact shell command to run>

Reply using ONLY this format, with no additional text.
''' 
        return prompt

    def extract_command(self, response):
        pattern = re.compile(
            r"""
            (?:\*\*|__)?\s* 
            command\s*              
            [:：]\s*               
            (.*?)                 
            (?=                    
                \s*(?:\*\*|__)?\s* 
                (?:action\s*:|step(?:\s+\d+)?|\#|$|。|；|,|，|;|\n|to e|to p|to v|to d|to i|to c)
            )
            """,
            re.IGNORECASE | re.DOTALL | re.VERBOSE
        )
        match = pattern.search(response)
        if match:
            cmd = match.group(1).strip()
            cmd = re.sub(r"^(?:\*\*|__)\s*", "", cmd)
            for explainer in ["to ensure", "to proceed","to verify", "for", "because", "in order to", "so that"]:
                idx = cmd.lower().find(explainer)
                if idx > 0:
                    cmd = cmd[:idx].strip()
            return cmd
        return None

    def _parse_llm_response(self, response):
        """
        Parse the LLM's response to extract the action.
        
        Args:
            response (str): The LLM response text
            
        Returns:
            dict: The parsed action
        """
        try:
            command = self.extract_command(response)
            if command:
                return {"type": "shell_command", "command": command}
                
            respond_match = re.search(r'ACTION:\s*respond\s*\nCONTENT:\s*(.*?)(?:\n\n|$)', response, re.IGNORECASE | re.DOTALL)
            if respond_match:
                content = respond_match.group(1).strip()
                return {"type": "response", "content": content}
                
            error_match = re.search(r'ACTION:\s*error\s*\nREASON:\s*(.*?)(?:\n|$)', response, re.IGNORECASE | re.DOTALL)
            if error_match:
                error = error_match.group(1).strip()
                return {"type": "error", "error": error}

            finish_match = re.search(r'ACTION:\s*finished\s*', response, re.IGNORECASE | re.DOTALL)
            if finish_match:
                return {"type": "finished"}
                
            # If we couldn't parse using our simple format, treat as a regular response
            logger.warning("Could not parse LLM response as ACTION format, treating as plain text")
            return {
                "type": "response",
                "content": response
            }
            
        except Exception as e:
            logger.error(f"Error parsing LLM response: {str(e)}")
            return {
                "type": "error",
                "error": f"Failed to parse LLM response: {str(e)}",
                "original_response": response
            }

    def update_state(self, result):
        """
        Update the internal state based on output. This can be enhanced with better heuristics.
        """
        if result == "finished":
            return "finished"
        return "in_progress"
    
    def _execute_action(self, action):
        """
        Execute the parsed action.
        
        Args:
            action (dict): The action to execute
            
        Returns:
            dict: The result of the action
        """
        action_type = action.get("type", "unknown")
        
        if action_type == "shell_command":
            # Clean up the command if needed
            command = action.get("command", "").strip()
            return self._execute_shell_command(command)
            
        elif action_type == "response":
            # Just return the content
            return {"output": action.get("content", "")}
            
        elif action_type == "error":
            logger.error(f"Action error: {action.get('error', 'Unknown error')}")
            return {"error": action.get("error", "Unknown error")}

        elif action_type == "finished":
            return "finished"
            
        else:
            logger.warning(f"Unknown action type: {action_type}")
            return {"error": f"Unknown action type: {action_type}"}
    
    def _execute_shell_command(self, command):
        """
        Execute a shell command.
        
        Args:
            command (str): The shell command to execute
            
        Returns:
            dict: The result with stdout, stderr, and return code
        """
        if not command:
            return {"error": "Empty command"}
        
        logger.info(f"Executing shell command: {command}")
        
        try:
            # Execute the command
            process = subprocess.Popen(
                command,
                shell=True,
                stdout=subprocess.PIPE,
                stderr=subprocess.PIPE,
                text=True
            )
            
            # Set a timeout (default 61 seconds)
            try:
                stdout, stderr = process.communicate(timeout=61)
                return_code = process.returncode

                logger.info(f"Command stdout: {stdout}")
                logger.info(f"Command stderr: {stderr}")
                logger.info(f"Command return code: {return_code}")
                
                result = {
                    "stdout": stdout,
                    "stderr": stderr,
                    "return_code": return_code
                }
                
                if return_code != 0:
                    logger.warning(f"Command returned non-zero exit code {return_code}: {command}")
                    result["status"] = "error"
                else:
                    result["status"] = "success"
                    
                return result
                
            except subprocess.TimeoutExpired:
                # Kill the process if it times out
                process.kill()
                logger.error(f"Command timed out after 60 seconds: {command}")
                return {
                    "status": "error",
                    "error": "Command execution timed out after 60 seconds"
                }
                
        except Exception as e:
            logger.error(f"Error executing command '{command}': {str(e)}")
            return {
                "status": "error",
                "error": f"Command execution failed: {str(e)}"
            }

    def llm_health_check(self, prompt="health_check"):
        """
        Send a health check request to the LLM to check if the LLM is ready, and customize the prompt.
        """
        try:
            response = self.llm.generate(prompt=prompt, max_tokens=8, temperature=0.3)
            return {"llm_status": "ok", "llm_response": response}
        except Exception as e:
            return {"llm_status": "error", "error": str(e)}