"""
OfficeArena: GUI agent evaluation environment for Microsoft Office applications.
"""

import os
import time
from pathlib import Path
from typing import Any, Dict, List, Optional, Tuple

from screenenv import Sandbox

from ..adapter import ActionAdapter
from ..agents import BaseAgent
from ..utils.logger import OfficeArenaLogger
from ..utils.onedrive import OneDriveClient
from ..utils.powerpoint import download_powerpoint_as_images_sync


from io import BytesIO
from PIL import Image

class OfficeArena:
    """
    GUI agent evaluation environment for Microsoft Office applications.
    It integrates with OneDrive for file access and uses
    screenenv for browser-based Office application interaction.
    """

    def __init__(
        self,
        client_id: Optional[str] = None,
        headless: bool = False,
        max_steps: int = 30,
        step_delay: float = 1.0,
        resolution: Optional[Tuple[int, int]] = None,
        onedrive_root_path: str = "/Documents/OfficeArena",
        enable_logging: bool = True,
        log_dir: Optional[str] = None,
    ):
        """
        Initialize the OfficeArena evaluation environment.

        Args:
            client_id: OneDrive client ID (if None, will try to get from env)
            headless: Whether to run browser in headless mode
            max_steps: Maximum number of steps per evaluation
            step_delay: Delay between actions to allow UI updates
            resolution: The resolution of the sandbox (width, height)
            onedrive_root_path: OneDrive root path for file access
            enable_logging: Whether to enable detailed logging
            log_dir: Directory for log files (if None, uses default)
        """
        self.client_id = client_id or os.getenv("CLIENT_ID")
        if not self.client_id:
            raise ValueError("CLIENT_ID must be provided or set in environment variables")

        self.headless = headless
        self.max_steps = max_steps
        self.step_delay = step_delay
        self.resolution = resolution
        self.onedrive_root_path = onedrive_root_path
        self.enable_logging = enable_logging

        # Initialize OneDrive client
        try:
            self.onedrive_client = OneDriveClient(client_id=self.client_id, root_path=onedrive_root_path)
        except Exception as onedrive_init_error:
            # OneDrive initialization failures are infrastructure issues
            raise ValueError(f"Failed to initialize OneDrive client (infrastructure failure): {onedrive_init_error}")

        # Evaluation state
        self.sandbox: Optional[Sandbox] = None
        self.adapter: Optional[ActionAdapter] = None
        self.current_step = 0
        self.task_completed = False
        self.evaluation_history: List[Dict[str, Any]] = []

        # Logger (will be initialized per task)
        self.logger: Optional[OfficeArenaLogger] = None
        self.log_dir = log_dir

    def _check_wacframe_available(self) -> bool:
        """
        Check if WacFrame is available on any of the pages in the browser context.
        This indicates that Office Online has loaded properly.
        
        Returns:
            True if WacFrame is found, False otherwise
        """
        try:
            # Ensure chromium context is properly initialized
            if not hasattr(self.sandbox, 'chromium_context') or not self.sandbox.chromium_context:
                if self.logger:
                    self.logger.log_error("Chromium context not available")
                return False
                
            context = self.sandbox.chromium_context
            if not context.pages:
                if self.logger:
                    self.logger.log_error("No pages available in chromium context")
                return False
                
            page = context.pages[0]
            
            # Check frames directly (like in powerpoint.py)
            for f in page.frames:
                try:
                    # Handle both callable and property-style name access
                    name = getattr(f, "name", lambda: "")()
                except Exception:
                    try:
                        name = f.name
                    except Exception:
                        name = ""
                
                if "WacFrame" in str(name):
                    return True
                    
            return False
            
        except Exception as e:
            if self.logger:
                self.logger.log_error(f"Error checking WacFrame availability: {str(e)}")
            return False

    def _wait_for_office_online_ready(self, max_retries: int = 3, wait_timeout: int = 10) -> None:
        """
        Wait for Office Online to be ready by checking for the WacFrame iframe.
        If not ready, refresh the page and retry.
        
        Args:
            max_retries: Maximum number of refresh attempts
            wait_timeout: Seconds to wait for iframe to load each attempt
        """
        for attempt in range(max_retries + 1):  # +1 for initial attempt
            try:
                # Wait for the page to load initially and browser to be ready
                initial_wait = 5 if attempt == 0 else 3
                time.sleep(initial_wait)
                
                # Wait up to wait_timeout seconds for the WacFrame to appear
                start_time = time.time()
                while time.time() - start_time < wait_timeout:
                    try:
                        # Ensure chromium context is properly initialized
                        if not hasattr(self.sandbox, 'chromium_context') or not self.sandbox.chromium_context:
                            time.sleep(1)
                            continue
                            
                        context = self.sandbox.chromium_context
                        if not context.pages:
                            time.sleep(1)
                            continue
                            
                        page = context.pages[0]
                        
                        # Check frames directly (like in powerpoint.py)
                        wac_frames = []
                        for f in page.frames:
                            try:
                                # Handle both callable and property-style name access
                                name = getattr(f, "name", lambda: "")()
                            except Exception:
                                try:
                                    name = f.name
                                except Exception:
                                    name = ""
                            
                            if "WacFrame" in str(name):
                                wac_frames.append(f)
                        
                        if wac_frames:
                            message = f"[OfficeArena] ✅ Office Online ready (WacFrame detected on attempt {attempt + 1})"
                            print(message)
                            if self.logger:
                                self.logger.log_info(message)
                            return
                            
                    except Exception:
                        # Frame access might fail while page is loading
                        pass
                    
                    time.sleep(1)
                
                # If we reach here, WacFrame wasn't found within timeout
                if attempt < max_retries:
                    message = f"[OfficeArena] ⚠️  Office Online not ready (attempt {attempt + 1}), refreshing page..."
                    print(message)
                    if self.logger:
                        self.logger.log_info(message)
                    
                    # Refresh the page using Playwright
                    try:
                        if hasattr(self.sandbox, 'chromium_context') and self.sandbox.chromium_context:
                            context = self.sandbox.chromium_context
                            if context.pages:
                                page = context.pages[0]
                                page.reload()
                    except Exception as e:
                        print(f"[OfficeArena] Failed to refresh page: {e}")
                else:
                    # Final attempt failed
                    message = f"[OfficeArena] ⚠️  Office Online may not be fully ready after {max_retries} retries, continuing anyway"
                    print(message)
                    if self.logger:
                        self.logger.log_info(message)
                    
            except Exception as e:
                error_msg = f"Error checking Office Online readiness: {str(e)}"
                if self.logger:
                    self.logger.log_error(error_msg)
                
                if attempt < max_retries:
                    print(f"[OfficeArena] Retrying Office Online check (attempt {attempt + 1})")
                    time.sleep(2)
                else:
                    print(f"[OfficeArena] ⚠️  {error_msg}, continuing evaluation")
                    break

    def start_evaluation(self, file_path: str, task_instruction: str) -> bytes:
        """
        Start an evaluation session by opening the specified Office file.

        Args:
            file_path: Path to the Office file in OneDrive (relative to root)
            task_instruction: Description of the task to complete

        Returns:
            Initial screenshot as bytes
        """
        # Clean up any previous session
        if self.sandbox:
            self.sandbox.close()

        # Initialize logger for this task
        if self.enable_logging:
            task_id = f"{Path(file_path).stem}_{int(time.time())}"
            self.logger = OfficeArenaLogger(log_dir=self.log_dir, task_id=task_id)
            self.logger.start_task(file_path, task_instruction)

        # Initialize new sandbox for evaluation
        sandbox_kwargs = {"headless": self.headless}
        if self.resolution is not None:
            sandbox_kwargs["resolution"] = self.resolution

        try:
            self.sandbox = Sandbox(**sandbox_kwargs)
        except Exception as sandbox_error:
            error_msg = f"Failed to initialize sandbox: {sandbox_error}"
            if self.logger:
                self.logger.log_error(error_msg)
            raise RuntimeError(error_msg)
        # self.adapter = ActionAdapter(self.sandbox)
        # self.adapter = ClaudeActionAdapter(self.sandbox)

        # Reset evaluation state
        self.current_step = 0
        self.task_completed = False
        self.evaluation_history = []

        try:
            try:
                edit_link = self.onedrive_client.get_edit_link(file_path)
            except Exception as link_error:
                # OneDrive API failures (rate limiting, network, auth) are infrastructure failures
                if "rate" in str(link_error).lower() or "429" in str(link_error) or "throttl" in str(link_error).lower():
                    error_msg = f"OneDrive rate limit exceeded while getting edit link: {link_error}"
                elif "network" in str(link_error).lower() or "connection" in str(link_error).lower() or "timeout" in str(link_error).lower():
                    error_msg = f"Network error while getting edit link: {link_error}"
                elif "auth" in str(link_error).lower() or "token" in str(link_error).lower() or "401" in str(link_error) or "403" in str(link_error):
                    error_msg = f"Authentication error while getting edit link: {link_error}"
                else:
                    error_msg = f"OneDrive API error while getting edit link: {link_error}"
                
                if self.logger:
                    self.logger.log_error(error_msg, "OneDrive edit link")
                raise RuntimeError(f"infrastructure failure: {error_msg}")
                
            if not edit_link:
                error_msg = f"Failed to get edit link for file: {file_path}"
                if self.logger:
                    self.logger.log_error(error_msg, "OneDrive edit link")
                raise RuntimeError(f"infrastructure failure: {error_msg}")
                
            try:
                self.sandbox.open(edit_link)
            except Exception as open_error:
                # Sandbox opening failures are infrastructure issues
                error_msg = f"Failed to open file in sandbox: {open_error}"
                if self.logger:
                    self.logger.log_error(error_msg, "Sandbox open")
                raise RuntimeError(f"infrastructure failure: {error_msg}")

            # Wait for file to load completely and check for Office Online availability
            self._wait_for_office_online_ready(max_retries=3)
            time.sleep(2)  # Additional wait for full initialization

            # Set up PowerPoint classic ribbon for better automation compatibility
            if file_path.lower().endswith((".pptx", ".ppt")):
                try:
                    from ..utils.powerpoint import ensure_classic_ribbon_always_show

                    message = "[OfficeArena] Setting up PowerPoint classic ribbon..."
                    print(message)
                    if self.logger:
                        self.logger.log_info(message)

                    ribbon_success = ensure_classic_ribbon_always_show(sandbox=self.sandbox, verbose=True)
                    if ribbon_success:
                        message = "[OfficeArena] ✅ Classic ribbon setup successful"
                        print(message)
                        if self.logger:
                            self.logger.log_info(message)
                    else:
                        message = "[OfficeArena] ⚠️  Classic ribbon setup had issues, continuing anyway"
                        print(message)
                        if self.logger:
                            self.logger.log_info(message)
                except Exception as ribbon_error:
                    message = f"[OfficeArena] ⚠️  Failed to set up classic ribbon: {ribbon_error}"
                    print(message)
                    if self.logger:
                        self.logger.log_error(str(ribbon_error), "PowerPoint classic ribbon setup")
                    # Continue evaluation even if ribbon setup fails

            # Take initial screenshot
            screenshot = self.sandbox.desktop_screenshot()

            # Log initial screenshot if logging enabled
            if self.logger:
                self.logger.log_info("Initial screenshot captured")

            # Record evaluation start
            self.evaluation_history.append(
                {
                    "type": "evaluation_start",
                    "file_path": file_path,
                    "task_instruction": task_instruction,
                    "edit_link": edit_link,
                    "timestamp": time.time(),
                }
            )

            return screenshot

        except Exception as e:
            error_msg = f"Failed to start evaluation with file {file_path}: {str(e)}"
            if self.logger:
                self.logger.log_error(error_msg)
            if self.sandbox:
                self.sandbox.close()
                self.sandbox = None
            # Check if this is an infrastructure failure (like edit link failure)
            if "infrastructure failure:" in str(e):
                raise e  # Re-raise infrastructure failures as-is
            else:
                raise RuntimeError(f"infrastructure failure: {error_msg}")

    def execute_action(self, action: str) -> Dict[str, Any]:
        """
        Execute a single action and return the result with screenshot.

        Args:
            action: Action string with args

        Returns:
            Dictionary containing:
            - screenshot: Screenshot after action execution (bytes)
            - action_success: Whether the action executed successfully
            - task_completed: Whether the task is marked as completed
            - step_info: Additional information about the step
            - evaluation_complete: Whether max steps reached or task finished
        """
        if not self.sandbox or not self.adapter:
            raise RuntimeError("Evaluation not started. Call start_evaluation() first.")

        if self.current_step >= self.max_steps:
            raise RuntimeError("Maximum steps reached. Evaluation complete.")

        # Execute the action
        action_result = self.adapter.execute_action(action)

        # Update step counter
        self.current_step += 1

        # Check if task is marked as completed
        if action_result.get("task_completed", False):
            self.task_completed = True

        # Take screenshot after action with delay for UI updates
        time.sleep(self.step_delay)
        screenshot = self.sandbox.desktop_screenshot()
        
        obs_screenshot = screenshot
        
        if isinstance(action_result['result'], dict) and 'pending_executions' in action_result['result']:
            pending_executions = action_result['result']['pending_executions']
            for pending in pending_executions:
                if pending['action'] == 'zoom':
                    region = pending['action_args']['region']
                    
                    image_stream = BytesIO(screenshot)
                    with Image.open(image_stream) as image:
                        original_format = image.format or 'PNG'
                        cropped_image = image.crop(region)
                        output_stream = BytesIO()
                        cropped_image.save(output_stream, format=original_format)
                        cropped_bytes = output_stream.getvalue()
                        obs_screenshot = cropped_bytes
                        
        # Log the action with enhanced logging
        if self.logger:
            self.logger.log_action(action, action_result, screenshot)

        # Determine if evaluation is complete
        evaluation_complete = self.task_completed or self.current_step >= self.max_steps

        # Record the step
        step_record = {
            "type": "action_step",
            "step": self.current_step,
            "action": action,
            "action_result": action_result,
            "task_completed": self.task_completed,
            "timestamp": time.time(),
        }
        self.evaluation_history.append(step_record)

        return {
            "screenshot": screenshot,
            "obs_screenshot": obs_screenshot,
            "action_success": action_result["success"],
            "task_completed": self.task_completed,
            "step_info": {
                "step": self.current_step,
                "max_steps": self.max_steps,
                "action": action,
                "action_result": action_result,
            },
            "evaluation_complete": evaluation_complete,
        }

    def evaluate_agent(
        self,
        agent: BaseAgent,
        file_path: str,
        task_instruction: str,
        save_screenshots: bool = False,
        save_online_images: bool = False,
        screenshot_dir: Optional[str] = None,
    ) -> Dict[str, Any]:
        """
        Run a complete evaluation of an agent on a specific Office task.

        Args:
            agent: The agent to evaluate
            file_path: Path to the Office file in OneDrive
            task_instruction: Task description
            save_screenshots: Whether to save screenshots during evaluation
            save_only_images: Whether to only save images
            screenshot_dir: Directory to save screenshots (if save_screenshots=True)

        Returns:
            Complete evaluation results
        """
        # Setup screenshot directory if needed
        if save_screenshots and not screenshot_dir:
            screenshot_dir = f"evaluation_{int(time.time())}"

        if save_screenshots:
            Path(screenshot_dir).mkdir(exist_ok=True)

        # Initialize status tracking
        execution_status = "success"
        verification_status = "success"
        infrastructure_failure_reason = None

        try:
            # Reset agent and start evaluation
            agent.reset()
            
            try:
                current_screenshot = self.start_evaluation(file_path, task_instruction)
                current_obs_screenshot = current_screenshot
            except RuntimeError as start_error:
                # Check if this is an infrastructure failure from start_evaluation
                if "infrastructure failure:" in str(start_error):
                    infrastructure_failure_reason = str(start_error).replace("infrastructure failure: ", "")
                    execution_status = f"infrastructure failure: {infrastructure_failure_reason}"
                    if self.logger:
                        self.logger.log_error(infrastructure_failure_reason, "Start evaluation")
                    
                    return {
                        "success": False,
                        "steps_taken": 0,
                        "max_steps": self.max_steps,
                        "completed_within_limit": False,
                        "file_path": file_path,
                        "task_instruction": task_instruction,
                        "final_screenshot_saved": save_screenshots,
                        "screenshot_directory": screenshot_dir if save_screenshots else None,
                        "downloaded_file_path": None,
                        "execution_status": execution_status,
                        "verification_status": None,
                        "error": infrastructure_failure_reason,
                        "log_paths": self.logger.get_log_paths() if self.logger else None,
                    }
                else:
                    # Re-raise other start_evaluation errors
                    raise
            
            # Check if Office Online loaded properly by checking for WacFrame
            if not self._check_wacframe_available():
                infrastructure_failure_reason = "PowerPoint application did not load (WacFrame not found)"
                execution_status = f"infrastructure failure: {infrastructure_failure_reason}"
                if self.logger:
                    self.logger.log_error(infrastructure_failure_reason, "Office Online check")
                
                return {
                    "success": False,
                    "steps_taken": 0,
                    "max_steps": self.max_steps,
                    "completed_within_limit": False,
                    "file_path": file_path,
                    "task_instruction": task_instruction,
                    "final_screenshot_saved": save_screenshots,
                    "screenshot_directory": screenshot_dir if save_screenshots else None,
                    "downloaded_file_path": None,
                    "execution_status": execution_status,
                    "verification_status": None,
                    "error": infrastructure_failure_reason,
                    "log_paths": self.logger.get_log_paths() if self.logger else None,
                }
            
            self.adapter = agent.action_adapter_class(self.sandbox)

            # Save initial screenshot
            if save_screenshots:
                initial_path = Path(screenshot_dir) / "step_000_initial.png"
                with open(initial_path, "wb") as f:
                    f.write(current_screenshot)

            # Run the evaluation loop
            while not self.task_completed and self.current_step < self.max_steps:
                # Get action from agent
                action = agent.step(current_obs_screenshot, task_instruction)

                # Execute action
                result = self.execute_action(action)
                current_obs_screenshot = result["obs_screenshot"]
                current_screenshot = result["screenshot"]
                action_type = result["step_info"]["action_result"].get("action_type", "")

                # Save screenshot if enabled
                if save_screenshots:
                    screenshot_path = Path(screenshot_dir) / f"step_{self.current_step:03d}_{action_type}.png"
                    with open(screenshot_path, "wb") as f:
                        f.write(current_screenshot)

                # Check if evaluation is complete
                if result["evaluation_complete"]:
                    break

            # Download the slides as a zip file if this is a PowerPoint presentation
            if save_screenshots and screenshot_dir and file_path.lower().endswith((".ppt", ".pptx")):
                try:
                    message = "Downloading PowerPoint slides as images"
                    if self.logger:
                        self.logger.log_info(message)
 
                    # Download images using the sync function
                    try:
                        images_zip_name = download_powerpoint_as_images_sync(sandbox=self.sandbox, download_dir=screenshot_dir, verbose=True, download_timeout=10)
                    except Exception as ppt_download_error:
                        # PowerPoint download function failures could be infrastructure issues
                        error_msg = f"PowerPoint image download function failed: {ppt_download_error}"
                        if self.logger:
                            self.logger.log_error(error_msg, "PowerPoint download")
                        if execution_status == "success":
                            verification_status = "failed: image missing"
                        images_zip_name = None
                        
                    print(f"Images zip name returned by function: {images_zip_name}")

                    if images_zip_name:
                        if images_zip_name.startswith("/"):
                            path = images_zip_name
                        else:
                            images_zip_name = Path(images_zip_name)
                            path = "/home/user/desktop/"+str(images_zip_name.parent)+"/" + images_zip_name.name
                        local_dest = str(Path(screenshot_dir) / Path(file_path).with_suffix(".zip").name)
                        if self.logger:
                            self.logger.log_info(f"Downloading PowerPoint images zip from {path} to {local_dest}")
                        
                        try:
                            self.sandbox.download_file_from_remote(path, local_dest)
                        except Exception as download_error:
                            # Sandbox download failure is an infrastructure issue
                            error_msg = f"Failed to download PowerPoint images via sandbox: {download_error}"
                            if self.logger:
                                self.logger.log_error(error_msg, "PowerPoint download")
                            if execution_status == "success":
                                verification_status = "failed: image missing"
                    else:
                        error_message = "Failed to download PowerPoint images"
                        if self.logger:
                            self.logger.log_error(error_message, "PowerPoint download")
                        if execution_status == "success":
                            verification_status = "failed: image missing"
                except Exception as e:
                    error_msg = f"Error downloading PowerPoint images: {str(e)}"
                    if self.logger:
                        self.logger.log_error(error_msg, "PowerPoint download")
                    if execution_status == "success":
                        verification_status = "failed: image missing"
                        
            # Download the final file if the task was successful
            downloaded_file_path = None
            if save_screenshots and screenshot_dir:
                try:
                    message = f"Task finished. Downloading final file: {file_path}"
                    if self.logger:
                        self.logger.log_info(message)

                    try:
                        downloaded_file_path = self.onedrive_client.download_file(file_path, screenshot_dir)
                    except Exception as download_error:
                        # OneDrive download failures are infrastructure failures
                        if "rate" in str(download_error).lower() or "429" in str(download_error) or "throttl" in str(download_error).lower():
                            error_msg = f"OneDrive rate limit exceeded while downloading file: {download_error}"
                        elif "network" in str(download_error).lower() or "connection" in str(download_error).lower() or "timeout" in str(download_error).lower():
                            error_msg = f"Network error while downloading file: {download_error}"
                        elif "auth" in str(download_error).lower() or "token" in str(download_error).lower() or "401" in str(download_error) or "403" in str(download_error):
                            error_msg = f"Authentication error while downloading file: {download_error}"
                        else:
                            error_msg = f"OneDrive API error while downloading file: {download_error}"
                        
                        if self.logger:
                            self.logger.log_error(error_msg, "File download")
                        # Final file download failure is an infrastructure failure - task needs to be rerun
                        if execution_status == "success":
                            execution_status = f"infrastructure failure: {error_msg}"
                            infrastructure_failure_reason = error_msg
                        raise

                    success_message = f"Successfully downloaded file to: {downloaded_file_path}"
                    if self.logger:
                        self.logger.log_info(success_message)
                except Exception as e:
                    error_msg = f"Error downloading final file: {str(e)}"
                    if self.logger:
                        self.logger.log_error(error_msg, "File download")
                    # Final file download failure is an infrastructure failure - task needs to be rerun
                    if execution_status == "success":
                        execution_status = f"infrastructure failure: {error_msg}"
                        infrastructure_failure_reason = error_msg

            # Determine overall success based on execution status and file/image downloads
            overall_success = self.task_completed
            if execution_status.startswith("infrastructure failure"):
                overall_success = False

            # Compile final results
            evaluation_results = {
                "success": overall_success,
                "steps_taken": self.current_step,
                "max_steps": self.max_steps,
                "completed_within_limit": self.task_completed and self.current_step <= self.max_steps,
                "file_path": file_path,
                "task_instruction": task_instruction,
                "final_screenshot_saved": save_screenshots,
                "screenshot_directory": screenshot_dir if save_screenshots else None,
                "downloaded_file_path": downloaded_file_path,
                "execution_status": execution_status,
                "verification_status": verification_status,
            }

            # Log task completion
            if self.logger:
                self.logger.end_task(self.task_completed, self.current_step)
                evaluation_results["log_paths"] = self.logger.get_log_paths()

            return evaluation_results

        except Exception as e:
            error_msg = str(e)
            if self.logger:
                self.logger.log_error(error_msg, "evaluate_agent")
                self.logger.end_task(False, self.current_step)

            # Determine if this is an infrastructure failure
            if infrastructure_failure_reason or "connection" in error_msg.lower() or "network" in error_msg.lower():
                execution_status = f"infrastructure failure: {infrastructure_failure_reason or error_msg}"

            return {
                "success": False,
                "error": error_msg,
                "steps_taken": self.current_step,
                "file_path": file_path,
                "task_instruction": task_instruction,
                "execution_status": execution_status,
                "verification_status": None,
            }

        finally:
            # cleanup
            self.sandbox.close()
            self.adapter = None
            agent.close()

    def get_current_screenshot(self) -> bytes:
        """
        Get the current screenshot of the Office application.

        Returns:
            Current screenshot as bytes
        """
        if not self.sandbox:
            raise RuntimeError("No active evaluation session. Call start_evaluation() first.")

        return self.sandbox.desktop_screenshot()

    def get_evaluation_status(self) -> Dict[str, Any]:
        """
        Get the current status of the evaluation.

        Returns:
            Dictionary with evaluation status information
        """
        return {
            "current_step": self.current_step,
            "max_steps": self.max_steps,
            "task_completed": self.task_completed,
            "evaluation_active": self.sandbox is not None,
            "steps_remaining": max(0, self.max_steps - self.current_step),
        }

    def close(self) -> None:
        """Clean up evaluation resources."""
        if self.sandbox:
            self.sandbox.close()
            self.sandbox = None
            
        self.adapter = None

        # Close logger if it exists
        if self.logger:
            self.logger.close()
            self.logger = None

        # Record evaluation end
        if self.evaluation_history:
            self.evaluation_history.append(
                {
                    "type": "evaluation_end",
                    "final_step": self.current_step,
                    "task_completed": self.task_completed,
                    "timestamp": time.time(),
                }
            )

    def __enter__(self):
        """Context manager entry."""
        return self

    def __exit__(self, exc_type, exc_value, traceback):
        """Context manager exit."""
        self.close()
