#!/usr/bin/env python3
"""
OpenHands SDK Evaluation Script
Run data analysis tasks using OpenHands framework with real-time trajectory logging
"""

import os
import json
import sys
import atexit
from datetime import datetime
from pathlib import Path

from openhands.sdk import LLM, Agent, Conversation, Tool
from openhands.tools.file_editor import FileEditorTool
from openhands.tools.task_tracker import TaskTrackerTool
from openhands.tools.terminal import TerminalTool


# Global trajectory file handle for real-time writing
_trajectory_file = None
_event_count = 0

# Statistics
_stats = {
    'total_tokens': 0,
    'prompt_tokens': 0,
    'completion_tokens': 0,
    'interaction_rounds': 0,
    'events': [],
    'start_time': None,
    'end_time': None,
}
_stats_file_path = None


def init_trajectory_file(trajectory_path: Path):
    """Initialize trajectory file for real-time writing"""
    global _trajectory_file
    trajectory_path.parent.mkdir(parents=True, exist_ok=True)
    _trajectory_file = open(trajectory_path, 'w', encoding='utf-8')
    # Register file closing on exit
    atexit.register(close_trajectory_file)
    print(f"[TRAJECTORY] Real-time trajectory file created: {trajectory_path}", flush=True)


def close_trajectory_file():
    """Close trajectory file"""
    global _trajectory_file
    if _trajectory_file is not None:
        try:
            _trajectory_file.close()
        except:
            pass
        _trajectory_file = None


def save_stats():
    """Save statistics to file"""
    global _stats, _stats_file_path
    
    if _stats_file_path is None:
        return
    
    try:
        _stats['end_time'] = datetime.now().isoformat()
        _stats['total_events'] = _event_count
        
        # Calculate total duration
        if _stats['start_time'] and _stats['end_time']:
            start = datetime.fromisoformat(_stats['start_time'])
            end = datetime.fromisoformat(_stats['end_time'])
            _stats['duration_seconds'] = (end - start).total_seconds()
        
        with open(_stats_file_path, 'w', encoding='utf-8') as f:
            json.dump(_stats, f, ensure_ascii=False, indent=2)
        
        print(f"[STATS] Statistics saved: {_stats_file_path}", flush=True)
        print(f"[STATS] Total tokens: {_stats['total_tokens']}, "
              f"Interactions: {_stats['interaction_rounds']}, "
              f"Events: {_event_count}", flush=True)
    except Exception as e:
        print(f"[STATS] Failed to save statistics: {e}", flush=True)


def event_callback(event):
    """Callback function to save each event to trajectory file and collect statistics"""
    global _trajectory_file, _event_count, _stats
    
    event_data = {
        'timestamp': datetime.now().isoformat(),
        'event_type': type(event).__name__,
    }
    
    # Try to get event attributes
    if hasattr(event, '__dict__'):
        for key, value in event.__dict__.items():
            try:
                # Try JSON serialization
                json.dumps(value)
                event_data[key] = value
            except (TypeError, ValueError):
                event_data[key] = str(value)
    
    # Collect statistics
    event_type = type(event).__name__
    
    # Collect token usage information
    if hasattr(event, 'usage') and event.usage:
        if hasattr(event.usage, 'prompt_tokens'):
            _stats['prompt_tokens'] += event.usage.prompt_tokens
        if hasattr(event.usage, 'completion_tokens'):
            _stats['completion_tokens'] += event.usage.completion_tokens
        if hasattr(event.usage, 'total_tokens'):
            _stats['total_tokens'] += event.usage.total_tokens
    
    # Count interaction rounds (based on agent response events)
    if 'AgentResponse' in event_type or 'MessageEvent' in event_type:
        _stats['interaction_rounds'] += 1
    
    # Record event summary
    _stats['events'].append({
        'type': event_type,
        'timestamp': event_data['timestamp']
    })
    
    # Write to trajectory file in real-time
    if _trajectory_file is not None:
        try:
            _trajectory_file.write(json.dumps(event_data, ensure_ascii=False, default=str) + '\n')
            _trajectory_file.flush()  # Flush to disk immediately
            _event_count += 1
            # Print progress every 10 events
            if _event_count % 10 == 0:
                print(f"[TRAJECTORY] Recorded {_event_count} events", flush=True)
        except Exception as e:
            print(f"[TRAJECTORY] Failed to write event: {e}", flush=True)
    
    # Save statistics periodically
    if _event_count % 10 == 0:
        save_stats()


def main():
    global _event_count, _stats, _stats_file_path
    
    # Support custom trajectory save path
    trajectory_path_str = os.getenv("TRAJECTORY_PATH", None)
    stats_path_str = os.getenv("STATS_PATH", None)
    cwd = os.getcwd()
    
    # Determine trajectory save path
    if trajectory_path_str:
        save_path = Path(trajectory_path_str)
    else:
        save_path = Path(cwd) / "trajectory.jsonl"
    
    # Determine statistics save path
    if stats_path_str:
        _stats_file_path = Path(stats_path_str)
    elif trajectory_path_str:
        # If trajectory path is specified, put stats file in the same directory
        _stats_file_path = Path(trajectory_path_str).parent / (Path(trajectory_path_str).stem + "_stats.json")
    else:
        _stats_file_path = Path(cwd) / "stats.json"
    
    # Initialize statistics
    _stats['start_time'] = datetime.now().isoformat()
    _stats_file_path.parent.mkdir(parents=True, exist_ok=True)
    print(f"[STATS] Statistics file: {_stats_file_path}", flush=True)
    
    # Register save statistics on exit
    atexit.register(save_stats)
    
    # Initialize trajectory file (real-time writing mode)
    init_trajectory_file(save_path)
    
    # Configure LLM
    llm = LLM(
        model=os.getenv("LLM_MODEL", "openai/gpt-5.2"),
        api_key=os.getenv("LLM_API_KEY"),  # Must be provided via environment variable
        base_url=os.getenv("LLM_BASE_URL", "https://api.openai.com/v1/"),
    )

    # Configure Agent
    agent = Agent(
        llm=llm,
        tools=[
            Tool(name=TerminalTool.name),
            Tool(name=FileEditorTool.name),
            Tool(name=TaskTrackerTool.name),
        ],
    )
    
    # Create conversation with callback
    conversation = Conversation(
        agent=agent, 
        workspace=cwd,
        callbacks=[event_callback],
    )

    # Send message and run
    conversation.send_message("Please finish the task_description.txt in current directory.")
    conversation.run()
    
    # Save final statistics
    save_stats()
    
    # Close trajectory file
    close_trajectory_file()
    
    # Close conversation
    conversation.close()
    
    print(f"[TRAJECTORY] Task completed, recorded {_event_count} events", flush=True)
    print(f"[STATS] Total tokens: {_stats['total_tokens']}, Interactions: {_stats['interaction_rounds']}", flush=True)
    print("All done!")


if __name__ == "__main__":
    main()

