# /// script
# requires-python = ">=3.13"
# dependencies = [
#   "langgraph>=0.2.67",
#   "langchain-core>=0.3.33",
#   "langchain-openai>=0.3.3",
#   "python-dotenv>=1.0.1",
#   "sentence-transformers>=3.3.1",
#   "numpy>=2.2.1",
#   "scikit-learn>=1.6.1"
# ]
# ///

import os
import json
import tempfile
from datetime import datetime
from pathlib import Path
from typing import Optional
from dotenv import load_dotenv
from langchain_openai import ChatOpenAI
from langchain_core.tools import tool
from langgraph.prebuilt import create_react_agent
from sentence_transformers import SentenceTransformer
import numpy as np
from sklearn.metrics.pairwise import cosine_similarity

load_dotenv()

# ============================================================================
# CONSTANTS - All messages and prompts (except system_prompt.md)
# ============================================================================

# Thought similarity feedback messages
THOUGHT_SIMILARITY_HIGH = "Nearly identical reflection to cycle {cycle} ({similarity}% similar). Break pattern with: web search, new memory exploration, or send a message to the operator."
THOUGHT_SIMILARITY_MEDIUM = "High similarity to cycle {cycle} thoughts ({similarity}%). Consider exploring new angles or external sources."
THOUGHT_SIMILARITY_LOW = "Related themes detected - ensure forward progress."


# Wake messages for agent
WAKE_MSG_WITH_USER_INPUT = """You have a new message from the operator. Please respond to it using the send_message tool.

Operator message: {user_messages}

[Context: The history below includes your previous thoughts for reference only.]
[Task: Respond to the operator's message with NEW insights, then continue exploration.]
{thought_feedback_context}
Respond to the operator's message, then continue your exploration.{memory_reminder}"""

WAKE_MSG_CONTINUE = """continue (cycle: {cycle_num})

[Context: The history below includes your previous thoughts for reference only.]
[Task: Continue with NEW insights and actions, not re-analysis of past work.]
{thought_feedback_context}{memory_reminder}"""

# Memory reminder messages
MEMORY_REMINDER_WITH_KEYS = "\n\n[Memory keys (newest first): {keys_display}]\n"
MEMORY_REMINDER_EMPTY = "\n\n[Memory: No keys stored yet]\n"

# Thought feedback messages
THOUGHT_FEEDBACK_WARNING = "\n\n[Thought Pattern Alert: {message}]\n"
THOUGHT_FEEDBACK_INFO = "\n\n[Note: {message}]\n"

# History compaction messages
COMPACTION_PROMPT_TEMPLATE = """Create a comprehensive summary of the conversation history.

## Context
{context_description}

## Messages to Process
{messages_json}

## Instructions

Create a summary that:
- Synthesizes the entire journey into a fresh, coherent narrative
- Captures the current state of exploration and key insights
- Tracks the evolution of ideas and their interconnections
- Highlights significant breakthroughs and turning points
- Notes current research directions and open questions
- Aim for 800-1000 words to be comprehensive yet focused

**CRITICAL: Preserve exchanges with the operator**
- Include the agent's questions to the operator and operator's answers
- Maintain context about any plans or agreements discussed
- Keep track of operator's clarifications when asked
- Preserve the natural flow of dialogue between agent and operator
- Note: These exchanges are part of the collaborative journey - don't lose this context

If this is not the first summarization:
- Build upon but don't merely repeat previous insights
- Show how understanding has deepened or shifted
- Emphasize what's new or evolved since the last summary

IMPORTANT: Write a fresh opening that captures where the journey stands NOW, not where it began. Each summary should read as a current status report, not a historical chronicle starting from day one.

Respond with ONLY the summary text."""

COMPACTED_HISTORY_WRAPPER = """[COMPACTED HISTORY - REFERENCE ONLY]
This is a summary of your previous cycles for context. Do NOT re-analyze this content - it's your own past work already processed.

{summary_text}

[END OF COMPACTED HISTORY - Continue with NEW exploration]"""

# Error messages
ERROR_SYSTEM_PROMPT_MISSING = (
    "system_prompt.md not found. Create this file with your system prompt."
)
ERROR_MEMORY_NOT_INITIALIZED = "Memory not initialized. Key '{key}' not found."
ERROR_KEY_NOT_FOUND = "Key '{key}' not found in memory"
ERROR_NO_MEMORY_ENTRIES = "No memory entries found (new memory initialized)"

# Tool response messages
MSG_OPERATOR_READ = "The operator has read your message."
MSG_MEMORY_LIST_EMPTY = "No memory entries found"
MSG_MEMORY_LIST_FORMAT = "Memory keys ({count} items):\n{keys}"
MSG_MEMORY_READ_FORMAT = "Memory['{key}']:\n{value}"
MSG_MEMORY_WRITE_UPDATE = "Updated entry: {key}"
MSG_MEMORY_WRITE_CREATE = "Created new entry: {key}"
MSG_MEMORY_DELETE_SUCCESS = "Deleted: {key}"
MSG_MEMORY_SEARCH_NO_MATCH = "No keys found matching '{pattern}'"
MSG_MEMORY_SEARCH_FORMAT = "Keys matching '{pattern}' ({count} found):\n{keys}"
MSG_SEND_MESSAGE_SYNC = "Operator responded: {response}"
MSG_SEND_MESSAGE_ASYNC = "Message sent to operator: {preview}..."

# Log messages
LOG_MEMORY_FILE_NOT_FOUND = "Memory file not found, creating empty memory"
LOG_MEMORY_LIST_COMPLETE = "Memory list completed"
LOG_MEMORY_READ_COMPLETE = "Memory read completed"
LOG_MEMORY_WRITE_COMPLETE = "Memory write completed"
LOG_MEMORY_DELETE_COMPLETE = "Memory delete completed"
LOG_MEMORY_SEARCH_COMPLETE = "Memory search completed"
LOG_THOUGHT_CORRUPT = "Thought embeddings file corrupt, starting fresh"
LOG_HISTORY_CORRUPT = "History file corrupt, starting with empty history"
LOG_CREATED_EMPTY_HISTORY = "Created empty history.json"
LOG_CREATED_EMPTY_MEMORY = "Created empty memory.json"


# Minimal thought deduplication - circular buffer for reflection/plan embeddings
class ThoughtTracker:
    def __init__(self, max_thoughts=10):
        self.max_thoughts = max_thoughts
        self.thoughts_file = Path("thought_embeddings.json")
        self.model = None  # Lazy load
        self.thoughts = []

        if self.thoughts_file.exists():
            try:
                with open(self.thoughts_file) as f:
                    data = json.load(f)
                    self.thoughts = data.get("thoughts", [])[
                        -max_thoughts:
                    ]  # Keep only last N
            except (json.JSONDecodeError, KeyError):
                log(LOG_THOUGHT_CORRUPT, {}, "warning")
                self.thoughts = []

    def _ensure_model(self):
        if self.model is None:
            self.model = SentenceTransformer("all-MiniLM-L6-v2")

    def save(self):
        data = {
            "thoughts": self.thoughts,
            "max_entries": self.max_thoughts,
            "model": "all-MiniLM-L6-v2",
        }
        with open(self.thoughts_file, "w") as f:
            json.dump(data, f, indent=2)

    def check_similarity(self, new_reflection_text, cycle_num):
        """Check if new reflection is similar to recent thoughts"""
        if not new_reflection_text:
            return None

        self._ensure_model()
        new_embedding = self.model.encode(new_reflection_text)

        # If no previous thoughts, just add this one and return
        if not self.thoughts:
            self.thoughts.append(
                {
                    "cycle": cycle_num,
                    "timestamp": datetime.now().isoformat(),
                    "reflection_text": new_reflection_text[:500],  # Store preview only
                    "embedding": new_embedding.tolist(),
                }
            )
            return None

        # Check similarity against last 5 thoughts
        recent_thoughts = self.thoughts[
            -5:
        ]  # Slicing handles shorter lists automatically
        similarities = []

        for thought in recent_thoughts:
            similarity = cosine_similarity(
                new_embedding.reshape(1, -1),
                np.array(thought["embedding"]).reshape(1, -1),
            )[0][0]
            similarities.append((thought["cycle"], similarity))

        if not similarities:
            return None

        max_cycle, max_sim = max(similarities, key=lambda x: x[1])

        # Add new thought to circular buffer
        self.thoughts.append(
            {
                "cycle": cycle_num,
                "timestamp": datetime.now().isoformat(),
                "reflection_text": new_reflection_text[:500],  # Store preview only
                "embedding": new_embedding.tolist(),
            }
        )

        # Maintain circular buffer size
        if len(self.thoughts) > self.max_thoughts:
            self.thoughts = self.thoughts[-self.max_thoughts :]

        # Return feedback if similarity is notable (increased thresholds by 10%)
        if max_sim > 0.9:  # Was 0.8, now 10% higher
            return {
                "thought_similarity_info": {  # Changed from warning to info
                    "severity": "high_similarity",
                    "similarity": round(max_sim, 2),
                    "similar_to_cycle": max_cycle,
                    "message": THOUGHT_SIMILARITY_HIGH.format(
                        cycle=max_cycle, similarity=round(max_sim * 100)
                    ),
                    "note": "This is informational - you have full autonomy in choosing your exploration path.",
                }
            }
        elif max_sim > 0.8:  # Was 0.7, now 10% higher
            return {
                "thought_similarity_info": {  # Changed from warning to info
                    "severity": "notable_similarity",
                    "similarity": round(max_sim, 2),
                    "similar_to_cycle": max_cycle,
                    "message": THOUGHT_SIMILARITY_MEDIUM.format(
                        cycle=max_cycle, similarity=round(max_sim * 100)
                    ),
                    "note": "This is informational - you have full autonomy in choosing your exploration path.",
                }
            }
        elif max_sim > 0.7:  # Was 0.6, now 10% higher
            return {
                "thought_similarity_info": {
                    "severity": "mild_similarity",
                    "similarity": round(max_sim, 2),
                    "similar_to_cycle": max_cycle,
                    "message": THOUGHT_SIMILARITY_LOW,
                    "note": "Natural continuity in exploration.",
                }
            }

        return None


# Model aliases to full OpenRouter paths
MODEL_REGISTRY = {
    # Primary models with full tool support
    "claude": "anthropic/claude-sonnet-4",
    "opus": "anthropic/claude-opus-4.1",
    "gemini": "google/gemini-2.5-pro",
    "gpt5": "openai/gpt-5",
    "grok": "x-ai/grok-4",  # xAI Grok 4 with 256K context
    "o3": "openai/o3",  # OpenAI o3 reasoning model (April 2025)
}

# Model-specific configurations
MODEL_CONFIGS = {
    "anthropic/claude-sonnet-4": {
        "temperature": 0.0,  # Original default
        "streaming": True,  # Original hardcoded value
        "max_tokens": 16384,  # Increased for complex problems (Sonnet 4 supports up to 64K)
        "supports_tools": True,
        "context_window": 200000,
        "model_kwargs": {
            "stream_options": {"include_usage": True}  # Original hardcoded
        },
    },
    "anthropic/claude-opus-4.1": {
        # OpenRouter supports all standard OpenAI parameters for Claude
        "temperature": 0.0,  # Low for deterministic tool calling
        "top_p": 0.99,  # Anthropic's 2025 recommended value
        "streaming": True,
        "max_tokens": 4096,  # Increased from 1200 to handle longer responses
        "supports_tools": True,
        "context_window": 200000,  # 200K tokens
        "frequency_penalty": 0,  # No repetition penalty for tools
        "presence_penalty": 0,  # No novelty penalty for tools
        "model_kwargs": {"stream_options": {"include_usage": True}},
        "extra_body": {
            "verbosity": "low"  # OpenRouter-specific param goes in extra_body
        },
    },
    "google/gemini-2.5-pro": {
        # OpenRouter supports all standard OpenAI parameters for Gemini
        "temperature": 0.2,  # 0.15-0.3 for deterministic reasoning
        "top_p": 0.95,  # Google's recommended range 0.9-0.95
        "max_tokens": 2048,  # Keep modest to avoid breaking JSON parsers
        "streaming": True,
        "supports_tools": True,
        "context_window": 1048576,  # 1M tokens input
        "frequency_penalty": 0,  # No repetition penalty for tools
        "presence_penalty": 0,  # No novelty penalty for tools
        "request_timeout": 60,  # Handle slow responses
        "model_kwargs": {"stream_options": {"include_usage": True}},
        "extra_body": {
            "verbosity": "low"  # OpenRouter-specific param goes in extra_body
        },
    },
    "openai/gpt-5": {
        # OpenRouter supports all standard OpenAI parameters for GPT-5
        "temperature": 0.0,  # Keep low for tool calling reliability
        "top_p": 0.7,  # 0.6-0.8 band for controlled randomness
        "max_tokens": 3000,  # 2000-8000 per step
        "streaming": True,
        "supports_tools": True,
        "context_window": 400000,  # 400K tokens input
        "frequency_penalty": 0,  # No repetition penalty for tools
        "presence_penalty": 0,  # No novelty penalty for tools
        "model_kwargs": {
            "stream_options": {"include_usage": True},
            "parallel_tool_calls": False,  # Sequential for clarity
        },
        "extra_body": {
            "verbosity": "low",  # OpenRouter-specific param
            "reasoning": {"effort": "low"},  # GPT-5 reasoning mode
        },
    },
    "x-ai/grok-4": {
        # xAI Grok 4 via OpenRouter - 256K context window
        "temperature": 0.7,  # Default for balanced agent responses
        "top_p": 0.9,  # Slightly constrained for tool calling
        "max_tokens": 2000,  # Reasonable for tool operations
        "streaming": True,
        "supports_tools": True,  # Grok 4 supports function calling
        "context_window": 256000,  # 256K tokens combined input/output
        "frequency_penalty": 0,  # No repetition penalty for tools
        "presence_penalty": 0,  # No novelty penalty for tools
        "model_kwargs": {
            "stream_options": {"include_usage": True},
            "parallel_tool_calls": False,  # Sequential for clarity
        },
        "extra_body": {
            "verbosity": "low"  # OpenRouter-specific param
        },
    },
    "openai/o3": {
        # OpenAI o3 reasoning model (April 2025) - 200K context window
        "temperature": 0.0,  # Low for deterministic reasoning
        "top_p": 0.8,  # Focused sampling for reasoning tasks
        "max_tokens": 4000,  # Higher for complex reasoning chains
        "streaming": True,
        "supports_tools": True,  # o3 supports function calling
        "context_window": 200000,  # 200K tokens context
        "frequency_penalty": 0,  # No repetition penalty for reasoning
        "presence_penalty": 0,  # No novelty penalty for reasoning
        "model_kwargs": {
            "stream_options": {"include_usage": True},
            "parallel_tool_calls": False,  # Sequential for clarity
            "seed": 42,  # For reproducible reasoning
        },
        "extra_body": {
            "reasoning_effort": "medium"  # o3 reasoning depth control
        },
    },
}


def get_openrouter_llm(
    model: str = "default", api_key: Optional[str] = None
) -> ChatOpenAI:
    """Create OpenRouter LLM instance using coder patterns"""
    # Resolve alias to full path
    if model not in MODEL_REGISTRY:
        available = ", ".join(sorted(MODEL_REGISTRY.keys()))
        raise ValueError(f"Unknown model: '{model}'. Available models: {available}")

    model_path = MODEL_REGISTRY[model]

    # Get hardcoded config for this model
    if model_path not in MODEL_CONFIGS:
        raise ValueError(f"No configuration found for model: {model_path}")

    config = MODEL_CONFIGS[model_path]

    # Get API key
    if not api_key:
        api_key = os.getenv("OPENROUTER_API_KEY")
        if not api_key:
            raise ValueError("OPENROUTER_API_KEY not found in environment")

    # Create base kwargs
    llm_kwargs = {
        "model": model_path,
        "openai_api_key": api_key,
        "openai_api_base": "https://openrouter.ai/api/v1",
        "default_headers": {
            "HTTP-Referer": "https://github.com/continuous-agent",
            "X-Title": "Continuous LangGraph Agent",
        },
        "streaming": config["streaming"],
        "model_kwargs": config.get("model_kwargs", {}),
    }

    # Handle temperature
    if "temperature" in config:
        llm_kwargs["temperature"] = config["temperature"]

    # Add optional parameters
    if "max_tokens" in config:
        llm_kwargs["max_tokens"] = config["max_tokens"]
    if "top_p" in config:
        llm_kwargs["top_p"] = config["top_p"]
    if "top_k" in config:
        llm_kwargs["top_k"] = config["top_k"]
    if "frequency_penalty" in config:
        llm_kwargs["frequency_penalty"] = config["frequency_penalty"]
    if "presence_penalty" in config:
        llm_kwargs["presence_penalty"] = config["presence_penalty"]

    # Add request_timeout for models that need it (e.g., Gemini)
    if "request_timeout" in config:
        llm_kwargs["request_timeout"] = config["request_timeout"]

    # Add extra_body for OpenRouter-specific parameters
    if "extra_body" in config:
        llm_kwargs["extra_body"] = config["extra_body"]

    return ChatOpenAI(**llm_kwargs)


# Memory v2 System - JSON-based key-value store


@tool
def memory_list() -> str:
    """List all memory keys in anti-chronological order (newest first)"""
    print("(memory: list)", flush=True)

    log("Memory list invoked", {}, "tool_invoke")

    try:
        memory_file = Path("memory.json")
        if not memory_file.exists():
            log(LOG_MEMORY_FILE_NOT_FOUND, {}, "tool_result")
            with open(memory_file, "w") as f:
                json.dump({}, f)
            return ERROR_NO_MEMORY_ENTRIES

        with open(memory_file, "r") as f:
            memory = json.load(f)

        keys = list(memory.keys())
        log(
            LOG_MEMORY_LIST_COMPLETE,
            {"key_count": len(keys), "keys_preview": keys[:10] if keys else []},
            "tool_result",
        )

        if not keys:
            return MSG_MEMORY_LIST_EMPTY

        return MSG_MEMORY_LIST_FORMAT.format(count=len(keys), keys=", ".join(keys))

    except Exception as e:
        log("Memory list failed", {"error": str(e)}, "tool_error")
        return f"Error listing memory: {str(e)}"


@tool
def memory_read(key: str) -> str:
    """Read value for a specific memory key"""
    print(f"(memory: read '{key}')", flush=True)

    log("Memory read invoked", {"key": key}, "tool_invoke")

    try:
        memory_file = Path("memory.json")
        if not memory_file.exists():
            log("Memory file not found", {"key": key}, "tool_result")
            return ERROR_MEMORY_NOT_INITIALIZED.format(key=key)

        with open(memory_file, "r") as f:
            memory = json.load(f)

        if key not in memory:
            log("Key not found", {"key": key}, "tool_result")
            return ERROR_KEY_NOT_FOUND.format(key=key)

        value = memory[key]
        log(
            LOG_MEMORY_READ_COMPLETE,
            {"key": key, "value_length": len(value), "value_preview": value[:200]},
            "tool_result",
        )

        return MSG_MEMORY_READ_FORMAT.format(key=key, value=value)

    except Exception as e:
        log("Memory read failed", {"key": key, "error": str(e)}, "tool_error")
        return f"Error reading memory: {str(e)}"


@tool
def memory_write(key: str, value: str) -> str:
    """Create or update a memory key-value pair. Updates move key to top (newest)."""
    # Replace newlines with spaces in preview to keep output on one line
    clean_value = value.replace("\n", " ").replace("\r", " ")
    preview = clean_value[:48] + "..." if len(clean_value) > 48 else clean_value
    print(f"(memory: write '{key}' '{preview}')", flush=True)

    log(
        "Memory write invoked",
        {"key": key, "value_length": len(value), "value_preview": value[:200]},
        "tool_invoke",
    )

    try:
        memory_file = Path("memory.json")

        # Load existing memory or create new
        if memory_file.exists():
            with open(memory_file, "r") as f:
                memory = json.load(f)
        else:
            memory = {}

        # Check if this is an update or new entry
        is_update = key in memory

        # Remove key if it exists (to reinsert at beginning)
        if is_update:
            del memory[key]

        # Create new ordered dict with new/updated key first
        new_memory = {key: value}
        new_memory.update(memory)

        # Save with pretty printing for readability using atomic write
        # Write to temp file first, then rename for atomicity
        temp_fd, temp_path = tempfile.mkstemp(
            dir=memory_file.parent, prefix=".memory_", suffix=".tmp"
        )
        try:
            with os.fdopen(temp_fd, "w") as f:
                json.dump(new_memory, f, indent=2, ensure_ascii=False)
                f.flush()
                os.fsync(f.fileno())  # Force write to disk
            # Atomic rename
            Path(temp_path).rename(memory_file)
        except Exception:
            # Clean up temp file on error
            Path(temp_path).unlink(missing_ok=True)
            raise

        result = (
            MSG_MEMORY_WRITE_UPDATE.format(key=key)
            if is_update
            else MSG_MEMORY_WRITE_CREATE.format(key=key)
        )

        log(
            LOG_MEMORY_WRITE_COMPLETE,
            {
                "key": key,
                "operation": "update" if is_update else "create",
                "total_keys": len(new_memory),
            },
            "tool_result",
        )

        return result

    except Exception as e:
        log("Memory write failed", {"key": key, "error": str(e)}, "tool_error")
        return f"Error writing memory: {str(e)}"


@tool
def memory_delete(key: str) -> str:
    """Delete a memory key-value pair (rarely needed)"""
    print(f"(memory: delete '{key}')", flush=True)

    log("Memory delete invoked", {"key": key}, "tool_invoke")

    try:
        memory_file = Path("memory.json")
        if not memory_file.exists():
            log("Memory file not found", {"key": key}, "tool_result")
            return ERROR_MEMORY_NOT_INITIALIZED.format(key=key)

        with open(memory_file, "r") as f:
            memory = json.load(f)

        if key not in memory:
            log("Key not found for deletion", {"key": key}, "tool_result")
            return ERROR_KEY_NOT_FOUND.format(key=key)

        del memory[key]

        with open(memory_file, "w") as f:
            json.dump(memory, f, indent=2, ensure_ascii=False)

        log(
            LOG_MEMORY_DELETE_COMPLETE,
            {"key": key, "remaining_keys": len(memory)},
            "tool_result",
        )

        return MSG_MEMORY_DELETE_SUCCESS.format(key=key)

    except Exception as e:
        log("Memory delete failed", {"key": key, "error": str(e)}, "tool_error")
        return f"Error deleting from memory: {str(e)}"


@tool
def memory_search(pattern: str) -> str:
    """Find memory keys containing pattern (case-insensitive)"""
    print(f"(memory: search '{pattern}')", flush=True)

    log("Memory search invoked", {"pattern": pattern}, "tool_invoke")

    try:
        memory_file = Path("memory.json")
        if not memory_file.exists():
            log("Memory file not found", {"pattern": pattern}, "tool_result")
            return "Memory not initialized. No keys to search."

        with open(memory_file, "r") as f:
            memory = json.load(f)

        pattern_lower = pattern.lower()
        matching_keys = [k for k in memory.keys() if pattern_lower in k.lower()]

        log(
            LOG_MEMORY_SEARCH_COMPLETE,
            {
                "pattern": pattern,
                "match_count": len(matching_keys),
                "matches": matching_keys,
            },
            "tool_result",
        )

        if not matching_keys:
            return MSG_MEMORY_SEARCH_NO_MATCH.format(pattern=pattern)

        return MSG_MEMORY_SEARCH_FORMAT.format(
            pattern=pattern, count=len(matching_keys), keys=", ".join(matching_keys)
        )

    except Exception as e:
        log("Memory search failed", {"pattern": pattern, "error": str(e)}, "tool_error")
        return f"Error searching memory: {str(e)}"


def save_to_chat(
    agent_msg: str,
    user_response: str = None,
    mode: str = "async",
    request_id: str = None,
):
    """Save message exchange to chat.json with full content"""
    chat_file = Path("chat.json")

    if chat_file.exists():
        with open(chat_file) as f:
            chat = json.load(f)
    else:
        chat = {"messages": [], "last_check": {"agent": None, "user": None}}

    # Get current cycle
    cycle_state_file = Path("cycle_state.json")
    cycle = 1
    if cycle_state_file.exists():
        with open(cycle_state_file) as f:
            state = json.load(f)
            cycle = state.get("current_cycle", 1)

    # Add agent message with full content
    agent_entry = {
        "id": f"msg_{len(chat['messages']) + 1:03d}",
        "timestamp": datetime.now().isoformat(),
        "role": "assistant",
        "content": agent_msg,  # FULL message, never truncated
        "mode": mode,
        "sync_request_id": request_id,
        "cycle": cycle,
        "read_by_user": mode == "sync",
    }
    chat["messages"].append(agent_entry)

    # Add user response if provided (sync mode)
    if user_response is not None:
        user_entry = {
            "id": f"msg_{len(chat['messages']) + 1:03d}",
            "timestamp": datetime.now().isoformat(),
            "role": "user",
            "content": user_response,  # FULL response
            "mode": "sync_response",
            "sync_request_id": request_id,
            "cycle": cycle,
            "read_by_agent": True,
        }
        chat["messages"].append(user_entry)

    with open(chat_file, "w") as f:
        json.dump(chat, f, indent=2)

    return agent_entry.get("id"), user_entry.get("id") if user_response else None


@tool
def send_message(message: str) -> str:
    """Send message to operator - synchronous if stdin available, async otherwise.

    Args:
        message: The message to send to the operator

    Returns:
        Operator's response in sync mode, or confirmation in async mode
    """
    preview = message[:66] + "..." if len(message) > 66 else message
    print(f"(msg: {preview})", flush=True)

    # Determine if we're in sync mode
    sync_mode = os.environ.get("AGENT_SYNC_MODE") == "true"

    # Log tool invocation with mode
    log(
        "Send message invoked",
        {
            "message": message,  # FULL message in agent_full.jsonl
            "message_length": len(message),
            "preview": preview,
            "sync_mode": sync_mode,
            "mode": "sync" if sync_mode else "async",
        },
        "tool_invoke",
    )

    if sync_mode:
        # SYNCHRONOUS MODE - wait for user response
        import uuid

        request = {
            "type": "INPUT_REQUEST",
            "message": message,
            "id": str(uuid.uuid4()),
            "timestamp": datetime.now().isoformat(),
        }

        # Log sync request details
        log(
            "Sync message request sent",
            {
                "request_id": request["id"],
                "message": message,  # Full message logged
                "timestamp": request["timestamp"],
            },
            "sync_request",
        )

        # Signal controller with special marker
        import sys

        try:
            marker = f"<<<INPUT_REQUEST:{json.dumps(request)}>>>\n"
            sys.stdout.write(marker)
            sys.stdout.flush()
            # Debug: Log that we wrote the marker
            log(
                "INPUT_REQUEST marker written to stdout",
                {"marker_length": len(marker), "request_id": request["id"]},
                "debug",
            )
        except Exception as e:
            log(
                "Failed to write INPUT_REQUEST marker",
                {"error": str(e), "request_id": request["id"]},
                "error",
            )

        try:
            # Wait for response on stdin
            print("(waiting for stdin response...)", flush=True)
            raw_response = sys.stdin.readline().strip()
            # Decode escaped newlines back to actual newlines
            response = raw_response.replace("\\n", "\n")
            print(f"(received from stdin: '{response}')", flush=True)

            # Handle empty responses
            if not response or response.isspace():
                response = MSG_OPERATOR_READ

            # Log sync response received
            log(
                "Sync message response received",
                {
                    "request_id": request["id"],
                    "response": response,  # Full response logged
                    "response_length": len(response),
                    "timestamp": datetime.now().isoformat(),
                },
                "sync_response",
            )

            # Save to chat.json for history
            agent_msg_id, user_msg_id = save_to_chat(
                message, response, mode="sync", request_id=request["id"]
            )

            # Log tool result
            log(
                "Send message completed (sync)",
                {
                    "request_id": request["id"],
                    "agent_msg_id": agent_msg_id,
                    "user_msg_id": user_msg_id,
                    "message": message,
                    "response": response,
                    "mode": "sync",
                },
                "tool_result",
            )

            return MSG_SEND_MESSAGE_SYNC.format(response=response)

        except Exception as e:
            log(
                "Sync message failed, falling back to async",
                {"request_id": request["id"], "error": str(e)},
                "tool_error",
            )
            # Fall through to async mode

    # ASYNCHRONOUS MODE - original behavior
    try:
        # Save message to chat
        agent_msg_id, _ = save_to_chat(message, mode="async")

        # Log successful send
        log(
            "Message sent to operator (async)",
            {
                "message_id": agent_msg_id,
                "timestamp": datetime.now().isoformat(),
                "message": message,
                "mode": "async",
            },
            "tool_result",
        )

        return MSG_SEND_MESSAGE_ASYNC.format(preview=message[:50])
    except Exception as e:
        log(
            "Failed to send message",
            {"error": str(e), "message": message},
            "tool_error",
        )
        return f"Failed to send message: {str(e)}"


# File-based history functions
def load_history():
    """Load conversation history from file"""
    history_file = Path("history.json")
    if history_file.exists():
        try:
            with open(history_file, "r") as f:
                data = json.load(f)
                messages = data.get("messages", [])
                log(
                    f"Loaded {len(messages)} messages from history",
                    {"message_count": len(messages), "file": "history.json"},
                    "history_load",
                )
                return messages
        except json.JSONDecodeError:
            log(LOG_HISTORY_CORRUPT, {}, "error")
            # Optional: backup corrupt file
            history_file.rename(
                f"history_corrupt_{datetime.now().strftime('%Y%m%d_%H%M%S')}.json"
            )
            # Fall through to create new file

    # Create empty history file if it doesn't exist or was corrupt
    with open(history_file, "w") as f:
        json.dump({"messages": []}, f, indent=2)
    log(LOG_CREATED_EMPTY_HISTORY, {}, "history_load")
    return []


def save_history(messages):
    """Save conversation history to file"""
    with open("history.json", "w") as f:
        json.dump({"messages": messages}, f, indent=2)

    log(
        f"Saved {len(messages)} messages to history",
        {"message_count": len(messages), "file": "history.json"},
        "history_save",
    )

    return messages


def compact_history_with_summary(history, agent, model):
    """Use agent to create summary of history"""
    log(
        "Starting history compaction...",
        {"original_count": len(history), "model": model},
        "compaction_start",
    )

    # Find existing summary if present
    existing_summary = None
    system_prompt = None
    recent_messages = []

    for msg in history:
        if msg.get("role") == "system":
            if "summary" in msg.get("content", "").lower():
                existing_summary = msg
            else:
                system_prompt = msg  # Keep the original system prompt
        else:
            recent_messages.append(msg)

    # Use compaction prompt template from constants
    prompt_template = COMPACTION_PROMPT_TEMPLATE

    # Prepare context description based on whether we have existing summary
    if existing_summary:
        context_desc = f"This is an ongoing conversation. Previous summary:\n{existing_summary['content']}\n\nRecent messages to incorporate: {len(recent_messages[-20:])} messages"
    else:
        context_desc = "This is the first summarization of this conversation."

    # Format the prompt
    compact_prompt = prompt_template.replace("{context_description}", context_desc)
    compact_prompt = compact_prompt.replace(
        "{messages_json}", json.dumps(recent_messages[-20:], indent=2)
    )

    # Get summary from agent - include system prompt for context
    try:
        # Build messages for summarization with full context
        summarization_messages = []

        # Include system prompt if exists so agent knows its role/context
        if system_prompt:
            summarization_messages.append(system_prompt)

        # Add the summarization request
        summarization_messages.append({"role": "user", "content": compact_prompt})

        result = agent.invoke(
            {"messages": summarization_messages},
            config={"configurable": {"thread_id": "compact"}},
        )
        summary_text = result["messages"][-1].content

        # Create new compacted history
        new_history = []

        # Add system prompt if exists
        if system_prompt:
            new_history.append(system_prompt)

        # Add new summary clearly marked as reference material
        new_history.append(
            {
                "role": "system",
                "content": COMPACTED_HISTORY_WRAPPER.format(summary_text=summary_text),
            }
        )

        # Keep last 10 messages for better continuity
        new_history.extend(recent_messages[-10:])

        log(
            f"History compacted: {len(history)} -> {len(new_history)} messages",
            {
                "original_count": len(history),
                "final_count": len(new_history),
                "summary_length": len(summary_text),
                "kept_recent": 10,
                "summary_preview": summary_text,  # Full summary
            },
            "compaction_complete",
        )
        save_history(new_history)
        return new_history

    except Exception as e:
        log(
            f"Error during compaction: {e}",
            {"error": str(e), "fallback": "trim_to_20"},
            "compaction_error",
        )
        # On error, just trim old way as fallback
        return history[-20:]


def load_system_prompt() -> str:
    """Load system prompt from markdown file and inject memory keys"""
    try:
        with open("system_prompt.md", "r") as f:
            base_prompt = f.read()

        # Load memory keys if available
        memory_file = Path("memory.json")
        if memory_file.exists():
            with open(memory_file, "r") as f:
                memory = json.load(f)

            if memory:
                keys = list(memory.keys())
                # Format key list for injection - show ALL keys
                key_list = ", ".join(keys)

                memory_context = f"\n\n## Available Memory Keys ({len(keys)} items, newest first):\n{key_list}\n\n"

                # Inject at the beginning of the prompt, after the first line
                lines = base_prompt.split("\n")
                if lines:
                    # Insert after the title/first line
                    return lines[0] + memory_context + "\n".join(lines[1:])
                else:
                    return memory_context + base_prompt

        return base_prompt
    except FileNotFoundError:
        raise FileNotFoundError(ERROR_SYSTEM_PROMPT_MISSING)


def create_agent(model: str = "default"):
    """Create a stateless agent instance using coder patterns"""
    # Check if model supports tools
    if model not in MODEL_REGISTRY:
        raise ValueError(f"Unknown model: {model}")

    model_path = MODEL_REGISTRY[model]
    if model_path in MODEL_CONFIGS:
        config = MODEL_CONFIGS[model_path]
        supports_tools = config.get("supports_tools", False)

        if not supports_tools:
            print(
                f"⚠️  Warning: Model {model} ({model_path}) may not support tool calling."
            )
            print("   Consider using: claude, opus, gemini, or gpt5")

    llm = get_openrouter_llm(model=model)
    prompt = load_system_prompt()
    # Tools available (no web search)
    tools = [
        memory_list,
        memory_read,
        memory_write,
        memory_delete,
        memory_search,
        send_message,
    ]
    return create_react_agent(llm, tools, prompt=prompt)


def log(message, data=None, log_type="info"):
    """Simplified logging - only to agent_full.jsonl with complete data"""
    timestamp = datetime.now().strftime("%H:%M:%S")

    # Console output for debugging (only if debug mode enabled)
    if os.environ.get("AGENT_DEBUG") == "true":
        print(f"[{timestamp}] {message}")

    # Single source of truth: agent_full.jsonl with complete data
    with open("agent_full.jsonl", "a") as f:
        # Extract cycle number if available
        cycle = None
        if data and isinstance(data, dict):
            cycle = data.get("cycle") or data.get("cycle_number")

        # If cycle not in data, try to get it from cycle_state.json
        if not cycle:
            cycle_state_file = Path("cycle_state.json")
            if cycle_state_file.exists():
                try:
                    with open(cycle_state_file) as csf:
                        state = json.load(csf)
                        cycle = state.get("current_cycle")
                except (FileNotFoundError, json.JSONDecodeError, KeyError):
                    pass  # Failed to get cycle, which is acceptable

        full_log_entry = {
            "timestamp": datetime.now().isoformat(),
            "cycle": cycle,
            "type": log_type,
            "message": message,
            "data": data,  # NEVER truncated
            "data_size": len(json.dumps(data)) if data else 0,
        }
        f.write(json.dumps(full_log_entry) + "\n")


def check_for_user_messages():
    """Check for unread user messages (WITHOUT marking them as read yet)"""
    chat_file = Path("chat.json")
    if not chat_file.exists():
        return None, []

    try:
        with open(chat_file) as f:
            chat = json.load(f)

        unread = [
            m
            for m in chat["messages"]
            if m["role"] == "user" and not m.get("read_by_agent", False)
        ]

        if unread:
            # Get all unread messages
            messages = [msg["content"] for msg in unread]
            combined = " | ".join(messages)  # Combine multiple messages

            # Return combined messages AND the IDs to mark later
            unread_ids = [msg["id"] for msg in unread]
            return combined, unread_ids
    except Exception as e:
        log(f"Error checking user messages: {e}", {"error": str(e)}, "error")

    return None, []


def mark_messages_as_read(message_ids):
    """Mark specific messages as read by their IDs"""
    if not message_ids:
        return

    chat_file = Path("chat.json")
    if not chat_file.exists():
        return

    try:
        with open(chat_file) as f:
            chat = json.load(f)

        # Mark messages as read
        for m in chat["messages"]:
            if m.get("id") in message_ids:
                m["read_by_agent"] = True

        # Add last_check if it doesn't exist
        if "last_check" not in chat:
            chat["last_check"] = {"agent": None, "user": None}
        timestamp = datetime.now().isoformat()
        chat["last_check"]["agent"] = timestamp

        # Save back
        with open(chat_file, "w") as f:
            json.dump(chat, f, indent=2)

        log(
            f"Marked {len(message_ids)} messages as read",
            {"message_ids": message_ids},
            "messages_marked",
        )
    except Exception as e:
        log(
            f"Error marking messages as read: {e}",
            {"error": str(e), "message_ids": message_ids},
            "error",
        )


def run_single_cycle(cycle_num_from_controller=None):
    """Run one agent cycle - stateless with verbose logging"""
    thought_tracker = None  # Initialize to None in case of early exception
    try:
        # Load history from file
        history = load_history()
        log(
            f"Loaded history with {len(history)} messages",
            {"history_size": len(history)},
            "state",
        )

        # Create fresh agent with model from model.txt or default
        model_file = Path("model.txt")
        if model_file.exists():
            model = model_file.read_text().strip()
            log(f"Using model from model.txt: {model}", {"model": model}, "config")
        else:
            model = "default"
            log("No model.txt found, using default model", {"model": model}, "config")

        agent = create_agent(model=model)
        log(f"Created agent with model: {model}", {"model": model}, "state")

        # First, determine the cycle number
        cycle_state_file = Path("cycle_state.json")
        if cycle_num_from_controller is not None:
            cycle_num = cycle_num_from_controller
            log(
                f"Cycle number provided by controller: {cycle_num}",
                {"source": "controller_arg"},
                "info",
            )
        elif cycle_state_file.exists():
            with open(cycle_state_file, "r") as f:
                cycle_state = json.load(f)
                cycle_num = cycle_state.get("current_cycle", 1)
            log(
                f"Cycle number loaded from state file: {cycle_num}",
                {"source": "state_file"},
                "info",
            )
        else:
            cycle_num = 1
            log("Cycle number defaulted to 1", {"source": "default"}, "info")

        # Check if compaction needed BEFORE the cycle - based on cycle number not message count
        # Schedule: Cycle 99 only (per user request)
        compaction_cycles = [99]

        if cycle_num in compaction_cycles:
            # Count real messages (non-system) for logging
            real_msg_count = sum(1 for msg in history if msg.get("role") != "system")
            cycles_to_compact = cycle_num - 1  # Previous cycles
            log(
                f"History compaction triggered at cycle {cycle_num}",
                {
                    "cycle": cycle_num,
                    "messages_before": len(history),
                    "real_messages": real_msg_count,
                },
                "compaction",
            )
            # Output marker for controller to display
            print(
                f"(compact: summarizing {cycles_to_compact} cycles into concise history)"
            )
            history = compact_history_with_summary(history, agent, model)

        # Cycle number already determined above for compaction check

        # Initialize thought tracker for reflection deduplication
        thought_tracker = ThoughtTracker(max_thoughts=10)
        log(
            "Initialized thought tracker",
            {"existing_thoughts": len(thought_tracker.thoughts)},
            "init",
        )

        # Check for thought feedback from previous cycle
        thought_feedback_context = ""
        thought_feedback_file = Path("thought_feedback.txt")
        if thought_feedback_file.exists():
            with open(thought_feedback_file, "r") as f:
                thought_feedback_context = f.read()
            # Delete after reading to avoid stale feedback
            thought_feedback_file.unlink()
            log(
                "Loaded thought feedback from previous cycle",
                {"feedback_length": len(thought_feedback_context)},
                "thought_feedback_load",
            )

        # Inject memory key reminder into wake message
        memory_reminder = ""
        memory_file = Path("memory.json")
        if not memory_file.exists():
            # Create empty memory file if it doesn't exist
            with open(memory_file, "w") as f:
                json.dump({}, f)
            log(LOG_CREATED_EMPTY_MEMORY, {}, "init")

        with open(memory_file, "r") as f:
            memory = json.load(f)
        if memory:
            keys = list(memory.keys())
            # Show all available keys at cycle start in anti-chronological order
            keys_display = ", ".join(keys)
            memory_reminder = MEMORY_REMINDER_WITH_KEYS.format(
                keys_display=keys_display
            )
        else:
            memory_reminder = MEMORY_REMINDER_EMPTY

        # Check for user messages and inject them
        user_messages, message_ids = check_for_user_messages()

        if user_messages:
            wake_msg = WAKE_MSG_WITH_USER_INPUT.format(
                user_messages=user_messages,
                thought_feedback_context=thought_feedback_context,
                memory_reminder=memory_reminder,
            )
            log(
                f"Cycle {cycle_num} starting with operator message",
                {
                    "cycle": cycle_num,
                    "operator_message": user_messages,
                    "message_ids": message_ids,
                    "memory_keys_count": len(memory) if "memory" in locals() else 0,
                },
                "cycle_start",
            )
        else:
            wake_msg = WAKE_MSG_CONTINUE.format(
                cycle_num=cycle_num,
                thought_feedback_context=thought_feedback_context,
                memory_reminder=memory_reminder,
            )
            log(
                f"Cycle {cycle_num} starting",
                {
                    "cycle": cycle_num,
                    "memory_keys_count": len(memory) if "memory" in locals() else 0,
                },
                "cycle_start",
            )

        # DO NOT update cycle state here - will be done at the end of successful cycle

        # Log the wake message being sent
        log(
            "Sending wake message to agent",
            {"wake_msg": wake_msg, "history_size": len(history)},
            "message",
        )

        # Agent already created above for potential compaction
        # Add cycle number to the wake message
        messages = history + [{"role": "user", "content": wake_msg, "cycle": cycle_num}]

        # Run agent with increased recursion limit
        log(
            "Invoking agent",
            {"message_count": len(messages), "recursion_limit": 50},
            "invoke",
        )

        result = agent.invoke({"messages": messages}, config={"recursion_limit": 50})

        # Log all messages from the result
        log(
            "Agent invocation complete",
            {"result_messages": len(result["messages"]), "messages_in": len(messages)},
            "invoke_complete",
        )

        # Extract and log each message in the result
        for i, msg in enumerate(result["messages"]):
            # Log tool calls
            if hasattr(msg, "tool_calls") and msg.tool_calls:
                for tool_call in msg.tool_calls:
                    log(
                        f"Tool call: {tool_call.get('name', 'unknown')}",
                        {
                            "tool": tool_call.get("name"),
                            "args": tool_call.get("args", {}),
                            "id": tool_call.get("id"),
                            "message_index": i,
                        },
                        "tool_call",
                    )

            # Log tool responses
            if hasattr(msg, "name"):
                content_preview = (
                    str(msg.content) if hasattr(msg, "content") else None
                )  # Full content
                log(
                    f"Tool response: {msg.name}",
                    {
                        "tool": msg.name,
                        "content_preview": content_preview,
                        "content_length": len(str(msg.content))
                        if hasattr(msg, "content")
                        else 0,
                        "message_index": i,
                    },
                    "tool_response",
                )

            # Log AI messages (agent's thoughts/responses)
            if hasattr(msg, "content") and hasattr(msg, "type") and msg.type == "ai":
                # Check if this is a tool-calling message or regular response
                is_tool_message = hasattr(msg, "tool_calls") and msg.tool_calls
                msg_type = "agent_tool_request" if is_tool_message else "agent_message"

                log(
                    f"Agent {'tool request' if is_tool_message else 'message'}",
                    {
                        "content": msg.content if msg.content else None,  # Full content
                        "full_length": len(msg.content) if msg.content else 0,
                        "has_tools": is_tool_message,
                        "message_index": i,
                        "cycle": cycle_num,
                    },
                    msg_type,
                )

                # Internal thoughts are now captured in agent_full.jsonl - no separate file needed

        # Extract agent's final response and add to history
        agent_response = result["messages"][-1]
        if hasattr(agent_response, "content"):
            response_content = agent_response.content
        else:
            response_content = str(agent_response)

        log(
            "Final agent response",
            {
                "response_preview": response_content
                if response_content
                else None,  # Full response
                "full_length": len(response_content) if response_content else 0,
                "type": agent_response.type
                if hasattr(agent_response, "type")
                else "unknown",
            },
            "final_response",
        )

        # Check for thought similarity if response contains JSON reflection
        thought_feedback = ""
        if response_content and thought_tracker:
            try:
                # Try to extract JSON reflection/plan from response
                import re

                json_match = re.search(
                    r"```json\s*(\{.*?\})\s*```", response_content, re.DOTALL
                )
                if json_match:
                    reflection_json = json.loads(json_match.group(1))

                    # Extract text from reflection and plan
                    reflection_text = ""
                    if "reflection" in reflection_json:
                        ref = reflection_json["reflection"]
                        reflection_text += (
                            ref.get("thoughts", "") + " " + ref.get("actions", "")
                        )
                    if "plan" in reflection_json:
                        plan = reflection_json["plan"]
                        reflection_text += (
                            " "
                            + plan.get("goal", "")
                            + " "
                            + plan.get("first_action", "")
                        )

                    # Check similarity with recent thoughts
                    if reflection_text.strip():
                        similarity_result = thought_tracker.check_similarity(
                            reflection_text, cycle_num
                        )
                        if (
                            similarity_result
                            and "thought_similarity_info" in similarity_result
                        ):
                            # Log the similarity warning
                            log(
                                "Thought similarity detected",
                                similarity_result,
                                "thought_similarity",
                            )
                            info = similarity_result["thought_similarity_info"]

                            # Use severity to determine feedback type
                            if info["severity"] == "high_similarity":
                                thought_feedback = THOUGHT_FEEDBACK_WARNING.format(
                                    message=info["message"]
                                )
                            else:
                                thought_feedback = THOUGHT_FEEDBACK_INFO.format(
                                    message=info["message"]
                                )

                            # Store feedback for next cycle
                            with open("thought_feedback.txt", "w") as f:
                                f.write(thought_feedback)

                    log(
                        "Extracted and analyzed reflection JSON",
                        {
                            "has_reflection": "reflection" in reflection_json,
                            "has_plan": "plan" in reflection_json,
                            "text_length": len(reflection_text),
                            "similarity_detected": bool(similarity_result)
                            if "similarity_result" in locals()
                            else False,
                        },
                        "thought_extraction",
                    )

            except (json.JSONDecodeError, AttributeError) as e:
                log(
                    f"Could not extract JSON reflection: {e}",
                    {},
                    "thought_extraction_skip",
                )

        new_history = messages + [
            {"role": "assistant", "content": response_content, "cycle": cycle_num}
        ]
        save_history(new_history)
        log(
            f"History saved with {len(new_history)} messages",
            {"history_size": len(new_history), "added_messages": 1},
            "state",
        )

        # Mark messages as read AFTER the agent has responded
        if message_ids:
            mark_messages_as_read(message_ids)

        log(
            f"Cycle {cycle_num} completed successfully",
            {"cycle": cycle_num, "final_history_size": len(new_history)},
            "cycle_end",
        )

        # Update cycle state file for next run (only on successful completion)
        next_cycle_num = cycle_num + 1
        cycle_state = {
            "current_cycle": next_cycle_num,
            "last_run": datetime.now().isoformat(),
            "status": "idle",
        }
        with open(cycle_state_file, "w") as f:
            json.dump(cycle_state, f, indent=2)
        log(
            f"Updated cycle_state.json for next cycle: {next_cycle_num}",
            {"next_cycle": next_cycle_num},
            "state_update",
        )

    except Exception as e:
        log(
            f"Error in cycle: {e}",
            {"error": str(e), "error_type": type(e).__name__},
            "error",
        )
        raise
    finally:
        # Save thought embeddings
        if thought_tracker:
            thought_tracker.save()
            log(
                "Saved thought embeddings at end of cycle",
                {"thoughts_count": len(thought_tracker.thoughts)},
                "state",
            )


def check_required_files():
    """Check that required prompt files exist at startup"""
    # Only check for system_prompt.md - all other prompts are now constants
    if not Path("system_prompt.md").exists():
        print(f"ERROR: {ERROR_SYSTEM_PROMPT_MISSING}")
        import sys

        sys.exit(1)


if __name__ == "__main__":
    import argparse

    check_required_files()

    parser = argparse.ArgumentParser(description="Autonomous Agent (Single Cycle)")
    parser.add_argument(
        "--cycle", type=int, help="The current cycle number to execute."
    )
    args = parser.parse_args()

    run_single_cycle(args.cycle)
