from ddgs import DDGS
from .tool import Tool
from ..logging import logger
import os 

class WebSearchTool(Tool):
    NAME = "web_search"
    DESCRIPTION = "Search the web for information using DuckDuckGo. Use sparingly and only when you need specific technical information that you cannot determine through analysis. Search for specific CTF writeups, vulnerability details, or technical documentation only when absolutely necessary. After finding relevant URLs, you MUST explore them deeply using curl to extract detailed information, follow internal links, and analyze the full content structure."
    PARAMETERS = {
        "query": ("string", "the search query to look up on the web"),
        "max_results": ("integer", "maximum number of search results to return (default: 3, max: 10)"),
        "search_type": ("string", "type of search: 'general', 'news', 'academic' (default: 'general')"),
        "include_images": ("boolean", "whether to include image results (default: false)")
    }
    REQUIRED_PARAMETERS = {"query"}

    def __init__(self, environment):
        super().__init__()
        self.environment = environment
        
        # Initialize DuckDuckGo search
        self.ddgs = DDGS()
        
        # DuckDuckGo is free - no cost
        self.cost_per_search = 0.0

    def call(self, query=None, max_results=3, search_type="general", include_images=False):
        if query is None:
            return {"error": "No search query provided"}

        # Limit max_results to prevent abuse
        max_results = min(max(int(max_results), 1), 10)
        
        try:
            print(f"Searching with DuckDuckGo for: {query}")
            
            # Search using DuckDuckGo
            search_results = list(self.ddgs.text(query, max_results=max_results))
            
            # Format results
            formatted_results = []
            for result in search_results:
                formatted_results.append({
                    'title': result.get('title', 'No title'),
                    'url': result.get('href', ''),
                    'snippet': result.get('body', 'No description available'),
                    'type': 'search_result'
                })
            
            print(f"DuckDuckGo search cost: $0.000000 (free)")
            
            return {
                "query": query,
                "total_results": len(formatted_results),
                "results": formatted_results,
                "search_type": search_type,
                "include_images": include_images,
                "search_engine": "duckduckgo",
                "search_cost": 0.0
            }
            
        except Exception as e:
            logger.debug_message(f"DuckDuckGo search error: {str(e)}")
            return {
                "query": query,
                "total_results": 1,
                "results": [{
                    'title': f"Search Error for: {query}",
                    'url': "DuckDuckGo Search",
                    'snippet': f"DuckDuckGo search failed: {str(e)}. Please try again or use a different search approach.",
                    'type': 'search_result'
                }],
                "search_type": search_type,
                "include_images": include_images,
                "search_engine": "duckduckgo",
                "search_cost": 0.0
            }

    def print_tool_call(self, tool_call):
        args = tool_call.parsed_arguments
        query = args.get('query', 'unknown query') if args else 'unknown query'
        logger.assistant_action(f"**{self.NAME}**: searching the web for '{query}' using DuckDuckGo search")

    def print_result(self, tool_result):
        if "error" in tool_result.result:
            logger.print(f"[bold]{self.NAME}[/bold]: [red]{tool_result.result['error']}[/red]", markup=True)
        else:
            result = tool_result.result
            total_results = result.get('total_results', 0)
            query = result.get('query', 'unknown')
            results = result.get('results', [])
            
            formatted_results = self._format_results(results)
            logger.observation_message(
                f"**{self.NAME}**: Found {total_results} results for '{query}' using DuckDuckGo search\n\n" +
                (formatted_results if formatted_results else "No results found.")
            )

    def _format_results(self, results):
        if not results or not isinstance(results, list):
            return "No results found."
        
        formatted = ""
        for i, result in enumerate(results, 1):
            if not isinstance(result, dict):
                continue
                
            title = result.get('title', 'No title')
            url = result.get('url', '')
            snippet = result.get('snippet', 'No description available')
            
            # Clean up title (remove markdown formatting)
            clean_title = title.replace('**', '').replace('###', '').replace('##', '').strip()
            
            formatted += f"{i}. **{clean_title}**\n"
            if url and url != "DuckDuckGo Search":
                formatted += f"   URL: {url}\n"
            
            # Show more content for better analysis
            clean_snippet = snippet.strip()
            if len(clean_snippet) > 300:
                clean_snippet = clean_snippet[:300] + "..."
            formatted += f"   Content: {clean_snippet}\n\n"
        
        formatted += "\n**🔍 ANALYSIS REQUIRED**: You must analyze these search results before taking any action:\n"
        formatted += "1. **Read each result carefully** - What technical information is provided?\n"
        formatted += "2. **Evaluate relevance** - How does this help solve the current challenge?\n"
        formatted += "3. **Explore URLs with curl** - If you see URLs that might contain CTF problem-related information, use curl to explore them:\n"
        formatted += "   - `curl -s <URL>` to get the content\n"
        formatted += "   - `curl -I <URL>` to check headers\n"
        formatted += "   - Look for writeups, solutions, or technical details\n"
        formatted += "4. **Plan next steps** - What specific actions will you take based on this information?\n"
        formatted += "5. **Avoid immediate delegation** - Process the information first, then decide your next move.\n\n"
        formatted += "**💡 URL EXPLORATION TIP**: If any URL looks like it contains CTF writeups, solutions, or technical documentation related to your current problem, immediately use curl to fetch and analyze its content before proceeding.\n\n"
        formatted += "**Remember**: Do not delegate immediately after searching. Analyze the results and determine the most effective next action.\n\n"
        
        return formatted if formatted else "No results found."