from typing import List, Dict, Optional, Any
from scale_env.environment.toolkit import ToolKitBase, ToolType, is_tool
from .database import *
from thefuzz import fuzz, process

"""Tools for job_seeking."""

class JobSeekingTools(ToolKitBase):
    """All tools for job_seeking."""
    
    db: JobSeekingDB
    
    def __init__(self, db: JobSeekingDB):
        """Initialize tools with database."""
        super().__init__(db)
    
    @is_tool()
    def calculate_application_success_rate(self, total_applications: int, successful_applications: int, rejected_applications: int = None) -> dict:
        """
        Calculate the success rate of applications by status.

        This method computes the percentage of successful, rejected, and pending applications
        based on the provided counts. It performs validation on input parameters and calculates
        the rates as percentages of the total applications.

        Args:
            total_applications: Total number of applications submitted
            successful_applications: Number of applications that resulted in offers
            rejected_applications: Number of rejected applications (optional)

        Returns:
            A dictionary containing:
            - success_rate: Percentage of successful applications
            - rejection_rate: Percentage of rejected applications
            - pending_rate: Percentage of pending applications

        Raises:
            ValueError: If input parameters are invalid
        """
        # Validate that total_applications is a positive integer
        if not isinstance(total_applications, int) or total_applications < 0:
            raise ValueError("total_applications must be a non-negative integer")

        # Validate that successful_applications is a non-negative integer
        if not isinstance(successful_applications, int) or successful_applications < 0:
            raise ValueError("successful_applications must be a non-negative integer")

        # Validate that rejected_applications (if provided) is a non-negative integer
        if rejected_applications is not None:
            if not isinstance(rejected_applications, int) or rejected_applications < 0:
                raise ValueError("rejected_applications must be a non-negative integer")
        else:
            # If rejected_applications is not provided, default to 0
            rejected_applications = 0

        # Validate that successful_applications doesn't exceed total_applications
        if successful_applications > total_applications:
            raise ValueError("successful_applications cannot exceed total_applications")

        # Validate that rejected_applications doesn't exceed total_applications
        if rejected_applications > total_applications:
            raise ValueError("rejected_applications cannot exceed total_applications")

        # Validate that the sum of successful and rejected doesn't exceed total
        if successful_applications + rejected_applications > total_applications:
            raise ValueError("Sum of successful_applications and rejected_applications cannot exceed total_applications")

        # Handle edge case where total_applications is 0
        if total_applications == 0:
            return {
                'success_rate': 0.0,
                'rejection_rate': 0.0,
                'pending_rate': 0.0
            }

        # Calculate the number of pending applications
        # Pending = Total - Successful - Rejected
        pending_applications = total_applications - successful_applications - rejected_applications

        # Calculate success rate as a percentage
        # Success Rate = (Successful Applications / Total Applications) * 100
        success_rate = (successful_applications / total_applications) * 100

        # Calculate rejection rate as a percentage
        # Rejection Rate = (Rejected Applications / Total Applications) * 100
        rejection_rate = (rejected_applications / total_applications) * 100

        # Calculate pending rate as a percentage
        # Pending Rate = (Pending Applications / Total Applications) * 100
        pending_rate = (pending_applications / total_applications) * 100

        # Return the calculated rates
        return {
            'success_rate': round(success_rate, 2),
            'rejection_rate': round(rejection_rate, 2),
            'pending_rate': round(pending_rate, 2)
        }

    @is_tool()
    def delete_job_application(self, application_id: str) -> dict:
        """
        Delete a job application from the system

        Args:
            application_id: Unique identifier of the application to delete

        Returns:
            Dictionary containing:
            - application_id: Unique identifier of the deleted application
            - deletion_status: Status of the deletion operation
            - deleted_at: Timestamp when the application was deleted in yyyy-mm-dd HH:MM:SS format

        Raises:
            KeyError: If the application_id does not exist in the system
        """
        from datetime import datetime

        # Validate input parameter
        if not application_id or not isinstance(application_id, str):
            raise ValueError("application_id must be a non-empty string")

        # Access the database
        db = self.db

        # Get the job_application table
        job_application_table = getattr(db, 'job_application', None)

        # Check if the table exists
        if job_application_table is None:
            raise KeyError(f"Application with ID '{application_id}' does not exist in the system")

        # Check if the application exists in the table
        if application_id not in job_application_table:
            raise KeyError(f"Application with ID '{application_id}' does not exist in the system")

        # Remove the application from the table
        # Create a new dictionary without the deleted application
        updated_table = {k: v for k, v in job_application_table.items() if k != application_id}

        # Update the database table with the new dictionary
        setattr(db, 'job_application', updated_table)

        # Generate deletion timestamp
        deleted_at = datetime.now().strftime("%Y-%m-%d %H:%M:%S")

        # Return the deletion result
        return {
            'application_id': application_id,
            'deletion_status': 'deleted',
            'deleted_at': deleted_at
        }

    @is_tool()
    def get_application_notes(self, application_id: str) -> dict:
        """
        Retrieve all notes associated with a job application

        Args:
            application_id: Unique identifier of the application

        Returns:
            Dictionary containing list of notes with note_id, note_content, note_type, and created_at

        Raises:
            KeyError: If application_id does not exist in the system
        """
        # Get database instance
        db = self.db

        # Get application_note table from database
        application_note_table = getattr(db, 'application_note', None)

        # Check if application_note table exists
        if application_note_table is None:
            raise KeyError(f"Application note table not found in database")

        # Collect all notes for the specified application_id
        notes_list = []
        for note in application_note_table.values():
            # Filter notes by application_id
            if note.application_id == application_id:
                # Format the note data according to the return schema
                note_dict = {
                    'note_id': note.note_id,
                    'note_content': note.note_content,
                    'note_type': note.note_type if note.note_type is not None else '',
                    # Convert datetime object to string format "yyyy-mm-dd HH:MM:SS"
                    'created_at': note.created_at.strftime('%Y-%m-%d %H:%M:%S') if hasattr(note.created_at, 'strftime') else str(note.created_at)
                }
                notes_list.append(note_dict)

        # If no notes found for this application_id, raise KeyError
        if not notes_list:
            raise KeyError(f"No notes found for application_id: {application_id}")

        # Sort notes by created_at timestamp (most recent first) for better user experience
        notes_list.sort(key=lambda x: x['created_at'], reverse=True)

        # Return the result in the specified format
        return {
            'notes': notes_list
        }

    @is_tool()
    def update_interview_schedule(self, interview_id: str, new_interview_date: str = None, new_location: str = None) -> dict:
        """
        Update an existing interview schedule with new date and/or location.

        Args:
            interview_id: Unique identifier of the interview to update
            new_interview_date: New scheduled date and time in "yyyy-mm-dd HH:MM:SS" format (optional)
            new_location: New location or platform for the interview (optional)

        Returns:
            Dictionary containing:
                - interview_id: The updated interview's identifier
                - update_status: Status of the update operation ("updated")

        Raises:
            KeyError: If the interview_id does not exist in the system
            ValueError: If new_interview_date format is invalid or if no update parameters provided
        """
        # Validate that at least one update parameter is provided
        if new_interview_date is None and new_location is None:
            raise ValueError("At least one of new_interview_date or new_location must be provided for update")

        # Access the database
        db = self.db

        # Retrieve the interview_schedule table from database
        interview_schedule_table = getattr(db, 'interview_schedule', None)

        # Check if the table exists and is not empty
        if interview_schedule_table is None:
            raise KeyError("Interview schedule table not found in database")

        # Check if the interview exists in the table
        if interview_id not in interview_schedule_table:
            raise KeyError(f"Interview with id '{interview_id}' not found")

        # Get the existing interview record
        interview = interview_schedule_table[interview_id]

        # Update interview_date if provided
        if new_interview_date is not None:
            try:
                # Parse the new interview date string to datetime object
                # Support both full datetime format and date-only format
                if len(new_interview_date.strip()) == 10:
                    # Date only format: "yyyy-mm-dd"
                    parsed_date = datetime.strptime(new_interview_date.strip(), "%Y-%m-%d")
                else:
                    # Full datetime format: "yyyy-mm-dd HH:MM:SS"
                    parsed_date = datetime.strptime(new_interview_date.strip(), "%Y-%m-%d %H:%M:%S")

                # Update the interview_date field
                interview.interview_date = parsed_date
            except ValueError as e:
                raise ValueError(f"Invalid date format for new_interview_date. Expected 'yyyy-mm-dd HH:MM:SS' or 'yyyy-mm-dd', got '{new_interview_date}': {str(e)}")

        # Update interview_location if provided
        if new_location is not None:
            interview.interview_location = new_location

        # Save the updated interview back to the database
        interview_schedule_table[interview_id] = interview
        setattr(db, 'interview_schedule', interview_schedule_table)

        # Return the result with interview_id and update status
        return {
            'interview_id': interview_id,
            'update_status': 'updated'
        }

    @is_tool()
    def prioritize_applications(self, applications: list) -> dict:
        """
        Prioritize applications based on multiple criteria including deadline urgency,
        match score, and company preference.

        Args:
            applications: List of application dictionaries with priority factors

        Returns:
            Dictionary containing prioritized applications sorted by priority score

        Raises:
            ValueError: If applications list is empty or invalid data is provided
        """
        # Validate input parameters
        if not applications:
            raise ValueError("Applications list cannot be empty")

        if not isinstance(applications, list):
            raise ValueError("Applications must be a list")

        # Validate each application has required fields
        for app in applications:
            if not isinstance(app, dict):
                raise ValueError("Each application must be a dictionary")

            if 'application_id' not in app:
                raise ValueError("Each application must have an 'application_id' field")

            # Validate and set default values for priority factors
            if 'deadline_urgency' not in app:
                app['deadline_urgency'] = 0
            if 'match_score' not in app:
                app['match_score'] = 0.0
            if 'company_preference' not in app:
                app['company_preference'] = 0

            # Validate data types and ranges
            if not isinstance(app['application_id'], str):
                raise ValueError(f"application_id must be a string for application {app.get('application_id', 'unknown')}")

            if not isinstance(app['deadline_urgency'], (int, float)):
                raise ValueError(f"deadline_urgency must be a number for application {app['application_id']}")

            if not isinstance(app['match_score'], (int, float)):
                raise ValueError(f"match_score must be a number for application {app['application_id']}")

            if not isinstance(app['company_preference'], (int, float)):
                raise ValueError(f"company_preference must be a number for application {app['application_id']}")

            # Validate reasonable ranges (optional but good practice)
            if app['deadline_urgency'] < 0:
                raise ValueError(f"deadline_urgency cannot be negative for application {app['application_id']}")

            if app['match_score'] < 0 or app['match_score'] > 100:
                raise ValueError(f"match_score must be between 0 and 100 for application {app['application_id']}")

            if app['company_preference'] < 0:
                raise ValueError(f"company_preference cannot be negative for application {app['application_id']}")

        # Calculate priority score for each application
        # Priority score formula: weighted sum of normalized factors
        # - deadline_urgency: weight 0.4 (40%) - most important for time-sensitive applications
        # - match_score: weight 0.35 (35%) - important for fit quality
        # - company_preference: weight 0.25 (25%) - personal preference factor

        prioritized_list = []

        for app in applications:
            # Extract priority factors
            deadline_urgency = float(app['deadline_urgency'])
            match_score = float(app['match_score'])
            company_preference = float(app['company_preference'])

            # Normalize deadline_urgency to 0-100 scale (assuming max urgency is 5)
            # Higher urgency = higher score
            normalized_urgency = (deadline_urgency / 5.0) * 100.0 if deadline_urgency <= 5 else 100.0

            # match_score is already on 0-100 scale
            normalized_match = match_score

            # Normalize company_preference to 0-100 scale (assuming max preference is 5)
            # Higher preference = higher score
            normalized_preference = (company_preference / 5.0) * 100.0 if company_preference <= 5 else 100.0

            # Calculate weighted priority score
            priority_score = (
                normalized_urgency * 0.4 +
                normalized_match * 0.35 +
                normalized_preference * 0.25
            )

            # Round to 1 decimal place for cleaner output
            priority_score = round(priority_score, 1)

            # Add to prioritized list
            prioritized_list.append({
                'application_id': app['application_id'],
                'priority_score': priority_score
            })

        # Sort by priority score in descending order (highest priority first)
        prioritized_list.sort(key=lambda x: x['priority_score'], reverse=True)

        # Return the prioritized applications
        return {
            'prioritized_applications': prioritized_list
        }

    @is_tool()
    def compare_applications(self, application_1: dict, application_2: dict) -> dict:
        """
        Compare two job applications side by side and provide a comparison summary and recommendation.

        This method analyzes two application datasets and generates insights about their differences,
        helping users prioritize their job applications based on various factors including match score,
        status, job title, and company.

        Args:
            application_1: First application data containing job_title, company_name, status, and match_score
            application_2: Second application data containing job_title, company_name, status, and match_score

        Returns:
            dict: Contains comparison_summary and recommendation

        Raises:
            ValueError: If required fields are missing or invalid in either application
        """
        # Validate that both applications are provided and are dictionaries
        if not isinstance(application_1, dict) or not isinstance(application_2, dict):
            raise ValueError("Both application_1 and application_2 must be dictionary objects")

        # Define required fields for each application
        required_fields = ['job_title', 'company_name', 'status', 'match_score']

        # Validate application_1 has all required fields
        for field in required_fields:
            if field not in application_1:
                raise ValueError(f"application_1 is missing required field: {field}")

        # Validate application_2 has all required fields
        for field in required_fields:
            if field not in application_2:
                raise ValueError(f"application_2 is missing required field: {field}")

        # Validate match_score is a number for both applications
        try:
            score_1 = float(application_1['match_score'])
            score_2 = float(application_2['match_score'])
        except (ValueError, TypeError):
            raise ValueError("match_score must be a valid number for both applications")

        # Extract application details
        job_title_1 = application_1['job_title']
        company_1 = application_1['company_name']
        status_1 = application_1['status']

        job_title_2 = application_2['job_title']
        company_2 = application_2['company_name']
        status_2 = application_2['status']

        # Define status priority mapping (higher value = more advanced in process)
        # This helps determine which application is further along
        status_priority = {
            'submitted': 1,
            'under_review': 2,
            'phone_screening': 3,
            'technical_interview': 4,
            'final_interview': 5,
            'accepted': 6,
            'rejected': 0,
            'withdrawn': 0,
            'archived': 0
        }

        # Get status priorities (default to 1 if status not in mapping)
        priority_1 = status_priority.get(status_1.lower(), 1)
        priority_2 = status_priority.get(status_2.lower(), 1)

        # Build comparison summary components
        summary_parts = []

        # Compare match scores
        score_diff = abs(score_1 - score_2)
        if score_diff > 5:  # Significant difference threshold
            if score_1 > score_2:
                summary_parts.append(f"Application 1 has a higher match score ({score_1:.1f} vs {score_2:.1f})")
            else:
                summary_parts.append(f"Application 2 has a higher match score ({score_2:.1f} vs {score_1:.1f})")
        else:
            summary_parts.append(f"Both applications have similar match scores ({score_1:.1f} vs {score_2:.1f})")

        # Compare application status/stage
        if priority_1 > priority_2:
            summary_parts.append(f"Application 1 is at a more advanced stage ({status_1} vs {status_2})")
        elif priority_2 > priority_1:
            summary_parts.append(f"Application 2 is at a more advanced stage ({status_2} vs {status_1})")
        else:
            summary_parts.append(f"Both applications are at similar stages ({status_1})")

        # Add company and job title information
        summary_parts.append(f"Application 1: {job_title_1} at {company_1}")
        summary_parts.append(f"Application 2: {job_title_2} at {company_2}")

        # Combine summary parts
        comparison_summary = "; ".join(summary_parts)

        # Generate recommendation based on multiple factors
        # Calculate weighted score: match_score (60%) + status_priority (40%)
        weighted_score_1 = score_1 * 0.6 + priority_1 * 8 * 0.4  # Normalize priority to ~0-48 scale
        weighted_score_2 = score_2 * 0.6 + priority_2 * 8 * 0.4

        # Determine recommendation
        recommendation_parts = []

        # Check for rejected/withdrawn/archived status - these should not be prioritized
        if priority_1 == 0 and priority_2 == 0:
            recommendation = "Neither application should be prioritized as both are inactive (rejected, withdrawn, or archived)"
        elif priority_1 == 0:
            recommendation = "Prioritize Application 2 as Application 1 is inactive (rejected, withdrawn, or archived)"
        elif priority_2 == 0:
            recommendation = "Prioritize Application 1 as Application 2 is inactive (rejected, withdrawn, or archived)"
        else:
            # Both applications are active, compare weighted scores
            if weighted_score_1 > weighted_score_2 + 5:  # Threshold for clear preference
                recommendation_parts.append("Prioritize Application 1")

                # Add specific reasons
                reasons = []
                if score_1 > score_2 + 5:
                    reasons.append(f"higher match score ({score_1:.1f})")
                if priority_1 > priority_2:
                    reasons.append(f"more advanced stage ({status_1})")

                if reasons:
                    recommendation_parts.append("due to " + " and ".join(reasons))

                recommendation = " ".join(recommendation_parts)

            elif weighted_score_2 > weighted_score_1 + 5:
                recommendation_parts.append("Prioritize Application 2")

                # Add specific reasons
                reasons = []
                if score_2 > score_1 + 5:
                    reasons.append(f"higher match score ({score_2:.1f})")
                if priority_2 > priority_1:
                    reasons.append(f"more advanced stage ({status_2})")

                if reasons:
                    recommendation_parts.append("due to " + " and ".join(reasons))

                recommendation = " ".join(recommendation_parts)

            else:
                # Very close scores - provide balanced recommendation
                recommendation = (f"Both applications are competitive. "
                                f"Application 1 (score: {score_1:.1f}, status: {status_1}) and "
                                f"Application 2 (score: {score_2:.1f}, status: {status_2}) "
                                f"have similar potential. Consider other factors like company culture, "
                                f"career growth opportunities, and personal preferences")

        # Return comparison result
        return {
            'comparison_summary': comparison_summary,
            'recommendation': recommendation
        }

    @is_tool()
    def attach_resume_to_application(self, application_id: str, resume_content: str, resume_format: str = None, uploaded_at: str = None):
        """
        Attach or update resume content for a job application.

        This method updates the resume-related fields of an existing job application,
        including the resume content, format, and upload timestamp.

        Args:
            application_id: Unique identifier of the application
            resume_content: Text content of the resume
            resume_format: Format of the resume document (e.g., 'pdf', 'docx'), optional
            uploaded_at: Timestamp when the resume was uploaded in yyyy-mm-dd HH:MM:SS format, optional

        Returns:
            dict: Contains application_id and resume_attached status

        Raises:
            KeyError: If the application_id does not exist in the database
        """
        from datetime import datetime

        # Access the database
        db = self.db

        # Retrieve the job_application table
        job_application_table = getattr(db, 'job_application', None)

        # Check if the table exists
        if job_application_table is None:
            raise KeyError(f"Application with ID '{application_id}' not found: job_application table does not exist")

        # Check if the application exists in the table
        if application_id not in job_application_table:
            raise KeyError(f"Application with ID '{application_id}' not found in the system")

        # Retrieve the application record
        application = job_application_table[application_id]

        # Update resume content (required field)
        application.resume_content = resume_content

        # Update resume format if provided
        if resume_format is not None:
            application.resume_format = resume_format

        # Update resume uploaded timestamp
        if uploaded_at is not None:
            # Parse the uploaded_at string to datetime object
            try:
                application.resume_uploaded_at = datetime.strptime(uploaded_at, "%Y-%m-%d %H:%M:%S")
            except ValueError:
                # If time part is missing, try parsing date only
                try:
                    application.resume_uploaded_at = datetime.strptime(uploaded_at, "%Y-%m-%d")
                except ValueError:
                    raise ValueError(f"Invalid datetime format for uploaded_at: '{uploaded_at}'. Expected format: 'yyyy-mm-dd HH:MM:SS' or 'yyyy-mm-dd'")
        else:
            # If no uploaded_at provided, use current timestamp
            application.resume_uploaded_at = datetime.now()

        # Update the updated_at timestamp to reflect the modification
        application.updated_at = datetime.now()

        # Write the updated application back to the database
        job_application_table[application_id] = application
        setattr(db, 'job_application', job_application_table)

        # Return success response
        return {
            'application_id': application_id,
            'resume_attached': True
        }

    @is_tool()
    def add_application_note(self, application_id: str, note_content: str, created_at: str, note_type: str = None):
        """
        Add a note or comment to a job application for tracking purposes.

        Args:
            application_id: Unique identifier of the application
            note_content: Content of the note
            created_at: Timestamp when the note was created in yyyy-mm-dd HH:MM:SS format
            note_type: Type or category of the note (optional)

        Returns:
            dict: Dictionary containing note_id and application_id

        Raises:
            KeyError: If the application does not exist in the system
            ValueError: If required parameters are invalid
        """
        import secrets
        import hashlib
        from datetime import datetime

        # Validate required parameters
        if not application_id or not isinstance(application_id, str):
            raise ValueError("application_id must be a non-empty string")

        if not note_content or not isinstance(note_content, str):
            raise ValueError("note_content must be a non-empty string")

        if not created_at or not isinstance(created_at, str):
            raise ValueError("created_at must be a non-empty string")

        # Validate and parse created_at timestamp
        try:
            created_at_dt = datetime.strptime(created_at, "%Y-%m-%d %H:%M:%S")
        except ValueError:
            try:
                # Try date-only format as fallback
                created_at_dt = datetime.strptime(created_at, "%Y-%m-%d")
                # Add default time for date-only format
                created_at_dt = created_at_dt.replace(hour=0, minute=0, second=0)
            except ValueError:
                raise ValueError("created_at must be in 'yyyy-mm-dd HH:MM:SS' or 'yyyy-mm-dd' format")

        # Validate note_type if provided
        if note_type is not None and not isinstance(note_type, str):
            raise ValueError("note_type must be a string if provided")

        # Access the database
        db = self.db

        # Verify that the application exists by checking job_application table
        # This is the pre-condition: Application must exist in the system
        job_application_table = getattr(db, "job_application", None)
        if job_application_table is None or application_id not in job_application_table:
            raise KeyError(f"Application with ID '{application_id}' does not exist in the system")

        # Get the application_note table
        application_note_table = getattr(db, "application_note", None)

        # Initialize the table if it doesn't exist
        if application_note_table is None:
            application_note_table = {}
            setattr(db, "application_note", application_note_table)

        # Generate a unique note_id
        prefix = "NOTE-"
        year = created_at_dt.strftime("%Y")

        # Generate unique ID with year prefix and hash suffix
        note_id = f"{prefix}{year}-{hashlib.sha256(secrets.token_bytes(32)).hexdigest()[:6].upper()}"

        # Ensure the generated note_id is unique
        while note_id in application_note_table:
            note_id = f"{prefix}{year}-{hashlib.sha256(secrets.token_bytes(32)).hexdigest()[:6].upper()}"

        # Create the new ApplicationNote instance
        new_note = ApplicationNote(
            note_id=note_id,
            application_id=application_id,
            note_content=note_content,
            note_type=note_type,
            created_at=created_at_dt
        )

        # Add the note to the application_note table
        application_note_table[note_id] = new_note
        setattr(db, "application_note", application_note_table)

        # Return the result with note_id and application_id
        return {
            "note_id": note_id,
            "application_id": application_id
        }

    @is_tool()
    def generate_follow_up_reminder(self, job_title: str, company_name: str, application_date: str, follow_up_date: str) -> dict:
        """
        Generate a follow-up reminder message for a job application.

        This method creates a formatted reminder message based on the provided application details.
        It validates the date formats and generates a professional reminder message.

        Args:
            job_title: The title of the job position
            company_name: The name of the company
            application_date: Date when the application was submitted (format: yyyy-mm-dd HH:MM:SS)
            follow_up_date: Date when follow-up should occur (format: yyyy-mm-dd HH:MM:SS)

        Returns:
            dict: A dictionary containing the generated reminder message
                - reminder_message: The formatted reminder message string

        Raises:
            ValueError: If required parameters are missing or date formats are invalid
        """
        from datetime import datetime

        # Validate required parameters are not empty
        if not job_title or not isinstance(job_title, str) or not job_title.strip():
            raise ValueError("job_title must be a non-empty string")

        if not company_name or not isinstance(company_name, str) or not company_name.strip():
            raise ValueError("company_name must be a non-empty string")

        if not application_date or not isinstance(application_date, str):
            raise ValueError("application_date must be a non-empty string")

        if not follow_up_date or not isinstance(follow_up_date, str):
            raise ValueError("follow_up_date must be a non-empty string")

        # Validate and parse application_date
        try:
            # Try parsing with full datetime format first (yyyy-mm-dd HH:MM:SS)
            if len(application_date.strip()) > 10:
                app_date_obj = datetime.strptime(application_date.strip(), "%Y-%m-%d %H:%M:%S")
                app_date_str = app_date_obj.strftime("%Y-%m-%d")
            else:
                # If only date is provided (yyyy-mm-dd)
                app_date_obj = datetime.strptime(application_date.strip(), "%Y-%m-%d")
                app_date_str = app_date_obj.strftime("%Y-%m-%d")
        except ValueError as e:
            raise ValueError(f"application_date must be in 'yyyy-mm-dd HH:MM:SS' or 'yyyy-mm-dd' format: {str(e)}")

        # Validate and parse follow_up_date
        try:
            # Try parsing with full datetime format first (yyyy-mm-dd HH:MM:SS)
            if len(follow_up_date.strip()) > 10:
                follow_date_obj = datetime.strptime(follow_up_date.strip(), "%Y-%m-%d %H:%M:%S")
            else:
                # If only date is provided (yyyy-mm-dd)
                follow_date_obj = datetime.strptime(follow_up_date.strip(), "%Y-%m-%d")
        except ValueError as e:
            raise ValueError(f"follow_up_date must be in 'yyyy-mm-dd HH:MM:SS' or 'yyyy-mm-dd' format: {str(e)}")

        # Check that follow_up_date is after application_date
        if follow_date_obj < app_date_obj:
            raise ValueError("follow_up_date must be on or after application_date")

        # Generate the reminder message
        # Format: "Follow up on your [Job Title] application at [Company Name] (applied on [Date])"
        reminder_message = f"Follow up on your {job_title.strip()} application at {company_name.strip()} (applied on {app_date_str})"

        return {
            "reminder_message": reminder_message
        }

    @is_tool()
    def add_interview_schedule(self, application_id: str, interview_type: str, interview_date: str, 
                              interviewer_name: Optional[str] = None, interview_location: Optional[str] = None, 
                              interview_duration_minutes: Optional[int] = None) -> dict:
        """
        Add an interview schedule to a job application.

        This method creates a new interview schedule record in the database for a given job application.
        It validates the input parameters, checks if the application exists, generates a unique interview ID,
        and stores the interview schedule information.

        Args:
            application_id: Unique identifier of the application
            interview_type: Type of interview (e.g., technical_interview, phone_screening)
            interview_date: Scheduled date and time in "yyyy-mm-dd HH:MM:SS" format
            interviewer_name: Optional name of the interviewer
            interview_location: Optional location or platform for the interview
            interview_duration_minutes: Optional expected duration in minutes

        Returns:
            Dictionary containing:
                - interview_id: Generated unique identifier for the interview
                - application_id: The application ID this interview is associated with

        Raises:
            KeyError: If the application_id does not exist in the system
            ValueError: If interview_date format is invalid or parameters are invalid
        """
        from datetime import datetime

        # Validate required parameters
        if not application_id or not isinstance(application_id, str):
            raise ValueError("application_id must be a non-empty string")

        if not interview_type or not isinstance(interview_type, str):
            raise ValueError("interview_type must be a non-empty string")

        if not interview_date or not isinstance(interview_date, str):
            raise ValueError("interview_date must be a non-empty string")

        # Validate optional parameters
        if interviewer_name is not None and not isinstance(interviewer_name, str):
            raise ValueError("interviewer_name must be a string")

        if interview_location is not None and not isinstance(interview_location, str):
            raise ValueError("interview_location must be a string")

        if interview_duration_minutes is not None:
            if not isinstance(interview_duration_minutes, int):
                raise ValueError("interview_duration_minutes must be an integer")
            if interview_duration_minutes <= 0:
                raise ValueError("interview_duration_minutes must be a positive integer")

        # Parse and validate interview_date string
        try:
            if len(interview_date.strip()) == 10:  # Date only format "yyyy-mm-dd"
                parsed_date = datetime.strptime(interview_date.strip(), "%Y-%m-%d")
                formatted_date = parsed_date.strftime("%Y-%m-%d %H:%M:%S")
            else:  # Full datetime format "yyyy-mm-dd HH:MM:SS"
                parsed_date = datetime.strptime(interview_date.strip(), "%Y-%m-%d %H:%M:%S")
                formatted_date = interview_date.strip()
        except ValueError as e:
            raise ValueError(f"interview_date must be in 'yyyy-mm-dd HH:MM:SS' or 'yyyy-mm-dd' format: {str(e)}")

        # Access the database
        db = self.db

        # Verify that the application exists in the system
        job_application_table = getattr(db, "job_application", None)
        if job_application_table is None or application_id not in job_application_table:
            raise KeyError(f"Application with ID '{application_id}' does not exist in the system")

        # Check if interview_schedule table exists in database
        interview_schedule_table = getattr(db, "interview_schedule", None)
        if interview_schedule_table is None:
            setattr(db, "interview_schedule", {})
            interview_schedule_table = getattr(db, "interview_schedule")

        # Generate unique interview_id
        import random
        import string
        counter = 1
        while True:
            random_suffix = ''.join(random.choices(string.digits, k=3))
            interview_id = f"INT-{random_suffix}{counter:04d}"
            if interview_id not in interview_schedule_table:
                break
            counter += 1

        # Create new InterviewSchedule instance
        new_interview = InterviewSchedule(
            interview_id=interview_id,
            application_id=application_id,
            interview_type=interview_type,
            interview_date=formatted_date,
            interviewer_name=interviewer_name,
            interview_location=interview_location,
            interview_duration_minutes=interview_duration_minutes
        )

        # Add the new interview schedule to the database
        interview_schedule_table[interview_id] = new_interview
        setattr(db, "interview_schedule", interview_schedule_table)

        # Return the result with interview_id and application_id
        return {
            "interview_id": interview_id,
            "application_id": application_id
        }

    @is_tool()
    def extract_keywords_from_resume(self, resume_content: str) -> dict:
        """
        Extract key skills and keywords from resume content.

        This method analyzes resume text to identify technical skills, soft skills,
        and general keywords using natural language processing techniques.
        """
        import re
        from collections import Counter

        # Validate input
        if not resume_content:
            raise ValueError("Resume content cannot be empty")

        if not isinstance(resume_content, str):
            raise ValueError("Resume content must be a string")

        # Convert to lowercase for processing
        content_lower = resume_content.lower()

        # Define comprehensive technical skills keywords
        # These are common technical skills found in resumes
        technical_skills_patterns = {
            # Programming languages
            'python', 'java', 'javascript', 'typescript', 'c++', 'c#', 'ruby', 'php', 
            'swift', 'kotlin', 'go', 'rust', 'scala', 'r', 'matlab', 'perl',

            # Web technologies
            'html', 'css', 'react', 'angular', 'vue', 'node.js', 'express', 'django',
            'flask', 'spring', 'asp.net', 'jquery', 'bootstrap', 'webpack', 'sass',

            # Databases
            'sql', 'mysql', 'postgresql', 'mongodb', 'redis', 'cassandra', 'oracle',
            'sqlite', 'dynamodb', 'elasticsearch', 'neo4j',

            # Cloud & DevOps
            'aws', 'azure', 'gcp', 'docker', 'kubernetes', 'jenkins', 'terraform',
            'ansible', 'ci/cd', 'git', 'github', 'gitlab', 'bitbucket', 'linux',

            # Data Science & ML
            'machine learning', 'deep learning', 'tensorflow', 'pytorch', 'keras',
            'scikit-learn', 'pandas', 'numpy', 'data analysis', 'statistics',
            'neural networks', 'nlp', 'computer vision', 'ai',

            # Testing & Quality
            'junit', 'pytest', 'selenium', 'cypress', 'jest', 'testing',
            'unit testing', 'integration testing', 'tdd', 'bdd',

            # Other technical
            'api', 'rest', 'graphql', 'microservices', 'agile', 'scrum',
            'jira', 'confluence', 'soap', 'xml', 'json', 'yaml'
        }

        # Define soft skills keywords
        soft_skills_patterns = {
            'leadership', 'communication', 'teamwork', 'problem solving', 
            'critical thinking', 'creativity', 'adaptability', 'time management',
            'collaboration', 'interpersonal', 'analytical', 'detail-oriented',
            'self-motivated', 'initiative', 'organization', 'presentation',
            'negotiation', 'conflict resolution', 'mentoring', 'coaching',
            'strategic thinking', 'decision making', 'emotional intelligence',
            'project management', 'multitasking', 'flexibility', 'innovative'
        }

        # Extract technical skills
        technical_skills = []
        for skill in technical_skills_patterns:
            # Use word boundaries to match whole words/phrases
            pattern = r'\b' + re.escape(skill) + r'\b'
            if re.search(pattern, content_lower):
                # Preserve original casing from common abbreviations
                if skill.upper() in ['AWS', 'GCP', 'SQL', 'API', 'REST', 'HTML', 
                                     'CSS', 'XML', 'JSON', 'YAML', 'CI/CD', 'AI',
                                     'ML', 'NLP', 'TDD', 'BDD']:
                    technical_skills.append(skill.upper())
                else:
                    technical_skills.append(skill.title() if ' ' in skill else skill)

        # Extract soft skills
        soft_skills = []
        for skill in soft_skills_patterns:
            pattern = r'\b' + re.escape(skill) + r'\b'
            if re.search(pattern, content_lower):
                soft_skills.append(skill.title() if ' ' in skill else skill)

        # Extract general keywords
        # Remove common stop words
        stop_words = {
            'the', 'a', 'an', 'and', 'or', 'but', 'in', 'on', 'at', 'to', 'for',
            'of', 'with', 'by', 'from', 'as', 'is', 'was', 'are', 'were', 'been',
            'be', 'have', 'has', 'had', 'do', 'does', 'did', 'will', 'would',
            'could', 'should', 'may', 'might', 'must', 'can', 'this', 'that',
            'these', 'those', 'i', 'you', 'he', 'she', 'it', 'we', 'they',
            'my', 'your', 'his', 'her', 'its', 'our', 'their', 'me', 'him',
            'them', 'us', 'who', 'what', 'where', 'when', 'why', 'how'
        }

        # Tokenize: extract words (alphanumeric sequences, preserving dots for abbreviations)
        words = re.findall(r'\b[a-z0-9.]+\b', content_lower)

        # Filter and count meaningful words
        # Keep words that are:
        # 1. Not stop words
        # 2. Length >= 3 characters
        # 3. Not purely numeric
        meaningful_words = [
            word for word in words 
            if word not in stop_words 
            and len(word) >= 3 
            and not word.isdigit()
        ]

        # Count word frequency
        word_freq = Counter(meaningful_words)

        # Extract top keywords (appearing at least once, sorted by frequency)
        # Take top 50 most common words as keywords
        top_keywords = [word for word, count in word_freq.most_common(50)]

        # Capitalize keywords appropriately
        keywords = []
        for word in top_keywords:
            # Check if it's a known technical term that should be uppercase
            if word.upper() in ['AWS', 'GCP', 'SQL', 'API', 'REST', 'HTML', 
                                'CSS', 'XML', 'JSON', 'YAML', 'AI', 'ML', 'NLP']:
                keywords.append(word.upper())
            else:
                keywords.append(word)

        # Remove duplicates while preserving order
        technical_skills = list(dict.fromkeys(technical_skills))
        soft_skills = list(dict.fromkeys(soft_skills))
        keywords = list(dict.fromkeys(keywords))

        return {
            'technical_skills': technical_skills,
            'soft_skills': soft_skills,
            'keywords': keywords
        }

    @is_tool()
    def update_application_status(self, application_id: str, new_status: str, updated_at: str):
        """
        Update the status of an existing job application

        Args:
            application_id: Unique identifier of the application
            new_status: New status to be set for the application
            updated_at: Timestamp of the status update in yyyy-mm-dd HH:MM:SS format

        Returns:
            dict: Dictionary containing application_id, previous_status, and current status

        Raises:
            KeyError: If application_id does not exist in the database
            ValueError: If updated_at format is invalid
        """
        from datetime import datetime

        # Validate and parse the updated_at timestamp
        try:
            update_timestamp = datetime.strptime(updated_at, "%Y-%m-%d %H:%M:%S")
        except ValueError:
            raise ValueError(f"Invalid timestamp format for updated_at: '{updated_at}'. Expected format: 'yyyy-mm-dd HH:MM:SS'")

        # Access the database
        db = self.db

        # Retrieve the job_application table
        job_application_table = getattr(db, "job_application", None)

        # Check if the table exists
        if job_application_table is None:
            raise KeyError(f"Application with ID '{application_id}' does not exist")

        # Check if the application exists in the table
        if application_id not in job_application_table:
            raise KeyError(f"Application with ID '{application_id}' does not exist")

        # Retrieve the existing application record
        application = job_application_table[application_id]

        # Store the previous status before updating
        previous_status = application.status

        # Update the application status and updated_at timestamp
        application.status = new_status
        application.updated_at = update_timestamp

        # Write the updated application back to the database
        job_application_table[application_id] = application
        setattr(db, "job_application", job_application_table)

        # Return the result with application_id, previous_status, and current status
        return {
            "application_id": application_id,
            "previous_status": previous_status,
            "status": new_status
        }

    @is_tool()
    def calculate_application_response_time(self, application_date: str, current_date: str) -> dict:
        """
        Calculate the time elapsed since application submission.

        This method computes:
        - Total days elapsed
        - Total hours elapsed
        - Business days elapsed (excluding weekends)

        Args:
            application_date: Date when the application was submitted in yyyy-mm-dd HH:MM:SS format
            current_date: Current date for calculation in yyyy-mm-dd HH:MM:SS format

        Returns:
            dict: Dictionary containing days_elapsed, hours_elapsed, and business_days_elapsed

        Raises:
            ValueError: If date format is invalid or current_date is before application_date
        """
        from datetime import datetime

        # Validate input parameters are not empty
        if not application_date or not isinstance(application_date, str):
            raise ValueError("application_date must be a non-empty string")
        if not current_date or not isinstance(current_date, str):
            raise ValueError("current_date must be a non-empty string")

        # Parse the date strings to datetime objects
        # Support both full datetime format (yyyy-mm-dd HH:MM:SS) and date-only format (yyyy-mm-dd)
        try:
            # Try parsing with time first
            if len(application_date.strip()) > 10:
                app_datetime = datetime.strptime(application_date.strip(), "%Y-%m-%d %H:%M:%S")
            else:
                # If only date is provided, assume 00:00:00
                app_datetime = datetime.strptime(application_date.strip(), "%Y-%m-%d")
        except ValueError as e:
            raise ValueError(f"Invalid application_date format. Expected 'yyyy-mm-dd HH:MM:SS' or 'yyyy-mm-dd', got: {application_date}") from e

        try:
            # Try parsing with time first
            if len(current_date.strip()) > 10:
                curr_datetime = datetime.strptime(current_date.strip(), "%Y-%m-%d %H:%M:%S")
            else:
                # If only date is provided, assume 00:00:00
                curr_datetime = datetime.strptime(current_date.strip(), "%Y-%m-%d")
        except ValueError as e:
            raise ValueError(f"Invalid current_date format. Expected 'yyyy-mm-dd HH:MM:SS' or 'yyyy-mm-dd', got: {current_date}") from e

        # Validate that current_date is not before application_date
        if curr_datetime < app_datetime:
            raise ValueError("current_date cannot be before application_date")

        # Calculate the time difference
        time_delta = curr_datetime - app_datetime

        # Calculate days elapsed (total days including partial days)
        days_elapsed = time_delta.days

        # Calculate total hours elapsed
        total_seconds = time_delta.total_seconds()
        hours_elapsed = int(total_seconds // 3600)

        # Calculate business days elapsed (excluding weekends: Saturday=5, Sunday=6)
        business_days_elapsed = 0
        current_check_date = app_datetime.date()
        end_date = curr_datetime.date()

        # Iterate through each day and count business days
        while current_check_date <= end_date:
            # weekday() returns 0=Monday, 1=Tuesday, ..., 4=Friday, 5=Saturday, 6=Sunday
            if current_check_date.weekday() < 5:  # Monday to Friday
                business_days_elapsed += 1

            # Move to next day
            from datetime import timedelta
            current_check_date += timedelta(days=1)

        # If the application was submitted and current date is on the same day,
        # we should count it as 0 business days if it's the same calendar day
        if app_datetime.date() == curr_datetime.date():
            business_days_elapsed = 0
        else:
            # Adjust: we've been counting inclusive of both start and end dates
            # We need to exclude the start date from the count
            if app_datetime.date().weekday() < 5:
                business_days_elapsed -= 1

        # Ensure business days is not negative
        if business_days_elapsed < 0:
            business_days_elapsed = 0

        return {
            "days_elapsed": days_elapsed,
            "hours_elapsed": hours_elapsed,
            "business_days_elapsed": business_days_elapsed
        }

    @is_tool()
    def calculate_application_diversity_score(self, applications: list) -> dict:
        """
        Calculate diversity score based on variety of companies and roles applied to.

        This method analyzes the diversity of job applications by counting unique companies,
        job titles, and industries. It then calculates an overall diversity score based on
        these metrics.

        Args:
            applications: List of application dictionaries, each containing:
                - job_title (str): Title of the job position
                - company_name (str): Name of the company
                - industry (str): Industry sector

        Returns:
            dict: Dictionary containing:
                - unique_companies (int): Number of unique companies
                - unique_job_titles (int): Number of unique job titles
                - unique_industries (int): Number of unique industries
                - diversity_score (float): Overall diversity score (0-100)

        Raises:
            ValueError: If applications list is empty or contains invalid data
        """
        # Validate input: applications must be a non-empty list
        if not applications:
            raise ValueError("Applications list cannot be empty")

        if not isinstance(applications, list):
            raise ValueError("Applications must be a list")

        # Initialize sets to track unique values (sets automatically handle duplicates)
        unique_companies = set()
        unique_job_titles = set()
        unique_industries = set()

        # Iterate through all applications and extract unique values
        for idx, app in enumerate(applications):
            # Validate that each application is a dictionary
            if not isinstance(app, dict):
                raise ValueError(f"Application at index {idx} must be a dictionary")

            # Extract and validate required fields
            job_title = app.get('job_title')
            company_name = app.get('company_name')
            industry = app.get('industry')

            # Validate that required fields are present and are strings
            if not job_title or not isinstance(job_title, str):
                raise ValueError(f"Application at index {idx} must have a valid 'job_title' string")
            if not company_name or not isinstance(company_name, str):
                raise ValueError(f"Application at index {idx} must have a valid 'company_name' string")
            if not industry or not isinstance(industry, str):
                raise ValueError(f"Application at index {idx} must have a valid 'industry' string")

            # Add normalized values to sets (strip whitespace and convert to lowercase for consistency)
            unique_companies.add(company_name.strip().lower())
            unique_job_titles.add(job_title.strip().lower())
            unique_industries.add(industry.strip().lower())

        # Count unique values
        num_unique_companies = len(unique_companies)
        num_unique_job_titles = len(unique_job_titles)
        num_unique_industries = len(unique_industries)
        total_applications = len(applications)

        # Calculate diversity score (0-100 scale)
        # The score is based on the ratio of unique values to total applications
        # We weight each component equally (companies: 40%, job titles: 40%, industries: 20%)
        # Higher ratios indicate more diversity

        # Company diversity component (40% weight)
        # Maximum score when each application is to a different company
        company_diversity = min((num_unique_companies / total_applications) * 100, 100) * 0.4

        # Job title diversity component (40% weight)
        # Maximum score when each application is for a different job title
        job_title_diversity = min((num_unique_job_titles / total_applications) * 100, 100) * 0.4

        # Industry diversity component (20% weight)
        # Maximum score when applications span multiple industries
        industry_diversity = min((num_unique_industries / total_applications) * 100, 100) * 0.2

        # Calculate overall diversity score
        diversity_score = company_diversity + job_title_diversity + industry_diversity

        # Round to one decimal place for readability
        diversity_score = round(diversity_score, 1)

        # Return results
        return {
            'unique_companies': num_unique_companies,
            'unique_job_titles': num_unique_job_titles,
            'unique_industries': num_unique_industries,
            'diversity_score': diversity_score
        }

    @is_tool()
    def export_application_data(self, application_id: str, export_format: str) -> dict:
        """
        Export application data in a specified format

        Args:
            application_id: Unique identifier of the application
            export_format: Format for export (currently supports 'json')

        Returns:
            dict containing:
                - exported_data: Exported application data in specified format
                - export_timestamp: Timestamp when data was exported in yyyy-mm-dd HH:MM:SS format

        Raises:
            KeyError: If application_id does not exist in the database
            ValueError: If export_format is not supported
        """
        from datetime import datetime
        import json

        # Validate export_format parameter
        supported_formats = ['json']
        if export_format.lower() not in supported_formats:
            raise ValueError(f"Unsupported export format: {export_format}. Supported formats: {supported_formats}")

        # Access the database
        db = self.db

        # Get the job_application table
        job_application_table = getattr(db, 'job_application', None)

        # Check if the table exists and has data
        if job_application_table is None or not isinstance(job_application_table, dict):
            raise KeyError(f"Application with ID '{application_id}' not found")

        # Retrieve the application by application_id
        if application_id not in job_application_table:
            raise KeyError(f"Application with ID '{application_id}' not found")

        application = job_application_table[application_id]

        # Prepare the data for export
        # Convert the application object to a dictionary
        application_dict = {}

        # Iterate through all attributes of the application object
        for field_name in application.model_fields.keys():
            field_value = getattr(application, field_name, None)

            # Convert datetime objects to string format yyyy-mm-dd HH:MM:SS
            if isinstance(field_value, datetime):
                application_dict[field_name] = field_value.strftime('%Y-%m-%d %H:%M:%S')
            else:
                application_dict[field_name] = field_value

        # Export based on the specified format
        if export_format.lower() == 'json':
            # Convert dictionary to JSON string with proper formatting
            exported_data = json.dumps(application_dict, ensure_ascii=False, indent=2)

        # Generate export timestamp
        export_timestamp = datetime.now().strftime('%Y-%m-%d %H:%M:%S')

        # Return the exported data and timestamp
        return {
            'exported_data': exported_data,
            'export_timestamp': export_timestamp
        }

    @is_tool()
    def set_application_deadline(self, application_id: str, deadline_date: str, deadline_type: str = None):
        """
        Set a follow-up or response deadline for a job application.

        Args:
            application_id: Unique identifier of the application
            deadline_date: Deadline date in yyyy-mm-dd HH:MM:SS format
            deadline_type: Type of deadline (e.g., follow_up, response), optional

        Returns:
            dict: Contains application_id and deadline_set status

        Raises:
            KeyError: If application does not exist
            ValueError: If deadline_date format is invalid
        """
        from datetime import datetime

        # Access the database
        db = self.db

        # Validate deadline_date format
        try:
            # Try to parse the deadline_date string to ensure it's valid
            # Support both full datetime format "yyyy-mm-dd HH:MM:SS" and date-only format "yyyy-mm-dd"
            if len(deadline_date.strip()) == 10:  # Date only format
                parsed_deadline = datetime.strptime(deadline_date.strip(), "%Y-%m-%d")
            else:  # Full datetime format
                parsed_deadline = datetime.strptime(deadline_date.strip(), "%Y-%m-%d %H:%M:%S")
        except ValueError as e:
            raise ValueError(f"Invalid deadline_date format. Expected 'yyyy-mm-dd HH:MM:SS' or 'yyyy-mm-dd', got: {deadline_date}") from e

        # Get the job_application table
        job_application_table = getattr(db, 'job_application', None)

        # Check if the table exists
        if job_application_table is None:
            raise KeyError(f"Application table does not exist in database")

        # Check if the application exists
        if application_id not in job_application_table:
            raise KeyError(f"Application with ID '{application_id}' does not exist")

        # Get the application record
        application = job_application_table[application_id]

        # Update the deadline fields
        application.deadline_date = parsed_deadline

        # Set deadline_type if provided, otherwise keep existing or set to None
        if deadline_type is not None:
            application.deadline_type = deadline_type

        # Update the updated_at timestamp
        application.updated_at = datetime.now()

        # Save the updated application back to the database
        job_application_table[application_id] = application
        setattr(db, 'job_application', job_application_table)

        # Return success result
        return {
            'application_id': application_id,
            'deadline_set': True
        }

    @is_tool()
    def match_resume_to_job_description(self, resume_content: str, job_description: str) -> dict:
        """
        Calculate match score between resume and job description by analyzing keyword overlap
        and semantic similarity.

        Args:
            resume_content: Text content of the resume
            job_description: Text content of the job description

        Returns:
            dict containing:
                - match_score: Overall match score (0-100)
                - matched_keywords: Keywords that match between resume and job
                - missing_keywords: Keywords in job description not found in resume

        Raises:
            ValueError: If resume_content or job_description is empty or invalid
        """
        import re
        from collections import Counter

        # Validate input parameters
        if not resume_content or not isinstance(resume_content, str):
            raise ValueError("resume_content must be a non-empty string")
        if not job_description or not isinstance(job_description, str):
            raise ValueError("job_description must be a non-empty string")

        resume_content = resume_content.strip()
        job_description = job_description.strip()

        if not resume_content:
            raise ValueError("resume_content cannot be empty or whitespace only")
        if not job_description:
            raise ValueError("job_description cannot be empty or whitespace only")

        # Define common stop words to filter out
        stop_words = {
            'a', 'an', 'and', 'are', 'as', 'at', 'be', 'by', 'for', 'from', 'has', 'he',
            'in', 'is', 'it', 'its', 'of', 'on', 'that', 'the', 'to', 'was', 'will', 'with',
            'we', 'you', 'your', 'this', 'these', 'those', 'or', 'but', 'not', 'have', 'had',
            'do', 'does', 'did', 'can', 'could', 'would', 'should', 'may', 'might', 'must',
            'our', 'their', 'what', 'which', 'who', 'when', 'where', 'why', 'how', 'all',
            'each', 'every', 'both', 'few', 'more', 'most', 'other', 'some', 'such', 'no',
            'nor', 'only', 'own', 'same', 'so', 'than', 'too', 'very', 'about', 'after',
            'before', 'between', 'during', 'through', 'into', 'out', 'over', 'under', 'up',
            'down', 'off', 'again', 'further', 'then', 'once', 'here', 'there', 'been',
            'being', 'if', 'because', 'while', 'until', 'any', 'also', 'am'
        }

        def extract_keywords(text):
            """
            Extract meaningful keywords from text by:
            1. Converting to lowercase
            2. Extracting words and multi-word phrases
            3. Filtering stop words
            4. Normalizing terms
            """
            text_lower = text.lower()

            # Extract multi-word technical terms and phrases (2-4 words)
            # Common patterns in job descriptions and resumes
            multi_word_patterns = [
                r'\b(?:machine|deep|natural language|computer|software|data|web|mobile|cloud|full stack|front end|back end|devops)\s+(?:learning|processing|vision|science|engineering|development|developer|engineer|architect|analyst)\b',
                r'\b(?:project|product|team|technical|business|data|quality|software)\s+(?:management|manager|lead|leader|analyst|analysis)\b',
                r'\b(?:agile|scrum|waterfall|kanban)\s+(?:methodology|development|framework)\b',
                r'\b(?:rest|graphql|soap)\s+(?:api|apis)\b',
                r'\b(?:unit|integration|end to end|e2e)\s+(?:test|testing|tests)\b',
                r'\b(?:version|source)\s+control\b',
                r'\b(?:continuous|ci/cd)\s+(?:integration|deployment|delivery)\b',
                r'\b(?:object|functional|procedural)\s+(?:oriented|programming)\b'
            ]

            phrases = set()
            for pattern in multi_word_patterns:
                matches = re.findall(pattern, text_lower)
                phrases.update(matches)

            # Extract individual words (alphanumeric with possible hyphens, dots, plus signs)
            # This captures: Python, C++, Node.js, AWS, etc.
            words = re.findall(r'\b[a-z0-9][a-z0-9\-\+\.]*[a-z0-9]\b|\b[a-z0-9]\b', text_lower)

            # Filter out stop words and very short words (< 2 chars) for individual words
            meaningful_words = {
                word for word in words 
                if word not in stop_words and len(word) >= 2
            }

            # Combine phrases and words
            all_keywords = phrases.union(meaningful_words)

            return all_keywords

        def extract_weighted_keywords(text):
            """
            Extract keywords with frequency weighting to identify important terms
            """
            keywords = extract_keywords(text)

            # Count frequency of each keyword in the text
            text_lower = text.lower()
            keyword_freq = {}
            for keyword in keywords:
                # Use word boundary matching for accurate counting
                count = len(re.findall(r'\b' + re.escape(keyword) + r'\b', text_lower))
                keyword_freq[keyword] = count

            return keyword_freq

        # Extract keywords from both texts
        resume_keywords = extract_weighted_keywords(resume_content)
        job_keywords = extract_weighted_keywords(job_description)

        # Identify matched and missing keywords
        matched_keywords = []
        missing_keywords = []

        # For each job requirement keyword, check if it exists in resume
        for job_keyword in job_keywords.keys():
            if job_keyword in resume_keywords:
                matched_keywords.append(job_keyword)
            else:
                missing_keywords.append(job_keyword)

        # Calculate match score based on multiple factors
        if len(job_keywords) == 0:
            # If job description has no meaningful keywords, return low score
            match_score = 0.0
        else:
            # Factor 1: Keyword coverage (what percentage of job keywords are in resume)
            keyword_coverage = len(matched_keywords) / len(job_keywords)

            # Factor 2: Weighted keyword match (considering frequency in job description)
            # More frequently mentioned keywords in job description are more important
            total_job_keyword_weight = sum(job_keywords.values())
            matched_weight = sum(job_keywords[kw] for kw in matched_keywords)
            weighted_coverage = matched_weight / total_job_keyword_weight if total_job_keyword_weight > 0 else 0

            # Factor 3: Resume keyword density (avoid keyword stuffing penalty)
            # If resume has too many keywords not in job description, it might be less focused
            total_resume_keywords = len(resume_keywords)
            if total_resume_keywords > 0:
                focus_score = len(matched_keywords) / total_resume_keywords
                # Cap focus score to avoid penalizing comprehensive resumes
                focus_score = min(focus_score * 2, 1.0)
            else:
                focus_score = 0.0

            # Combine factors with weights
            # Keyword coverage: 50%, Weighted coverage: 35%, Focus: 15%
            match_score = (
                keyword_coverage * 0.50 +
                weighted_coverage * 0.35 +
                focus_score * 0.15
            ) * 100

            # Ensure score is within 0-100 range
            match_score = max(0.0, min(100.0, match_score))

        # Sort matched and missing keywords for consistent output
        matched_keywords.sort()
        missing_keywords.sort()

        return {
            'match_score': round(match_score, 1),
            'matched_keywords': matched_keywords,
            'missing_keywords': missing_keywords
        }

    @is_tool()
    def attach_cover_letter_to_application(self, application_id: str, cover_letter_content: str, uploaded_at: str = None):
        """
        Attach or update cover letter content for a job application.

        This method updates the cover letter content and upload timestamp for an existing job application.
        If no uploaded_at is provided, the current timestamp will be used.

        Args:
            application_id: Unique identifier of the application
            cover_letter_content: Text content of the cover letter
            uploaded_at: Timestamp when the cover letter was uploaded in yyyy-mm-dd HH:MM:SS format (optional)

        Returns:
            dict: Contains application_id and cover_letter_attached status

        Raises:
            KeyError: If the application_id does not exist in the database
            ValueError: If the uploaded_at timestamp format is invalid
        """
        from datetime import datetime

        # Access the database
        db = self.db

        # Retrieve the job_application table
        job_application_table = getattr(db, 'job_application', None)

        # Check if the table exists
        if job_application_table is None:
            raise KeyError(f"Application with ID '{application_id}' not found: job_application table does not exist")

        # Check if the application exists in the table
        if application_id not in job_application_table:
            raise KeyError(f"Application with ID '{application_id}' not found")

        # Retrieve the application record
        application = job_application_table[application_id]

        # Parse the uploaded_at timestamp if provided, otherwise use current time
        if uploaded_at is not None:
            # Validate and parse the timestamp format
            try:
                upload_timestamp = datetime.strptime(uploaded_at, "%Y-%m-%d %H:%M:%S")
            except ValueError:
                # If full datetime format fails, try date-only format
                try:
                    upload_timestamp = datetime.strptime(uploaded_at, "%Y-%m-%d")
                except ValueError:
                    raise ValueError(f"Invalid timestamp format: '{uploaded_at}'. Expected 'yyyy-mm-dd HH:MM:SS' or 'yyyy-mm-dd'")

            # Convert to string format for storage
            upload_timestamp_str = upload_timestamp.strftime("%Y-%m-%d %H:%M:%S")
        else:
            # Use current timestamp if not provided
            upload_timestamp_str = datetime.now().strftime("%Y-%m-%d %H:%M:%S")

        # Update the cover letter content and upload timestamp
        application.cover_letter_content = cover_letter_content
        application.cover_letter_uploaded_at = upload_timestamp_str

        # Update the updated_at timestamp to reflect the modification
        application.updated_at = datetime.now().strftime("%Y-%m-%d %H:%M:%S")

        # Save the updated application back to the database
        job_application_table[application_id] = application
        setattr(db, 'job_application', job_application_table)

        # Return success response
        return {
            'application_id': application_id,
            'cover_letter_attached': True
        }

    @is_tool()
    def track_referral_source(self, application_id: str, referral_source: str, referral_person: str = None) -> dict:
        """
        Track the source or referral for a job application by updating the referral_source
        and referral_person fields in the job_application table.

        Args:
            application_id: Unique identifier of the application to update
            referral_source: Source of the job referral (e.g., LinkedIn, Indeed, employee referral)
            referral_person: Optional name of person who referred the applicant

        Returns:
            Dictionary containing:
                - application_id: The application ID that was updated
                - referral_tracked: Boolean indicating if the referral was successfully tracked

        Raises:
            KeyError: If the application_id does not exist in the database
        """
        from datetime import datetime

        # Access the database
        db = self.db

        # Get the job_application table
        job_application_table = getattr(db, 'job_application', None)

        # Check if the table exists and is not empty
        if job_application_table is None:
            raise KeyError(f"Application with ID '{application_id}' not found - job_application table does not exist")

        # Check if the application exists in the table
        if application_id not in job_application_table:
            raise KeyError(f"Application with ID '{application_id}' not found in the database")

        # Retrieve the application record
        application = job_application_table[application_id]

        # Update the referral_source field (required parameter)
        application.referral_source = referral_source

        # Update the referral_person field if provided (optional parameter)
        if referral_person is not None:
            application.referral_person = referral_person

        # Update the updated_at timestamp to reflect the modification
        # Format: "yyyy-mm-dd HH:MM:SS"
        application.updated_at = datetime.now().strftime("%Y-%m-%d %H:%M:%S")

        # Write the updated data back to the database
        job_application_table[application_id] = application
        setattr(db, 'job_application', job_application_table)

        # Return success response
        return {
            'application_id': application_id,
            'referral_tracked': True
        }

    @is_tool()
    def check_application_deadline(self, deadline_date: str, current_date: str, warning_days: int = 7) -> dict:
        """
        Check if an application deadline has passed or is approaching.

        This method compares the deadline date with the current date to determine:
        1. Whether the deadline has already passed (is_overdue)
        2. Whether the deadline is approaching within the warning period (is_approaching)
        3. How many days remain until the deadline (days_remaining)

        Args:
            deadline_date: Deadline date in yyyy-mm-dd HH:MM:SS format
            current_date: Current date for comparison in yyyy-mm-dd HH:MM:SS format
            warning_days: Number of days before deadline to trigger warning (default: 7)

        Returns:
            dict: Contains is_overdue, is_approaching, and days_remaining

        Raises:
            ValueError: If date formats are invalid or warning_days is negative
        """
        from datetime import datetime

        # Validate warning_days parameter
        if warning_days < 0:
            raise ValueError("warning_days must be a non-negative integer")

        # Parse deadline_date
        try:
            deadline_dt = datetime.strptime(deadline_date.strip(), "%Y-%m-%d %H:%M:%S")
        except ValueError:
            # Try parsing date-only format if full datetime format fails
            try:
                deadline_dt = datetime.strptime(deadline_date.strip(), "%Y-%m-%d")
            except ValueError:
                raise ValueError(f"Invalid deadline_date format: {deadline_date}. Expected format: yyyy-mm-dd HH:MM:SS or yyyy-mm-dd")

        # Parse current_date
        try:
            current_dt = datetime.strptime(current_date.strip(), "%Y-%m-%d %H:%M:%S")
        except ValueError:
            # Try parsing date-only format if full datetime format fails
            try:
                current_dt = datetime.strptime(current_date.strip(), "%Y-%m-%d")
            except ValueError:
                raise ValueError(f"Invalid current_date format: {current_date}. Expected format: yyyy-mm-dd HH:MM:SS or yyyy-mm-dd")

        # Calculate time difference
        time_difference = deadline_dt - current_dt

        # Calculate days remaining (can be negative if overdue)
        # Using total_seconds() and converting to days for precision
        days_remaining = int(time_difference.total_seconds() / 86400)  # 86400 seconds in a day

        # Determine if deadline has passed
        is_overdue = current_dt > deadline_dt

        # Determine if deadline is approaching
        # Deadline is approaching if:
        # 1. It hasn't passed yet (not overdue)
        # 2. The remaining days are within the warning period
        is_approaching = False
        if not is_overdue and 0 <= days_remaining <= warning_days:
            is_approaching = True

        # Return the result dictionary
        return {
            "is_overdue": is_overdue,
            "is_approaching": is_approaching,
            "days_remaining": days_remaining
        }

    @is_tool()
    def add_interview_feedback(self, interview_id: str, feedback_content: str, created_at: str, performance_rating: Optional[int] = None) -> dict:
        """
        Add feedback or notes after an interview

        Args:
            interview_id: Unique identifier of the interview
            feedback_content: Content of the feedback
            created_at: Timestamp when feedback was created in yyyy-mm-dd HH:MM:SS format
            performance_rating: Optional self-assessment rating of interview performance

        Returns:
            Dictionary containing feedback_id and interview_id

        Raises:
            KeyError: If the interview does not exist in the system
            ValueError: If created_at format is invalid or performance_rating is out of valid range
        """
        import secrets
        import hashlib
        from datetime import datetime

        # Access the database
        db = self.db

        # Validate that interview exists in the system
        # Get interview_schedule table to verify interview exists
        interview_schedule_table = getattr(db, 'interview_schedule', None)
        if interview_schedule_table is None:
            raise KeyError(f"Interview with ID '{interview_id}' does not exist in the system")

        # Check if the interview_id exists in interview_schedule table
        if interview_id not in interview_schedule_table:
            raise KeyError(f"Interview with ID '{interview_id}' does not exist in the system")

        # Validate created_at timestamp format
        try:
            created_at_datetime = datetime.strptime(created_at, "%Y-%m-%d %H:%M:%S")
        except ValueError as e:
            raise ValueError(f"Invalid created_at format. Expected 'yyyy-mm-dd HH:MM:SS', got '{created_at}'") from e

        # Validate performance_rating if provided (should be in reasonable range, e.g., 1-5)
        if performance_rating is not None:
            if not isinstance(performance_rating, int):
                raise ValueError(f"performance_rating must be an integer, got {type(performance_rating).__name__}")
            if performance_rating < 1 or performance_rating > 5:
                raise ValueError(f"performance_rating must be between 1 and 5, got {performance_rating}")

        # Validate feedback_content is not empty
        if not feedback_content or not feedback_content.strip():
            raise ValueError("feedback_content cannot be empty")

        # Generate unique feedback_id with proper format
        timestamp = datetime.now().strftime("%Y%m%d%H%M%S")
        random_suffix = secrets.token_hex(3).upper()
        feedback_id = f"FEEDBACK-{timestamp[:4]}-{random_suffix}"

        # Create new InterviewFeedback instance
        new_feedback = InterviewFeedback(
            feedback_id=feedback_id,
            interview_id=interview_id,
            feedback_content=feedback_content,
            performance_rating=performance_rating,
            created_at=created_at_datetime
        )

        # Get interview_feedback table
        interview_feedback_table = getattr(db, 'interview_feedback', None)

        # Initialize table if it doesn't exist
        if interview_feedback_table is None:
            interview_feedback_table = {}

        # Add new feedback to the table
        interview_feedback_table[feedback_id] = new_feedback

        # Update the database with the new feedback
        setattr(db, 'interview_feedback', interview_feedback_table)

        # Return the feedback_id and interview_id
        return {
            'feedback_id': feedback_id,
            'interview_id': interview_id
        }

    @is_tool()
    def get_application_interviews(self, application_id: str) -> dict:
        """
        Retrieve all interview schedules for a job application

        Args:
            application_id: Unique identifier of the application

        Returns:
            Dictionary containing list of interviews with their details

        Raises:
            KeyError: If application_id does not exist in the system
        """
        # Access the database instance
        db = self.db

        # Get the job_application table to verify application exists
        job_application_table = getattr(db, 'job_application', None)
        if job_application_table is None:
            raise KeyError(f"Job application table not found in database")

        # Verify the application exists (pre-condition check)
        if application_id not in job_application_table:
            raise KeyError(f"Application with application_id '{application_id}' does not exist in the system")

        # Get the interview_schedule table from database
        interview_schedule_table = getattr(db, 'interview_schedule', None)
        if interview_schedule_table is None:
            raise KeyError(f"Interview schedule table not found in database")

        # Initialize the result list to store matching interviews
        interviews_list = []

        # Iterate through all interview records in the table
        for interview_id, interview_obj in interview_schedule_table.items():
            # Check if this interview belongs to the requested application
            if interview_obj.application_id == application_id:
                # Format the interview_date from datetime object to string format "yyyy-mm-dd HH:MM:SS"
                formatted_date = interview_obj.interview_date.strftime("%Y-%m-%d %H:%M:%S")

                # Build the interview dictionary with all required fields
                interview_dict = {
                    'interview_id': interview_obj.interview_id,
                    'interview_type': interview_obj.interview_type,
                    'interview_date': formatted_date,
                    'interviewer_name': interview_obj.interviewer_name if interview_obj.interviewer_name else '',
                    'interview_location': interview_obj.interview_location if interview_obj.interview_location else ''
                }

                # Add the interview to the result list
                interviews_list.append(interview_dict)

        # Sort interviews by interview_date to provide chronological order
        interviews_list.sort(key=lambda x: x['interview_date'])

        # Return the result in the expected format (empty list if no interviews found)
        return {
            'interviews': interviews_list
        }

    @is_tool()
    def validate_application_completeness(self, application_id: str) -> dict:
        """
        Check if a job application has all required fields and documents.

        This method validates that an application has all mandatory information needed
        for submission, including basic applicant info, job details, and required documents.

        Args:
            application_id: Unique identifier of the application to validate

        Returns:
            dict: Validation result containing:
                - is_complete: Boolean indicating if application is complete
                - missing_fields: List of missing required field names
                - validation_message: Detailed message about validation status

        Raises:
            KeyError: If the application_id does not exist in the database
        """
        # Access the database
        db = self.db

        # Retrieve the job_application table
        job_application_table = getattr(db, "job_application", None)

        # Check if the table exists
        if job_application_table is None:
            raise KeyError(f"Application table not found in database")

        # Check if the application exists
        if application_id not in job_application_table:
            raise KeyError(f"Application with ID '{application_id}' not found")

        # Get the application record
        application = job_application_table[application_id]

        # Define required fields for a complete application
        # Based on the schema, these are the non-optional core fields plus critical documents
        required_fields = {
            'applicant_name': application.applicant_name,
            'email': application.email,
            'job_title': application.job_title,
            'company_name': application.company_name,
            'application_date': application.application_date,
            'resume_content': application.resume_content,  # Resume is critical for job applications
            'cover_letter_content': application.cover_letter_content  # Cover letter is typically required
        }

        # Track missing fields
        missing_fields = []

        # Check each required field
        for field_name, field_value in required_fields.items():
            # Check if field is None, empty string, or whitespace-only
            if field_value is None or (isinstance(field_value, str) and not field_value.strip()):
                missing_fields.append(field_name)

        # Determine if application is complete
        is_complete = len(missing_fields) == 0

        # Generate validation message
        if is_complete:
            validation_message = "Application is complete and ready for submission"
        else:
            # Create a human-readable list of missing fields
            missing_list = ", ".join(missing_fields)
            validation_message = f"Application is incomplete. Missing required fields: {missing_list}"

        # Return validation result
        return {
            'is_complete': is_complete,
            'missing_fields': missing_fields,
            'validation_message': validation_message
        }

    @is_tool()
    def batch_update_application_status(self, application_ids: list, new_status: str, updated_at: str) -> dict:
        """
        Update status for multiple applications at once

        Args:
            application_ids: List of application identifiers to update
            new_status: New status to apply to all applications
            updated_at: Timestamp of the batch update in yyyy-mm-dd HH:MM:SS format

        Returns:
            dict: Contains updated_count (number of successfully updated applications) 
                  and failed_updates (list of application IDs that failed to update)

        Raises:
            ValueError: If parameters are invalid or applications don't exist
        """
        from datetime import datetime

        # Validate input parameters
        if not application_ids:
            raise ValueError("application_ids cannot be empty")

        if not isinstance(application_ids, list):
            raise ValueError("application_ids must be a list")

        if not new_status or not isinstance(new_status, str):
            raise ValueError("new_status must be a non-empty string")

        if not updated_at or not isinstance(updated_at, str):
            raise ValueError("updated_at must be a non-empty string")

        # Parse and validate the updated_at timestamp
        try:
            update_datetime = datetime.strptime(updated_at, "%Y-%m-%d %H:%M:%S")
            formatted_updated_at = update_datetime.strftime("%Y-%m-%d %H:%M:%S")
        except ValueError:
            raise ValueError("updated_at must be in 'yyyy-mm-dd HH:MM:SS' format")

        # Access the database
        db = self.db
        job_application_table = getattr(db, "job_application", None)

        if job_application_table is None:
            raise ValueError("job_application table not found in database")

        # Initialize tracking variables
        updated_count = 0
        failed_updates = []

        # Process each application ID
        for app_id in application_ids:
            try:
                # Check if the application exists
                if app_id not in job_application_table:
                    # Application doesn't exist, add to failed list
                    failed_updates.append(app_id)
                    continue

                # Retrieve the application record
                application = job_application_table[app_id]

                # Update the status and updated_at timestamp (as string)
                application.status = new_status
                application.updated_at = formatted_updated_at

                # Save the updated application back to the database
                job_application_table[app_id] = application

                # Increment successful update count
                updated_count += 1

            except Exception:
                # If any error occurs during update, add to failed list
                failed_updates.append(app_id)
                continue

        # Update the database table
        setattr(db, "job_application", job_application_table)

        # Return the results
        return {
            "updated_count": updated_count,
            "failed_updates": failed_updates
        }

    @is_tool()
    def calculate_interview_preparation_time(self, current_date: str, interview_date: str) -> dict:
        """
        Calculate the time available for interview preparation.

        This method computes the time difference between the current date and the scheduled
        interview date, providing information about days and hours until the interview,
        as well as whether the interview is urgent (within 48 hours).

        Args:
            current_date: Current date and time in yyyy-mm-dd HH:MM:SS format
            interview_date: Scheduled interview date and time in yyyy-mm-dd HH:MM:SS format

        Returns:
            dict: A dictionary containing:
                - days_until_interview: Number of complete days until the interview
                - hours_until_interview: Total hours until the interview (rounded down)
                - is_urgent: Boolean indicating if interview is within 48 hours

        Raises:
            ValueError: If date format is invalid or interview_date is before current_date
        """
        from datetime import datetime

        # Validate and parse input date strings
        try:
            # Parse current_date string to datetime object
            current_dt = datetime.strptime(current_date, "%Y-%m-%d %H:%M:%S")
        except ValueError as e:
            raise ValueError(f"Invalid current_date format. Expected yyyy-mm-dd HH:MM:SS, got: {current_date}") from e

        try:
            # Parse interview_date string to datetime object
            interview_dt = datetime.strptime(interview_date, "%Y-%m-%d %H:%M:%S")
        except ValueError as e:
            raise ValueError(f"Invalid interview_date format. Expected yyyy-mm-dd HH:MM:SS, got: {interview_date}") from e

        # Validate that interview_date is not in the past
        if interview_dt < current_dt:
            raise ValueError(f"Interview date ({interview_date}) cannot be before current date ({current_date})")

        # Calculate time difference
        time_delta = interview_dt - current_dt

        # Calculate days until interview (complete days only)
        # total_seconds() returns the total number of seconds in the timedelta
        # dividing by 86400 (seconds in a day) and using int() gives complete days
        days_until_interview = int(time_delta.total_seconds() // 86400)

        # Calculate total hours until interview (rounded down)
        # dividing total seconds by 3600 (seconds in an hour) gives total hours
        hours_until_interview = int(time_delta.total_seconds() // 3600)

        # Determine if interview is urgent (within 48 hours)
        # 48 hours = 48 * 3600 = 172800 seconds
        is_urgent = time_delta.total_seconds() <= 172800

        # Return the calculated preparation time information
        return {
            "days_until_interview": days_until_interview,
            "hours_until_interview": hours_until_interview,
            "is_urgent": is_urgent
        }

    @is_tool()
    def search_applications_by_keyword(self, keyword: str, search_fields: Optional[list] = None) -> dict:
        """
        Search applications using keywords in job title or company name.
        Uses fuzzy matching for natural language text fields to improve search robustness.

        Args:
            keyword: Keyword to search for in the specified fields
            search_fields: Optional list of fields to search in. If not provided, defaults to ['job_title', 'company_name']

        Returns:
            Dictionary containing:
            - matching_applications: List of matching application records with application_id, job_title, and company_name
            - total_matches: Total number of matching applications

        Raises:
            ValueError: If keyword is empty or invalid, or if search_fields contains invalid field names
        """
        from thefuzz import fuzz

        # Validate keyword parameter
        if not keyword or not isinstance(keyword, str) or not keyword.strip():
            raise ValueError("Keyword must be a non-empty string")

        keyword = keyword.strip()

        # Set default search fields if not provided
        if search_fields is None:
            search_fields = ['job_title', 'company_name']

        # Validate search_fields parameter
        if not isinstance(search_fields, list) or len(search_fields) == 0:
            raise ValueError("search_fields must be a non-empty list")

        # Define valid searchable fields (natural language text fields that support fuzzy matching)
        valid_fields = ['job_title', 'company_name', 'applicant_name', 'referral_source', 
                        'referral_person', 'priority_reason', 'resume_content', 'cover_letter_content']

        # Validate that all search_fields are valid
        for field in search_fields:
            if field not in valid_fields:
                raise ValueError(f"Invalid search field: {field}. Valid fields are: {valid_fields}")

        # Access the database
        db = self.db
        job_application_table = getattr(db, 'job_application', None)

        # If table doesn't exist or is empty, return empty results
        if job_application_table is None or len(job_application_table) == 0:
            return {
                'matching_applications': [],
                'total_matches': 0
            }

        # Perform fuzzy search across all applications
        matching_applications = []

        # Define similarity threshold for fuzzy matching (can be adjusted based on requirements)
        SIMILARITY_THRESHOLD = 60

        for app_id, application in job_application_table.items():
            # Check if any of the search fields match the keyword using fuzzy matching
            is_match = False

            for field in search_fields:
                # Get field value from application
                field_value = getattr(application, field, None)

                # Skip if field value is None or empty
                if field_value is None or (isinstance(field_value, str) and not field_value.strip()):
                    continue

                # Convert field value to string for comparison
                field_value_str = str(field_value)

                # Use fuzzy matching for natural language text fields
                # Use partial_ratio for better substring matching
                similarity_score = fuzz.partial_ratio(keyword.lower(), field_value_str.lower())

                # If similarity score exceeds threshold, consider it a match
                if similarity_score >= SIMILARITY_THRESHOLD:
                    is_match = True
                    break

            # If match found, add to results
            if is_match:
                matching_applications.append({
                    'application_id': application.application_id,
                    'job_title': application.job_title,
                    'company_name': application.company_name
                })

        # Return results with total count
        return {
            'matching_applications': matching_applications,
            'total_matches': len(matching_applications)
        }

    @is_tool()
    def archive_old_applications(self, cutoff_date: str, archive_status: str = "archived") -> dict:
        """
        Archive applications older than a specified date by updating their status.

        This method finds all job applications with application_date before the cutoff_date
        and updates their status to the specified archive_status (default: 'archived').

        Args:
            cutoff_date: Date before which applications should be archived in yyyy-mm-dd format
            archive_status: Status to set for archived applications (default: 'archived')

        Returns:
            dict: Contains 'archived_count' (number of applications archived) and 
                  'archived_application_ids' (list of archived application IDs)

        Raises:
            ValueError: If cutoff_date format is invalid or if no job_application table exists
        """
        from datetime import datetime

        # Validate cutoff_date format
        try:
            # Parse the cutoff_date string to datetime object (only date part, no time)
            cutoff_datetime = datetime.strptime(cutoff_date, "%Y-%m-%d")
        except ValueError as e:
            raise ValueError(f"Invalid cutoff_date format. Expected yyyy-mm-dd, got: {cutoff_date}") from e

        # Access the database
        db = self.db

        # Get the job_application table
        job_application_table = getattr(db, "job_application", None)

        # Validate that the table exists
        if job_application_table is None:
            raise ValueError("job_application table does not exist in the database")

        # Initialize tracking variables
        archived_count = 0
        archived_application_ids = []

        # Iterate through all applications in the table
        for application_id, application in job_application_table.items():
            # Check if application_date is before the cutoff_date
            # Compare only the date part (ignore time component)
            if application.application_date.date() < cutoff_datetime.date():
                # Update the application status to archive_status
                application.status = archive_status

                # Update the updated_at timestamp to current time
                application.updated_at = datetime.now()

                # Track the archived application
                archived_count += 1
                archived_application_ids.append(application_id)

        # Write the updated table back to the database
        # This persists all the status changes we made above
        setattr(db, "job_application", job_application_table)

        # Return the results
        return {
            "archived_count": archived_count,
            "archived_application_ids": archived_application_ids
        }

    @is_tool()
    def calculate_application_roi(
        self,
        total_applications: int,
        total_interviews: int,
        total_offers: int,
        average_time_per_application_hours: float = None
    ) -> dict:
        """
        Calculate return on investment metrics for job applications.

        This method computes various conversion rates and time investment metrics
        to help job seekers understand the effectiveness of their application efforts.

        Args:
            total_applications: Total number of applications submitted
            total_interviews: Total number of interviews received
            total_offers: Total number of offers received
            average_time_per_application_hours: Average time spent per application in hours (optional)

        Returns:
            dict: A dictionary containing:
                - interview_conversion_rate: Percentage of applications leading to interviews
                - offer_conversion_rate: Percentage of applications leading to offers
                - interview_to_offer_rate: Percentage of interviews leading to offers
                - total_time_invested_hours: Total time invested in applications (if average_time provided)

        Raises:
            ValueError: If any input values are invalid
        """
        # Validate input parameters - must be non-negative integers
        if not isinstance(total_applications, int) or total_applications < 0:
            raise ValueError("total_applications must be a non-negative integer")

        if not isinstance(total_interviews, int) or total_interviews < 0:
            raise ValueError("total_interviews must be a non-negative integer")

        if not isinstance(total_offers, int) or total_offers < 0:
            raise ValueError("total_offers must be a non-negative integer")

        # Validate optional parameter if provided
        if average_time_per_application_hours is not None:
            if not isinstance(average_time_per_application_hours, (int, float)) or average_time_per_application_hours < 0:
                raise ValueError("average_time_per_application_hours must be a non-negative number")

        # Validate logical constraints - interviews and offers cannot exceed applications
        if total_interviews > total_applications:
            raise ValueError("total_interviews cannot exceed total_applications")

        if total_offers > total_applications:
            raise ValueError("total_offers cannot exceed total_applications")

        # Validate that offers cannot exceed interviews (you can't get an offer without an interview)
        if total_offers > total_interviews:
            raise ValueError("total_offers cannot exceed total_interviews")

        # Initialize result dictionary
        result = {}

        # Calculate interview conversion rate (applications -> interviews)
        # This represents the percentage of applications that resulted in an interview
        if total_applications > 0:
            interview_conversion_rate = (total_interviews / total_applications) * 100
        else:
            # If no applications were submitted, conversion rate is 0
            interview_conversion_rate = 0.0

        result['interview_conversion_rate'] = round(interview_conversion_rate, 2)

        # Calculate offer conversion rate (applications -> offers)
        # This represents the percentage of applications that resulted in a job offer
        if total_applications > 0:
            offer_conversion_rate = (total_offers / total_applications) * 100
        else:
            # If no applications were submitted, conversion rate is 0
            offer_conversion_rate = 0.0

        result['offer_conversion_rate'] = round(offer_conversion_rate, 2)

        # Calculate interview to offer rate (interviews -> offers)
        # This represents the percentage of interviews that resulted in a job offer
        if total_interviews > 0:
            interview_to_offer_rate = (total_offers / total_interviews) * 100
        else:
            # If no interviews were conducted, conversion rate is 0
            interview_to_offer_rate = 0.0

        result['interview_to_offer_rate'] = round(interview_to_offer_rate, 2)

        # Calculate total time invested if average time per application is provided
        # This helps job seekers understand their time investment
        if average_time_per_application_hours is not None:
            total_time_invested_hours = total_applications * average_time_per_application_hours
            result['total_time_invested_hours'] = round(total_time_invested_hours, 2)

        return result

    @is_tool()
    def merge_duplicate_applications(self, primary_application_id: str, secondary_application_id: str) -> dict:
        from datetime import datetime

        # Access the database
        db = self.db

        # Get the job_application table
        job_application_table = getattr(db, 'job_application', None)

        # Check if the table exists
        if job_application_table is None:
            raise KeyError(f"Table 'job_application' does not exist in the database")

        # Check if both applications exist
        if primary_application_id not in job_application_table:
            raise KeyError(f"Primary application with ID '{primary_application_id}' does not exist")

        if secondary_application_id not in job_application_table:
            raise KeyError(f"Secondary application with ID '{secondary_application_id}' does not exist")

        # Get both application records (these are JobApplication objects, not dicts)
        primary_app = job_application_table[primary_application_id]
        secondary_app = job_application_table[secondary_application_id]

        # Merge logic: Update primary application with non-null values from secondary application
        # Priority: keep primary's data, but fill in missing (None) fields from secondary

        # Merge optional fields - only update if primary field is None and secondary has a value
        if getattr(primary_app, 'phone', None) is None and getattr(secondary_app, 'phone', None) is not None:
            primary_app.phone = secondary_app.phone

        if getattr(primary_app, 'resume_content', None) is None and getattr(secondary_app, 'resume_content', None) is not None:
            primary_app.resume_content = secondary_app.resume_content
            primary_app.resume_format = getattr(secondary_app, 'resume_format', None)
            primary_app.resume_uploaded_at = getattr(secondary_app, 'resume_uploaded_at', None)

        if getattr(primary_app, 'cover_letter_content', None) is None and getattr(secondary_app, 'cover_letter_content', None) is not None:
            primary_app.cover_letter_content = secondary_app.cover_letter_content
            primary_app.cover_letter_uploaded_at = getattr(secondary_app, 'cover_letter_uploaded_at', None)

        if getattr(primary_app, 'deadline_date', None) is None and getattr(secondary_app, 'deadline_date', None) is not None:
            primary_app.deadline_date = secondary_app.deadline_date
            primary_app.deadline_type = getattr(secondary_app, 'deadline_type', None)

        if getattr(primary_app, 'referral_source', None) is None and getattr(secondary_app, 'referral_source', None) is not None:
            primary_app.referral_source = secondary_app.referral_source

        if getattr(primary_app, 'referral_person', None) is None and getattr(secondary_app, 'referral_person', None) is not None:
            primary_app.referral_person = secondary_app.referral_person

        # For priority, keep higher priority level
        secondary_priority = getattr(secondary_app, 'priority_level', None)
        if secondary_priority is not None:
            primary_priority = getattr(primary_app, 'priority_level', None)
            if primary_priority is None or secondary_priority > primary_priority:
                primary_app.priority_level = secondary_priority
                primary_app.priority_reason = getattr(secondary_app, 'priority_reason', None)

        # For salary expectations, use wider range (lower min, higher max)
        secondary_min = getattr(secondary_app, 'expected_salary_min', None)
        if secondary_min is not None:
            primary_min = getattr(primary_app, 'expected_salary_min', None)
            if primary_min is None:
                primary_app.expected_salary_min = secondary_min
            else:
                primary_app.expected_salary_min = min(float(primary_min), float(secondary_min))

        secondary_max = getattr(secondary_app, 'expected_salary_max', None)
        if secondary_max is not None:
            primary_max = getattr(primary_app, 'expected_salary_max', None)
            if primary_max is None:
                primary_app.expected_salary_max = secondary_max
            else:
                primary_app.expected_salary_max = max(float(primary_max), float(secondary_max))

        if getattr(primary_app, 'salary_currency', None) is None and getattr(secondary_app, 'salary_currency', None) is not None:
            primary_app.salary_currency = secondary_app.salary_currency

        # Use the earlier application date (the first one submitted)
        # Convert to datetime objects if they are strings
        primary_date = datetime.strptime(primary_app.application_date, "%Y-%m-%d %H:%M:%S") if isinstance(primary_app.application_date, str) else primary_app.application_date
        secondary_date = datetime.strptime(secondary_app.application_date, "%Y-%m-%d %H:%M:%S") if isinstance(secondary_app.application_date, str) else secondary_app.application_date

        if secondary_date < primary_date:
            primary_app.application_date = secondary_app.application_date

        # Use the earlier created_at timestamp
        primary_created = datetime.strptime(primary_app.created_at, "%Y-%m-%d %H:%M:%S") if isinstance(primary_app.created_at, str) else primary_app.created_at
        secondary_created = datetime.strptime(secondary_app.created_at, "%Y-%m-%d %H:%M:%S") if isinstance(secondary_app.created_at, str) else secondary_app.created_at

        if secondary_created < primary_created:
            primary_app.created_at = secondary_app.created_at

        # Update the updated_at timestamp to current time
        primary_app.updated_at = datetime.now().strftime("%Y-%m-%d %H:%M:%S")

        # Update the primary application in the database
        job_application_table[primary_application_id] = primary_app

        # Remove the secondary application from the database
        del job_application_table[secondary_application_id]

        # Return the merge result
        return {
            'merged_application_id': primary_application_id,
            'merge_status': 'merged'
        }

    @is_tool()
    def list_applications_by_applicant(self, email: str):
        """
        Retrieve all job applications submitted by a specific applicant

        This method searches for all applications matching the provided email address
        and returns them with their key details in a standardized format.

        Args:
            email: Email address of the applicant

        Returns:
            Dictionary containing:
            - applications: List of application details (application_id, job_title, 
              company_name, status, application_date)
            - total_count: Total number of applications found

        Raises:
            ValueError: If email parameter is empty or invalid
        """
        from datetime import datetime

        # Validate input parameter
        if not email or not isinstance(email, str):
            raise ValueError("Email address must be a non-empty string")

        # Strip whitespace from email for better matching
        email = email.strip()

        if not email:
            raise ValueError("Email address cannot be empty or whitespace only")

        # Access the database
        db = self.db

        # Get the job_application table data
        job_application_table = getattr(db, 'job_application', None)

        # If table doesn't exist or is empty, return empty result
        if job_application_table is None or len(job_application_table) == 0:
            return {
                'applications': [],
                'total_count': 0
            }

        # List to store matching applications
        matching_applications = []

        # Iterate through all applications in the table
        # job_application_table is a Dict[str, JobApplication] where key is application_id
        for application_id, application in job_application_table.items():
            # Check if the email matches (case-insensitive comparison for robustness)
            if application.email.lower() == email.lower():
                # Format application_date to required string format "yyyy-mm-dd HH:MM:SS"
                application_date_str = application.application_date.strftime("%Y-%m-%d %H:%M:%S")

                # Build the application detail dictionary
                application_detail = {
                    'application_id': application.application_id,
                    'job_title': application.job_title,
                    'company_name': application.company_name,
                    'status': application.status,
                    'application_date': application_date_str
                }

                matching_applications.append(application_detail)

        # Sort applications by application_date in descending order (most recent first)
        # This provides a better user experience
        matching_applications.sort(
            key=lambda x: datetime.strptime(x['application_date'], "%Y-%m-%d %H:%M:%S"),
            reverse=True
        )

        # Return the result with applications list and total count
        return {
            'applications': matching_applications,
            'total_count': len(matching_applications)
        }

    @is_tool()
    def set_application_priority(self, application_id: str, priority_level: int, priority_reason: str = None) -> dict:
        """
        Set priority level for a job application

        This method updates the priority_level and priority_reason fields for an existing
        job application in the database. It validates the priority level range (1-5) and
        ensures the application exists before updating.

        Args:
            application_id: Unique identifier of the application to update
            priority_level: Priority level (1-5, where 5 is highest priority)
            priority_reason: Optional reason explaining why this priority was assigned

        Returns:
            dict: Contains application_id and priority_set status
                {
                    'application_id': str,
                    'priority_set': bool
                }

        Raises:
            KeyError: If the application_id does not exist in the database
            ValueError: If priority_level is not in valid range (1-5)
        """
        from datetime import datetime

        # Validate priority_level is within valid range (1-5)
        if not isinstance(priority_level, int) or priority_level < 1 or priority_level > 5:
            raise ValueError(f"priority_level must be an integer between 1 and 5, got: {priority_level}")

        # Access the database
        db = self.db

        # Get the job_application table from database
        job_application_table = getattr(db, 'job_application', None)

        # Check if table exists and is not empty
        if job_application_table is None:
            raise KeyError(f"Application with application_id '{application_id}' does not exist")

        # Check if the application exists in the table
        if application_id not in job_application_table:
            raise KeyError(f"Application with application_id '{application_id}' does not exist")

        # Retrieve the application record
        application = job_application_table[application_id]

        # Update the priority_level field
        application.priority_level = priority_level

        # Update the priority_reason field if provided
        if priority_reason is not None:
            application.priority_reason = priority_reason

        # Update the updated_at timestamp to reflect the modification
        application.updated_at = datetime.now().strftime('%Y-%m-%d %H:%M:%S')

        # Write the updated application back to the database
        job_application_table[application_id] = application
        setattr(db, 'job_application', job_application_table)

        # Return success response
        return {
            'application_id': application_id,
            'priority_set': True
        }

    @is_tool()
    def validate_contact_information(self, email: str = None, phone: str = None) -> dict:
        """
        Validate the format of contact information (email and phone number).

        This method validates email and phone formats independently and returns
        detailed validation results including any errors found.

        Args:
            email: Email address to validate (optional)
            phone: Phone number to validate (optional)

        Returns:
            dict: Dictionary containing validation results with keys:
                - email_valid (bool): Whether email format is valid
                - phone_valid (bool): Whether phone format is valid
                - validation_errors (list): List of validation error messages

        Raises:
            ValueError: If both email and phone are None/empty
        """
        import re

        # Initialize result dictionary
        result = {
            'email_valid': False,
            'phone_valid': False,
            'validation_errors': []
        }

        # Check if at least one contact method is provided
        if not email and not phone:
            raise ValueError("At least one contact information (email or phone) must be provided for validation")

        # Validate email if provided
        if email is not None:
            # Email validation regex pattern
            # Pattern explanation:
            # - Start with alphanumeric, dot, underscore, percent, plus, or hyphen
            # - Must have @ symbol
            # - Domain part with alphanumeric and hyphens
            # - Must have dot followed by 2+ letter TLD
            email_pattern = r'^[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\.[a-zA-Z]{2,}$'

            if not isinstance(email, str):
                result['validation_errors'].append("Email must be a string")
            elif not email.strip():
                result['validation_errors'].append("Email cannot be empty")
            elif re.match(email_pattern, email.strip()):
                result['email_valid'] = True
            else:
                result['validation_errors'].append("Invalid email format. Expected format: user@domain.com")
        else:
            # If email is not provided, mark as valid (not applicable)
            result['email_valid'] = True

        # Validate phone if provided
        if phone is not None:
            # Phone validation regex patterns
            # Support multiple common formats:
            # - International: +1-555-0123, +86 138 0000 0000
            # - With parentheses: (555) 123-4567
            # - With dots: 555.123.4567
            # - With spaces: 555 123 4567
            # - Plain digits: 5551234567
            # Pattern allows optional country code (+), parentheses, spaces, hyphens, and dots
            phone_pattern = r'^\+?[\d\s\-\(\)\.]{7,20}$'

            if not isinstance(phone, str):
                result['validation_errors'].append("Phone must be a string")
            elif not phone.strip():
                result['validation_errors'].append("Phone cannot be empty")
            else:
                phone_stripped = phone.strip()
                # Check basic pattern match
                if re.match(phone_pattern, phone_stripped):
                    # Extract only digits to verify minimum length
                    digits_only = re.sub(r'\D', '', phone_stripped)
                    if len(digits_only) >= 7:  # Minimum 7 digits for a valid phone
                        result['phone_valid'] = True
                    else:
                        result['validation_errors'].append("Phone number must contain at least 7 digits")
                else:
                    result['validation_errors'].append("Invalid phone format. Expected formats: +1-555-0123, (555) 123-4567, 555.123.4567, etc.")
        else:
            # If phone is not provided, mark as valid (not applicable)
            result['phone_valid'] = True

        return result

    @is_tool()
    def track_application_stage(self, application_id: str, stage_name: str, stage_date: str, stage_notes: str = None) -> dict:
        """
        Record the current stage of the application process.

        This method creates a new application stage record in the database, tracking the progression
        of a job application through various hiring stages (e.g., phone_screening, technical_interview).

        Args:
            application_id: Unique identifier of the application
            stage_name: Name of the application stage
            stage_date: Date when the stage was reached in yyyy-mm-dd HH:MM:SS format
            stage_notes: Optional additional notes about the stage

        Returns:
            dict: Contains stage_id and application_id of the newly created stage record

        Raises:
            KeyError: If the application_id does not exist in the system
            ValueError: If stage_date format is invalid
        """
        import secrets
        import hashlib
        from datetime import datetime

        # Access the database instance
        db = self.db

        # Validate that stage_date is in the correct format
        try:
            parsed_stage_date = datetime.strptime(stage_date, "%Y-%m-%d %H:%M:%S")
        except ValueError:
            raise ValueError(f"Invalid stage_date format: {stage_date}. Expected format: yyyy-mm-dd HH:MM:SS")

        # Check if application exists in the system
        # According to pre_condition, application must exist in the system
        # We need to verify the application_id exists in job_application table
        job_application_table = getattr(db, "job_application", None)

        if job_application_table is None or application_id not in job_application_table:
            raise KeyError(f"Application with application_id '{application_id}' does not exist in the system")

        # Get the application_stage table data
        application_stage_table = getattr(db, "application_stage", None)

        if application_stage_table is None:
            application_stage_table = {}

        # Generate a unique stage_id
        # Use a format similar to the example: STAGE-2024-001
        # Generate sequential number based on existing stages
        existing_stage_ids = [sid for sid in application_stage_table.keys() if sid.startswith("STAGE-")]

        if existing_stage_ids:
            # Extract numbers and find the maximum
            numbers = []
            for sid in existing_stage_ids:
                try:
                    # Extract the numeric part after the last hyphen
                    num_part = sid.split("-")[-1]
                    numbers.append(int(num_part))
                except (ValueError, IndexError):
                    continue

            if numbers:
                next_num = max(numbers) + 1
            else:
                next_num = 1
        else:
            next_num = 1

        # Format stage_id to match example format: STAGE-2024-001
        from datetime import datetime as dt
        current_year = dt.now().year
        stage_id = f"STAGE-{current_year}-{next_num:03d}"

        # Create the new ApplicationStage instance
        new_stage = ApplicationStage(
            stage_id=stage_id,
            application_id=application_id,
            stage_name=stage_name,
            stage_date=parsed_stage_date,
            stage_notes=stage_notes
        )

        # Add the new stage to the table
        application_stage_table[stage_id] = new_stage

        # Write the updated table back to the database
        setattr(db, "application_stage", application_stage_table)

        # Return the stage_id and application_id as specified in the returns schema
        return {
            "stage_id": stage_id,
            "application_id": application_id
        }

    @is_tool()
    def get_application_details(self, application_id: str):
        """
        Retrieve complete details of a specific job application

        This method fetches all details of a job application from the database
        and returns them in the required format with datetime fields converted
        to string format.

        Args:
            application_id: Unique identifier of the application to retrieve

        Returns:
            dict: Application details including:
                - application_id: Unique identifier of the application
                - applicant_name: Full name of the applicant
                - applicant_email: Email address of the applicant
                - job_title: Title of the job position
                - company_name: Name of the company
                - status: Current status of the application
                - application_date: Date of application submission in yyyy-mm-dd HH:MM:SS format

        Raises:
            KeyError: If the application_id does not exist in the database
        """
        # Validate input parameter
        if not application_id or not isinstance(application_id, str):
            raise ValueError("application_id must be a non-empty string")

        # Access the database
        db = self.db

        # Get the job_application table
        job_application_table = getattr(db, 'job_application', None)

        # Check if the table exists
        if job_application_table is None:
            raise KeyError(f"Application with ID '{application_id}' not found: job_application table does not exist")

        # Check if the application exists in the table
        if application_id not in job_application_table:
            raise KeyError(f"Application with ID '{application_id}' not found")

        # Retrieve the application record
        application = job_application_table[application_id]

        # Convert application_date from datetime object to string format
        # The database stores datetime objects, but we need to return string format
        application_date_str = application.application_date.strftime("%Y-%m-%d %H:%M:%S")

        # Build and return the result dictionary with required fields
        result = {
            'application_id': application.application_id,
            'applicant_name': application.applicant_name,
            'applicant_email': application.email,  # Note: database field is 'email', return field is 'applicant_email'
            'job_title': application.job_title,
            'company_name': application.company_name,
            'status': application.status,
            'application_date': application_date_str
        }

        return result

    @is_tool()
    def get_application_stage_history(self, application_id: str) -> dict:
        """
        Retrieve the complete stage progression history of an application.

        This method fetches all stage records associated with a given application ID,
        sorts them chronologically by stage_date, and returns them in a structured format.

        Args:
            application_id: Unique identifier of the application

        Returns:
            Dictionary containing a list of stages in chronological order, where each stage includes:
            - stage_id: Unique identifier of the stage
            - stage_name: Name of the stage (e.g., phone_screening, technical_interview)
            - stage_date: Date and time when the stage was reached (formatted as "yyyy-mm-dd HH:MM:SS")
            - stage_notes: Additional notes about the stage (empty string if None)

        Raises:
            KeyError: If the application_id does not exist in the system
        """
        # Access the database instance
        db = self.db

        # Retrieve the application_stage table from the database
        application_stage_table = getattr(db, 'application_stage', None)

        # Check if the application_stage table exists and is not empty
        if application_stage_table is None or not application_stage_table:
            # If no stages exist at all, the application_id cannot be found
            raise KeyError(f"Application with ID '{application_id}' not found in the system")

        # Filter stages that belong to the specified application_id
        matching_stages = []
        application_found = False

        for stage_id, stage_record in application_stage_table.items():
            if stage_record.application_id == application_id:
                application_found = True
                matching_stages.append(stage_record)

        # If no stages were found for this application_id, raise KeyError
        if not application_found:
            raise KeyError(f"Application with ID '{application_id}' not found in the system")

        # Sort the stages by stage_date in chronological order (earliest first)
        matching_stages.sort(key=lambda stage: stage.stage_date)

        # Format the stages into the required output structure
        stages_list = []
        for stage in matching_stages:
            # Format the stage_date from datetime object to "yyyy-mm-dd HH:MM:SS" string
            formatted_date = stage.stage_date.strftime("%Y-%m-%d %H:%M:%S")

            # Handle optional stage_notes field (convert None to empty string for consistency)
            stage_notes_value = stage.stage_notes if stage.stage_notes is not None else ""

            # Create the stage dictionary with required fields
            stage_dict = {
                'stage_id': stage.stage_id,
                'stage_name': stage.stage_name,
                'stage_date': formatted_date,
                'stage_notes': stage_notes_value
            }

            stages_list.append(stage_dict)

        # Return the result in the required format
        return {
            'stages': stages_list
        }

    @is_tool()
    def compare_application_requirements(self, job_requirements: list, applicant_qualifications: list) -> dict:
        """
        Compare applicant qualifications against job requirements using fuzzy matching.

        This method analyzes how well an applicant's qualifications match the job requirements
        by performing fuzzy string matching on each requirement against all qualifications.
        It returns matched requirements, missing requirements, and an overall match percentage.

        Args:
            job_requirements: List of job requirements (e.g., skills, experience, certifications)
            applicant_qualifications: List of applicant qualifications to compare against requirements

        Returns:
            dict: Dictionary containing:
                - matched_requirements: List of requirements that match applicant qualifications
                - missing_requirements: List of requirements not met by applicant
                - match_percentage: Percentage of requirements matched (0-100)

        Raises:
            ValueError: If job_requirements or applicant_qualifications is not a list,
                       or if either list is empty
        """
        from thefuzz import fuzz, process

        # Input validation: check if parameters are lists
        if not isinstance(job_requirements, list):
            raise ValueError("job_requirements must be a list")
        if not isinstance(applicant_qualifications, list):
            raise ValueError("applicant_qualifications must be a list")

        # Input validation: check if lists are not empty
        if len(job_requirements) == 0:
            raise ValueError("job_requirements cannot be empty")
        if len(applicant_qualifications) == 0:
            raise ValueError("applicant_qualifications cannot be empty")

        # Input validation: check if all elements are strings
        if not all(isinstance(req, str) for req in job_requirements):
            raise ValueError("All job_requirements must be strings")
        if not all(isinstance(qual, str) for qual in applicant_qualifications):
            raise ValueError("All applicant_qualifications must be strings")

        # Initialize result containers
        matched_requirements = []
        missing_requirements = []

        # Define matching threshold for fuzzy matching (80% similarity)
        # This threshold balances between being too strict and too lenient
        MATCH_THRESHOLD = 80

        # Process each job requirement
        for requirement in job_requirements:
            # Strip whitespace for cleaner comparison
            requirement_clean = requirement.strip()

            # Use fuzzy matching to find the best match from applicant qualifications
            # process.extractOne returns (best_match, score) or None if no candidates
            best_match = process.extractOne(
                requirement_clean, 
                [qual.strip() for qual in applicant_qualifications]
            )

            # Check if a good enough match was found
            if best_match and best_match[1] >= MATCH_THRESHOLD:
                # Requirement is matched - add original requirement text to matched list
                matched_requirements.append(requirement)
            else:
                # Requirement is not met - add to missing list
                missing_requirements.append(requirement)

        # Calculate match percentage
        # Percentage = (number of matched requirements / total requirements) * 100
        total_requirements = len(job_requirements)
        matched_count = len(matched_requirements)
        match_percentage = (matched_count / total_requirements) * 100.0

        # Round to 2 decimal places for cleaner output
        match_percentage = round(match_percentage, 2)

        # Return comparison results
        return {
            'matched_requirements': matched_requirements,
            'missing_requirements': missing_requirements,
            'match_percentage': match_percentage
        }

    @is_tool()
    def restore_archived_application(self, application_id: str, restored_status: str = "submitted") -> dict:
        """
        Restore an archived application to active status

        Args:
            application_id: Unique identifier of the archived application
            restored_status: Status to set after restoration (default: "submitted")

        Returns:
            dict: Contains application_id and restore_status

        Raises:
            KeyError: If application_id does not exist or application is not archived
        """
        from datetime import datetime

        # Access the database
        db = self.db

        # Get the job_application table
        job_application_table = getattr(db, "job_application", None)

        # Check if the table exists
        if job_application_table is None:
            raise KeyError(f"job_application table not found in database")

        # Check if the application exists
        if application_id not in job_application_table:
            raise KeyError(f"Application with id '{application_id}' does not exist")

        # Get the application record
        application = job_application_table[application_id]

        # Verify the application is currently archived
        if application.status != "archived":
            raise KeyError(f"Application '{application_id}' is not archived (current status: {application.status})")

        # Update the application status to the restored status
        application.status = restored_status

        # Update the updated_at timestamp with formatted string
        application.updated_at = datetime.now().strftime("%Y-%m-%d %H:%M:%S")

        # Write the updated application back to the database
        job_application_table[application_id] = application
        setattr(db, "job_application", job_application_table)

        # Return the result
        return {
            "application_id": application_id,
            "restore_status": "restored"
        }

    @is_tool()
    def generate_application_timeline(self, application_stages):
        """
        Generate a timeline visualization of application progress.

        This method takes a list of application stages with their dates and generates
        a structured timeline showing the progression of stages and days elapsed since
        the first stage.

        Args:
            application_stages: List of dicts containing stage_name and stage_date

        Returns:
            Dict containing timeline_data with stage, date, and days_since_start

        Raises:
            ValueError: If application_stages is empty, invalid, or contains invalid dates
        """
        from datetime import datetime

        # Validate input parameter
        if not application_stages:
            raise ValueError("application_stages must not be empty")

        if not isinstance(application_stages, list):
            raise ValueError("application_stages must be a list")

        # Validate each stage entry and parse dates
        parsed_stages = []
        for idx, stage in enumerate(application_stages):
            # Validate stage structure
            if not isinstance(stage, dict):
                raise ValueError(f"Stage at index {idx} must be a dictionary")

            if 'stage_name' not in stage or 'stage_date' not in stage:
                raise ValueError(f"Stage at index {idx} must contain 'stage_name' and 'stage_date' fields")

            stage_name = stage['stage_name']
            stage_date_str = stage['stage_date']

            # Validate stage_name
            if not isinstance(stage_name, str) or not stage_name.strip():
                raise ValueError(f"stage_name at index {idx} must be a non-empty string")

            # Validate and parse stage_date
            if not isinstance(stage_date_str, str):
                raise ValueError(f"stage_date at index {idx} must be a string")

            # Try to parse the date string in the expected format
            try:
                # Support both full datetime format and date-only format
                if len(stage_date_str.strip()) == 10:  # Date only format "yyyy-mm-dd"
                    stage_date = datetime.strptime(stage_date_str.strip(), "%Y-%m-%d")
                else:  # Full datetime format "yyyy-mm-dd HH:MM:SS"
                    stage_date = datetime.strptime(stage_date_str.strip(), "%Y-%m-%d %H:%M:%S")
            except ValueError as e:
                raise ValueError(f"stage_date at index {idx} has invalid format. Expected 'yyyy-mm-dd HH:MM:SS' or 'yyyy-mm-dd', got '{stage_date_str}': {str(e)}")

            parsed_stages.append({
                'stage_name': stage_name.strip(),
                'stage_date': stage_date,
                'stage_date_str': stage_date_str.strip()
            })

        # Sort stages by date to ensure chronological order
        parsed_stages.sort(key=lambda x: x['stage_date'])

        # Get the first stage date as the starting point
        start_date = parsed_stages[0]['stage_date']

        # Build timeline data
        timeline_data = []
        for stage in parsed_stages:
            stage_date = stage['stage_date']

            # Calculate days since start (using date difference)
            # Convert to days by dividing total seconds by seconds per day
            days_since_start = (stage_date - start_date).days

            timeline_data.append({
                'stage': stage['stage_name'],
                'date': stage['stage_date_str'],
                'days_since_start': days_since_start
            })

        return {
            'timeline_data': timeline_data
        }

    @is_tool()
    def generate_application_statistics(self, applications: list) -> dict:
        """
        Generate statistical summary of all applications.

        This method analyzes a list of applications and generates comprehensive statistics
        including total count, status breakdown, and time-based metrics (this month/week).

        Args:
            applications: List of application dictionaries containing application_id, 
                         status, and application_date

        Returns:
            Dictionary containing:
            - total_applications: Total number of applications
            - status_breakdown: Count of applications by status
            - applications_this_month: Number of applications submitted this month
            - applications_this_week: Number of applications submitted this week

        Raises:
            ValueError: If applications parameter is invalid or contains invalid data
        """
        from datetime import datetime, timedelta

        # Validate input parameter
        if not isinstance(applications, list):
            raise ValueError("applications parameter must be a list")

        if not applications:
            # Return empty statistics for empty list
            return {
                'total_applications': 0,
                'status_breakdown': {},
                'applications_this_month': 0,
                'applications_this_week': 0
            }

        # Initialize statistics containers
        total_applications = len(applications)
        status_breakdown = {}
        applications_this_month = 0
        applications_this_week = 0

        # Get current date and time for comparison
        now = datetime.now()

        # Calculate start of current month (first day at 00:00:00)
        month_start = datetime(now.year, now.month, 1)

        # Calculate start of current week (Monday at 00:00:00)
        # weekday() returns 0 for Monday, 6 for Sunday
        days_since_monday = now.weekday()
        week_start = datetime(now.year, now.month, now.day) - timedelta(days=days_since_monday)

        # Process each application
        for idx, app in enumerate(applications):
            # Validate application structure
            if not isinstance(app, dict):
                raise ValueError(f"Application at index {idx} must be a dictionary")

            if 'application_id' not in app:
                raise ValueError(f"Application at index {idx} is missing required field 'application_id'")

            if 'status' not in app:
                raise ValueError(f"Application at index {idx} is missing required field 'status'")

            if 'application_date' not in app:
                raise ValueError(f"Application at index {idx} is missing required field 'application_date'")

            # Extract status and update status breakdown
            status = app['status']
            if not isinstance(status, str):
                raise ValueError(f"Application {app['application_id']}: status must be a string")

            # Count applications by status
            status_breakdown[status] = status_breakdown.get(status, 0) + 1

            # Parse application date
            application_date_str = app['application_date']
            if not isinstance(application_date_str, str):
                raise ValueError(f"Application {app['application_id']}: application_date must be a string")

            try:
                # Parse datetime string in format "yyyy-mm-dd HH:MM:SS" or "yyyy-mm-dd"
                if len(application_date_str) == 10:
                    # Date only format "yyyy-mm-dd"
                    application_date = datetime.strptime(application_date_str, "%Y-%m-%d")
                else:
                    # Full datetime format "yyyy-mm-dd HH:MM:SS"
                    application_date = datetime.strptime(application_date_str, "%Y-%m-%d %H:%M:%S")
            except ValueError as e:
                raise ValueError(
                    f"Application {app['application_id']}: Invalid application_date format. "
                    f"Expected 'yyyy-mm-dd HH:MM:SS' or 'yyyy-mm-dd', got '{application_date_str}'"
                ) from e

            # Check if application was submitted this month
            if application_date >= month_start:
                applications_this_month += 1

            # Check if application was submitted this week
            if application_date >= week_start:
                applications_this_week += 1

        # Return comprehensive statistics
        return {
            'total_applications': total_applications,
            'status_breakdown': status_breakdown,
            'applications_this_month': applications_this_month,
            'applications_this_week': applications_this_week
        }

    @is_tool()
    def calculate_stage_duration(self, stage_start_date: str, stage_end_date: str) -> dict:
        """
        Calculate the duration spent in a specific application stage.

        This method computes the time difference between stage start and end dates,
        returning both the duration in days and hours.

        Args:
            stage_start_date: Start date of the stage in yyyy-mm-dd HH:MM:SS format
            stage_end_date: End date of the stage in yyyy-mm-dd HH:MM:SS format

        Returns:
            Dictionary containing:
                - duration_days: Duration in days (integer)
                - duration_hours: Duration in hours (integer)

        Raises:
            ValueError: If date format is invalid or end date is before start date
        """
        from datetime import datetime

        # Validate input parameters are not None or empty
        if not stage_start_date or not isinstance(stage_start_date, str):
            raise ValueError("stage_start_date must be a non-empty string")

        if not stage_end_date or not isinstance(stage_end_date, str):
            raise ValueError("stage_end_date must be a non-empty string")

        # Parse the date strings to datetime objects
        try:
            start_dt = datetime.strptime(stage_start_date.strip(), "%Y-%m-%d %H:%M:%S")
        except ValueError as e:
            raise ValueError(f"Invalid stage_start_date format. Expected 'yyyy-mm-dd HH:MM:SS', got '{stage_start_date}'. Error: {str(e)}")

        try:
            end_dt = datetime.strptime(stage_end_date.strip(), "%Y-%m-%d %H:%M:%S")
        except ValueError as e:
            raise ValueError(f"Invalid stage_end_date format. Expected 'yyyy-mm-dd HH:MM:SS', got '{stage_end_date}'. Error: {str(e)}")

        # Validate that end date is not before start date
        if end_dt < start_dt:
            raise ValueError(f"stage_end_date ({stage_end_date}) cannot be before stage_start_date ({stage_start_date})")

        # Calculate the time difference
        time_delta = end_dt - start_dt

        # Calculate duration in days (integer)
        # Using total_seconds() to get precise calculation, then converting to days
        duration_days = int(time_delta.total_seconds() // 86400)  # 86400 seconds in a day

        # Calculate duration in hours (integer)
        # Using total_seconds() to get precise calculation, then converting to hours
        duration_hours = int(time_delta.total_seconds() // 3600)  # 3600 seconds in an hour

        # Return the calculated durations
        return {
            "duration_days": duration_days,
            "duration_hours": duration_hours
        }

    @is_tool()
    def list_applications_by_status(self, status: str) -> dict:
        """
        Retrieve all job applications with a specific status.

        Args:
            status: Status to filter applications by (e.g., 'under_review', 'submitted', 'accepted')

        Returns:
            Dictionary containing:
            - applications: List of application dictionaries with selected fields
            - total_count: Total number of applications with the specified status

        Raises:
            ValueError: If status parameter is empty or invalid
        """
        # Validate input parameter
        if not status or not isinstance(status, str):
            raise ValueError("Status parameter must be a non-empty string")

        # Strip whitespace from status for comparison
        status = status.strip()

        if not status:
            raise ValueError("Status parameter cannot be empty or whitespace only")

        # Access the database
        db = self.db

        # Get the job_application table data
        job_application_table = getattr(db, 'job_application', None)

        # Initialize result list
        matching_applications = []

        # If table exists and has data, filter by status
        if job_application_table:
            # Iterate through all applications in the table
            for application_id, application in job_application_table.items():
                # Check if the application status matches the requested status
                # Use exact match as 'status' is a predefined field with specific values
                if application.status and application.status.strip() == status:
                    # Format application_date to string in required format
                    application_date_str = application.application_date.strftime("%Y-%m-%d %H:%M:%S")

                    # Build application dictionary with required fields
                    application_dict = {
                        'application_id': application.application_id,
                        'applicant_name': application.applicant_name,
                        'job_title': application.job_title,
                        'company_name': application.company_name,
                        'application_date': application_date_str
                    }

                    matching_applications.append(application_dict)

        # Sort applications by application_date in descending order (most recent first)
        # This provides a more useful ordering for the user
        matching_applications.sort(
            key=lambda x: x['application_date'],
            reverse=True
        )

        # Calculate total count
        total_count = len(matching_applications)

        # Return the result in the specified format
        return {
            'applications': matching_applications,
            'total_count': total_count
        }

    @is_tool()
    def get_high_priority_applications(self, min_priority_level: int) -> dict:
        """
        Retrieve all high priority applications based on minimum priority level threshold.

        Args:
            min_priority_level: Minimum priority level to filter by (integer value)

        Returns:
            Dictionary containing list of high priority applications with their details

        Raises:
            ValueError: If min_priority_level is invalid or no applications found
        """
        # Validate input parameter
        if not isinstance(min_priority_level, int):
            raise ValueError("min_priority_level must be an integer")

        # Priority level should be within reasonable range (1-5 as per schema description)
        if min_priority_level < 1 or min_priority_level > 5:
            raise ValueError("min_priority_level must be between 1 and 5")

        # Access the database
        db = self.db

        # Get the job_application table data
        job_application_table = getattr(db, 'job_application', None)

        # Check if table exists and has data
        if job_application_table is None:
            raise ValueError("job_application table not found in database")

        if not job_application_table:
            raise ValueError("No job applications found in database")

        # Filter applications by priority level
        # Only include applications where priority_level >= min_priority_level
        high_priority_apps = []

        for app_id, application in job_application_table.items():
            # Check if priority_level exists and meets the threshold
            if application.priority_level is not None and application.priority_level >= min_priority_level:
                # Build application dictionary with required fields
                app_dict = {
                    'application_id': application.application_id,
                    'job_title': application.job_title,
                    'company_name': application.company_name,
                    'priority_level': application.priority_level,
                    'status': application.status
                }
                high_priority_apps.append(app_dict)

        # Check if any high priority applications were found
        if not high_priority_apps:
            raise ValueError(f"No applications found with priority level >= {min_priority_level}")

        # Sort by priority level in descending order (highest priority first)
        high_priority_apps.sort(key=lambda x: x['priority_level'], reverse=True)

        # Return the result in the expected format
        return {
            'applications': high_priority_apps
        }

    @is_tool()
    def create_job_application(
        self,
        applicant_name: str,
        email: str,
        job_title: str,
        company_name: str,
        application_date: str,
        phone: str = None,
        resume_content: str = None,
        cover_letter_content: str = None
    ) -> dict:
        """
        Create a new job application with applicant information, job details, and application materials.

        This method validates input parameters, generates a unique application ID, creates a new
        JobApplication record, and stores it in the database.

        Args:
            applicant_name: Full name of the job applicant
            email: Email address of the applicant
            job_title: Title of the job position being applied for
            company_name: Name of the company
            application_date: Date when the application is submitted in yyyy-mm-dd HH:MM:SS format
            phone: Phone number of the applicant (optional)
            resume_content: Text content of the resume (optional)
            cover_letter_content: Text content of the cover letter (optional)

        Returns:
            dict: Dictionary containing application_id, status, and created_at timestamp

        Raises:
            ValueError: If required parameters are missing or invalid
        """
        from datetime import datetime
        import secrets
        import hashlib

        # Validate required parameters are not empty
        if not applicant_name or not applicant_name.strip():
            raise ValueError("applicant_name cannot be empty")

        if not email or not email.strip():
            raise ValueError("email cannot be empty")

        if not job_title or not job_title.strip():
            raise ValueError("job_title cannot be empty")

        if not company_name or not company_name.strip():
            raise ValueError("company_name cannot be empty")

        if not application_date or not application_date.strip():
            raise ValueError("application_date cannot be empty")

        # Validate and parse application_date format
        try:
            # Try parsing with time
            parsed_application_date = datetime.strptime(application_date, "%Y-%m-%d %H:%M:%S")
        except ValueError:
            try:
                # Try parsing date only format and add default time
                parsed_application_date = datetime.strptime(application_date, "%Y-%m-%d")
            except ValueError:
                raise ValueError(
                    "application_date must be in 'yyyy-mm-dd HH:MM:SS' or 'yyyy-mm-dd' format"
                )

        # Validate email format (basic validation)
        if "@" not in email or "." not in email.split("@")[-1]:
            raise ValueError("email must be a valid email address")

        # Generate unique application ID with prefix APP- and year
        current_year = datetime.now().year
        random_suffix = secrets.token_hex(3).upper()
        application_id = f"APP-{current_year}-{random_suffix}"

        # Get current timestamp for created_at
        created_at = datetime.now()

        # Access database
        db = self.db

        # Get job_application table, initialize if not exists
        job_application_table = getattr(db, "job_application", None)
        if job_application_table is None:
            job_application_table = {}

        # Determine resume_uploaded_at timestamp if resume_content is provided
        resume_uploaded_at = created_at if resume_content else None

        # Determine cover_letter_uploaded_at timestamp if cover_letter_content is provided
        cover_letter_uploaded_at = created_at if cover_letter_content else None

        # Create new JobApplication instance
        new_application = JobApplication(
            application_id=application_id,
            applicant_name=applicant_name.strip(),
            email=email.strip(),
            phone=phone.strip() if phone else None,
            job_title=job_title.strip(),
            company_name=company_name.strip(),
            application_date=parsed_application_date,
            status="submitted",  # Default status for new applications
            resume_content=resume_content,
            resume_uploaded_at=resume_uploaded_at,
            cover_letter_content=cover_letter_content,
            cover_letter_uploaded_at=cover_letter_uploaded_at,
            created_at=created_at,
            updated_at=created_at
        )

        # Add new application to the table
        job_application_table[application_id] = new_application

        # Save updated table back to database
        setattr(db, "job_application", job_application_table)

        # Format timestamps for return values
        created_at_str = created_at.strftime("%Y-%m-%d %H:%M:%S")

        # Return success response with application details
        return {
            "application_id": application_id,
            "status": "created",
            "created_at": created_at_str
        }

    @is_tool()
    def calculate_average_response_time(self, application_response_pairs: list) -> dict:
        """
        Calculate average response time across multiple applications.

        This method computes statistical metrics (average, median, fastest, slowest) 
        for response times based on application and response date pairs.

        Args:
            application_response_pairs: List of dictionaries containing 'application_date' 
                                       and 'response_date' in "yyyy-mm-dd HH:MM:SS" format

        Returns:
            Dictionary containing:
                - average_days: Mean response time in days
                - median_days: Median response time in days
                - fastest_response_days: Minimum response time in days
                - slowest_response_days: Maximum response time in days

        Raises:
            ValueError: If input is empty, dates are invalid, or response date is before application date
        """
        from datetime import datetime

        # Validate input is not empty
        if not application_response_pairs or len(application_response_pairs) == 0:
            raise ValueError("application_response_pairs cannot be empty")

        # List to store response times in days
        response_times = []

        # Process each application-response pair
        for idx, pair in enumerate(application_response_pairs):
            # Validate pair structure
            if not isinstance(pair, dict):
                raise ValueError(f"Item at index {idx} must be a dictionary")

            if 'application_date' not in pair or 'response_date' not in pair:
                raise ValueError(f"Item at index {idx} must contain both 'application_date' and 'response_date'")

            application_date_str = pair['application_date']
            response_date_str = pair['response_date']

            # Validate date strings are not empty
            if not application_date_str or not response_date_str:
                raise ValueError(f"Dates at index {idx} cannot be empty")

            try:
                # Parse application date - support both full datetime and date-only formats
                if len(application_date_str.strip()) == 10:  # Date only format "yyyy-mm-dd"
                    application_date = datetime.strptime(application_date_str.strip(), "%Y-%m-%d")
                else:  # Full datetime format "yyyy-mm-dd HH:MM:SS"
                    application_date = datetime.strptime(application_date_str.strip(), "%Y-%m-%d %H:%M:%S")
            except ValueError as e:
                raise ValueError(f"Invalid application_date format at index {idx}: {application_date_str}. Expected 'yyyy-mm-dd' or 'yyyy-mm-dd HH:MM:SS'")

            try:
                # Parse response date - support both full datetime and date-only formats
                if len(response_date_str.strip()) == 10:  # Date only format "yyyy-mm-dd"
                    response_date = datetime.strptime(response_date_str.strip(), "%Y-%m-%d")
                else:  # Full datetime format "yyyy-mm-dd HH:MM:SS"
                    response_date = datetime.strptime(response_date_str.strip(), "%Y-%m-%d %H:%M:%S")
            except ValueError as e:
                raise ValueError(f"Invalid response_date format at index {idx}: {response_date_str}. Expected 'yyyy-mm-dd' or 'yyyy-mm-dd HH:MM:SS'")

            # Validate response date is not before application date
            if response_date < application_date:
                raise ValueError(f"Response date at index {idx} cannot be before application date")

            # Calculate time difference in days (with fractional days for precision)
            time_diff = response_date - application_date
            days_diff = time_diff.total_seconds() / (24 * 3600)

            response_times.append(days_diff)

        # Calculate statistical metrics
        # Average response time
        average_days = sum(response_times) / len(response_times)

        # Median response time
        sorted_times = sorted(response_times)
        n = len(sorted_times)
        if n % 2 == 0:
            # Even number of elements: average of two middle values
            median_days = (sorted_times[n // 2 - 1] + sorted_times[n // 2]) / 2
        else:
            # Odd number of elements: middle value
            median_days = sorted_times[n // 2]

        # Fastest (minimum) response time
        fastest_response_days = min(response_times)

        # Slowest (maximum) response time
        slowest_response_days = max(response_times)

        # Return results
        return {
            'average_days': average_days,
            'median_days': median_days,
            'fastest_response_days': fastest_response_days,
            'slowest_response_days': slowest_response_days
        }

    @is_tool()
    def list_applications_by_date_range(self, start_date: str, end_date: str):
        """
        Retrieve job applications submitted within a specific date range.

        This method filters job applications based on their application_date field,
        returning all applications that fall within the specified date range (inclusive).

        Args:
            start_date: Start date of the range in yyyy-mm-dd format
            end_date: End date of the range in yyyy-mm-dd format

        Returns:
            A dictionary containing:
            - applications: List of application dictionaries with selected fields
            - total_count: Total number of applications in the date range

        Raises:
            ValueError: If date format is invalid or start_date is after end_date
        """
        from datetime import datetime

        # Validate and parse date parameters
        try:
            # Parse start_date and end_date to datetime objects
            start_dt = datetime.strptime(start_date, "%Y-%m-%d")
            end_dt = datetime.strptime(end_date, "%Y-%m-%d")

            # Set end_dt to the end of the day (23:59:59) to include all applications on end_date
            end_dt = end_dt.replace(hour=23, minute=59, second=59)

        except ValueError as e:
            raise ValueError(f"Invalid date format. Expected yyyy-mm-dd format. Error: {str(e)}")

        # Validate that start_date is not after end_date
        if start_dt > end_dt:
            raise ValueError("start_date cannot be after end_date")

        # Access the database
        db = self.db

        # Get the job_application table
        job_application_table = getattr(db, "job_application", None)

        # If table doesn't exist or is empty, return empty result
        if job_application_table is None or len(job_application_table) == 0:
            return {
                "applications": [],
                "total_count": 0
            }

        # Filter applications within the date range
        filtered_applications = []

        for application_id, application in job_application_table.items():
            # Get the application_date from the application object
            app_date = application.application_date

            # Check if application_date falls within the date range (inclusive)
            if start_dt <= app_date <= end_dt:
                # Format the application_date to string format "yyyy-mm-dd HH:MM:SS"
                formatted_date = app_date.strftime("%Y-%m-%d %H:%M:%S")

                # Create a dictionary with the required fields
                app_dict = {
                    "application_id": application.application_id,
                    "applicant_name": application.applicant_name,
                    "job_title": application.job_title,
                    "company_name": application.company_name,
                    "application_date": formatted_date
                }

                filtered_applications.append(app_dict)

        # Sort applications by application_date (ascending order)
        # This provides a consistent ordering for the results
        filtered_applications.sort(key=lambda x: x["application_date"])

        # Calculate total count
        total_count = len(filtered_applications)

        # Return the result
        return {
            "applications": filtered_applications,
            "total_count": total_count
        }

    @is_tool()
    def detect_duplicate_applications(self, job_title: str, company_name: str, existing_applications: list) -> dict:
        """
        Detect potential duplicate applications based on job title and company name using fuzzy matching.

        This method compares the provided job_title and company_name against existing applications
        to identify potential duplicates. It uses fuzzy string matching to handle variations in
        naming and formatting.

        Args:
            job_title: Job title to check for duplicates
            company_name: Company name to check for duplicates
            existing_applications: List of existing application dictionaries, each containing:
                - application_id: Unique identifier for the application
                - job_title: Job title of the existing application
                - company_name: Company name of the existing application

        Returns:
            Dictionary containing:
                - is_duplicate: Boolean indicating if duplicate(s) were found
                - duplicate_application_ids: List of application IDs that are potential duplicates

        Raises:
            ValueError: If required parameters are missing or invalid
        """
        from thefuzz import fuzz

        # Validate input parameters
        if not job_title or not isinstance(job_title, str):
            raise ValueError("job_title must be a non-empty string")

        if not company_name or not isinstance(company_name, str):
            raise ValueError("company_name must be a non-empty string")

        if not isinstance(existing_applications, list):
            raise ValueError("existing_applications must be a list")

        # Initialize result structure
        duplicate_ids = []

        # Define similarity threshold for fuzzy matching (0-100 scale)
        # Using 85 as threshold - high enough to catch real duplicates but allow minor variations
        SIMILARITY_THRESHOLD = 85

        # Normalize input strings for better matching (strip whitespace, lowercase for comparison)
        job_title_normalized = job_title.strip()
        company_name_normalized = company_name.strip()

        # Iterate through existing applications to find duplicates
        for app in existing_applications:
            # Validate application structure
            if not isinstance(app, dict):
                continue

            if 'application_id' not in app or 'job_title' not in app or 'company_name' not in app:
                continue

            # Extract and normalize existing application data
            existing_job_title = app.get('job_title', '').strip()
            existing_company_name = app.get('company_name', '').strip()
            existing_app_id = app.get('application_id')

            # Skip if any required field is empty
            if not existing_job_title or not existing_company_name or not existing_app_id:
                continue

            # Calculate fuzzy matching scores for both job title and company name
            # Using partial_ratio to handle cases where one string is a substring of another
            job_title_similarity = fuzz.partial_ratio(
                job_title_normalized.lower(),
                existing_job_title.lower()
            )

            company_name_similarity = fuzz.partial_ratio(
                company_name_normalized.lower(),
                existing_company_name.lower()
            )

            # Consider it a duplicate if BOTH job title and company name have high similarity
            # This ensures we don't flag different positions at the same company or
            # same position at different companies as duplicates
            if (job_title_similarity >= SIMILARITY_THRESHOLD and 
                company_name_similarity >= SIMILARITY_THRESHOLD):
                duplicate_ids.append(existing_app_id)

        # Prepare and return result
        result = {
            'is_duplicate': len(duplicate_ids) > 0,
            'duplicate_application_ids': duplicate_ids
        }

        return result

    @is_tool()
    def add_salary_expectation(self, application_id: str, expected_salary_min: float, expected_salary_max: float = None, salary_currency: str = None):
        """
        Add salary expectation information to an application

        This method updates an existing job application with salary expectation details.
        It validates the application exists, checks salary values are valid, and updates
        the application record with the provided salary information.

        Args:
            application_id: Unique identifier of the application
            expected_salary_min: Minimum expected salary (required)
            expected_salary_max: Maximum expected salary (optional)
            salary_currency: Currency for salary (optional, defaults to USD if not provided)

        Returns:
            dict: Contains application_id and salary_expectation_added (boolean)

        Raises:
            KeyError: If application_id does not exist in the database
            ValueError: If salary values are invalid (negative or min > max)
        """
        from datetime import datetime

        # Access the database
        db = self.db

        # Get the job_application table
        job_application_table = getattr(db, 'job_application', None)

        # Check if the table exists
        if job_application_table is None:
            raise KeyError(f"Application table not found in database")

        # Check if the application exists
        if application_id not in job_application_table:
            raise KeyError(f"Application with id '{application_id}' does not exist")

        # Validate salary values
        if expected_salary_min < 0:
            raise ValueError(f"Minimum expected salary cannot be negative: {expected_salary_min}")

        if expected_salary_max is not None:
            if expected_salary_max < 0:
                raise ValueError(f"Maximum expected salary cannot be negative: {expected_salary_max}")
            if expected_salary_max < expected_salary_min:
                raise ValueError(f"Maximum expected salary ({expected_salary_max}) cannot be less than minimum ({expected_salary_min})")

        # Get the application record
        application = job_application_table[application_id]

        # Update salary expectation fields
        application.expected_salary_min = expected_salary_min

        # Update optional fields if provided
        if expected_salary_max is not None:
            application.expected_salary_max = expected_salary_max

        # Set salary currency - use provided value or default to USD
        if salary_currency is not None:
            application.salary_currency = salary_currency
        elif application.salary_currency is None:
            # If no currency provided and none exists, use USD as default
            application.salary_currency = "USD"

        # Update the updated_at timestamp
        application.updated_at = datetime.now()

        # Save the updated application back to the database
        job_application_table[application_id] = application
        setattr(db, 'job_application', job_application_table)

        # Return success response
        return {
            'application_id': application_id,
            'salary_expectation_added': True
        }

    @is_tool()
    def generate_application_summary(self, job_title: str, company_name: str, application_date: str, status: str, job_requirements: list = None) -> dict:
        """
        Generate a summary of key information for a job application.

        This method creates a formatted summary text based on the provided application details.
        It does not require database access as it works with the provided parameters directly.

        Args:
            job_title: Title of the job position
            company_name: Name of the company
            application_date: Date of application in yyyy-mm-dd HH:MM:SS format
            status: Current status of the application
            job_requirements: Optional list of key job requirements

        Returns:
            dict: Dictionary containing the generated summary text

        Raises:
            ValueError: If required parameters are missing or invalid
        """
        from datetime import datetime

        # Validate required parameters
        if not job_title or not isinstance(job_title, str):
            raise ValueError("job_title must be a non-empty string")

        if not company_name or not isinstance(company_name, str):
            raise ValueError("company_name must be a non-empty string")

        if not application_date or not isinstance(application_date, str):
            raise ValueError("application_date must be a non-empty string")

        if not status or not isinstance(status, str):
            raise ValueError("status must be a non-empty string")

        # Validate and parse application_date format
        try:
            # Try to parse the full datetime format
            parsed_date = datetime.strptime(application_date, "%Y-%m-%d %H:%M:%S")
            # Format date for display (just the date part)
            formatted_date = parsed_date.strftime("%Y-%m-%d")
        except ValueError:
            try:
                # Try to parse date-only format
                parsed_date = datetime.strptime(application_date, "%Y-%m-%d")
                formatted_date = parsed_date.strftime("%Y-%m-%d")
            except ValueError:
                raise ValueError("application_date must be in 'yyyy-mm-dd HH:MM:SS' or 'yyyy-mm-dd' format")

        # Validate job_requirements if provided
        if job_requirements is not None:
            if not isinstance(job_requirements, list):
                raise ValueError("job_requirements must be a list")
            if not all(isinstance(req, str) for req in job_requirements):
                raise ValueError("All items in job_requirements must be strings")

        # Build the summary text
        summary_parts = []

        # Basic application information
        summary_parts.append(f"Applied for {job_title} position at {company_name} on {formatted_date}.")

        # Current status
        summary_parts.append(f"Current status: {status}.")

        # Add job requirements if provided
        if job_requirements and len(job_requirements) > 0:
            requirements_text = ", ".join(job_requirements)
            summary_parts.append(f"Key requirements: {requirements_text}.")

        # Combine all parts into final summary
        summary_text = " ".join(summary_parts)

        # Return the result as a dictionary with summary_text key
        return {
            "summary_text": summary_text
        }

    @is_tool()
    def format_application_for_display(self, application_data: dict, display_format: str = "summary") -> dict:
        """
        Format application data for user-friendly display.

        This method transforms raw application data into a formatted text string
        suitable for display to users. It supports different display formats.

        Args:
            application_data: Dictionary containing application information with keys:
                - application_id: Unique identifier for the application
                - job_title: Title of the job position
                - company_name: Name of the company
                - status: Current application status
                - application_date: Date when application was submitted (format: "yyyy-mm-dd HH:MM:SS")
            display_format: Format type for display (default: "summary")
                Supported formats:
                - "summary": Brief one-line summary
                - "detailed": Multi-line detailed view
                - "compact": Very brief format

        Returns:
            Dictionary containing:
                - formatted_text: Formatted string ready for display

        Raises:
            ValueError: If required fields are missing or invalid
        """
        from datetime import datetime

        # Validate that application_data is provided and is a dictionary
        if not application_data:
            raise ValueError("application_data is required and cannot be empty")

        if not isinstance(application_data, dict):
            raise ValueError("application_data must be a dictionary")

        # Validate required fields in application_data
        required_fields = ['application_id', 'job_title', 'company_name', 'status', 'application_date']
        missing_fields = [field for field in required_fields if field not in application_data]

        if missing_fields:
            raise ValueError(f"Missing required fields in application_data: {', '.join(missing_fields)}")

        # Extract data from application_data
        application_id = application_data.get('application_id', '')
        job_title = application_data.get('job_title', '')
        company_name = application_data.get('company_name', '')
        status = application_data.get('status', '')
        application_date = application_data.get('application_date', '')

        # Validate that extracted fields are not empty
        if not all([application_id, job_title, company_name, status, application_date]):
            raise ValueError("All required fields (application_id, job_title, company_name, status, application_date) must have non-empty values")

        # Parse and format the application date
        try:
            # Parse the datetime string
            if isinstance(application_date, str):
                # Try parsing with full datetime format first
                try:
                    date_obj = datetime.strptime(application_date, "%Y-%m-%d %H:%M:%S")
                    formatted_date = date_obj.strftime("%Y-%m-%d")
                except ValueError:
                    # Try parsing with date-only format
                    date_obj = datetime.strptime(application_date, "%Y-%m-%d")
                    formatted_date = date_obj.strftime("%Y-%m-%d")
            else:
                raise ValueError("application_date must be a string in format 'yyyy-mm-dd HH:MM:SS' or 'yyyy-mm-dd'")
        except ValueError as e:
            raise ValueError(f"Invalid application_date format. Expected 'yyyy-mm-dd HH:MM:SS' or 'yyyy-mm-dd', got: {application_date}")

        # Format status for display (convert underscore to space and title case)
        display_status = status.replace('_', ' ').title()

        # Generate formatted text based on display_format
        if display_format == "summary":
            # Summary format: "Job Title at Company Name - Status: Status (Applied: Date)"
            formatted_text = f"{job_title} at {company_name} - Status: {display_status} (Applied: {formatted_date})"

        elif display_format == "detailed":
            # Detailed format: Multi-line with all information
            formatted_text = (
                f"Application ID: {application_id}\n"
                f"Position: {job_title}\n"
                f"Company: {company_name}\n"
                f"Status: {display_status}\n"
                f"Applied Date: {formatted_date}"
            )

        elif display_format == "compact":
            # Compact format: Very brief, just essentials
            formatted_text = f"{job_title} @ {company_name} ({display_status})"

        else:
            # Default to summary format for unknown formats
            formatted_text = f"{job_title} at {company_name} - Status: {display_status} (Applied: {formatted_date})"

        # Return the formatted result
        return {
            'formatted_text': formatted_text
        }
