"""
Script to scan all JSON files in save/solution directory and delete files 
that contain more than 1 '\boxed' in the new_solution field.
"""

import json
import os
import re
from pathlib import Path
import argparse
from olym_gen.generator.answer_compare_generator import ExtractAnswerMixin
from olym_gen.utils.utils import get_logger

logger = get_logger()
logger.addFilter(lambda record: not "answer_compare_generator.py" in record.pathname)  # Set filter to block ExtractBoxedAnswer logs

def count_boxed_occurrences(text):
    """Count the number of '\boxed' occurrences in the text."""
    if not text:
        return 0
    return len(re.findall(r'\\boxed\s*\{', text))

def process_solution_files(solution_dir, confirm_deletion=True, lines=None):
    """Process all JSON files in the solution directory."""
    solution_path = Path(solution_dir)

    if not solution_path.exists():
        logger.error(f"Directory {solution_dir} does not exist.")
        return

    # Get all JSON files
    json_files = list(solution_path.glob("*.json"))
    logger.info(f"Found {len(json_files)} JSON files to process.")

    files_to_delete = []
    total_processed = 0
    error_count = 0

    for json_file in json_files:
        total_processed += 1

        try:
            # Read the JSON file
            with open(json_file, 'r', encoding='utf-8') as f:
                data = json.load(f)

            # Check if 'new_solution' field exists
            if 'new_solution' not in data:
                logger.warning(f"File {json_file.name} does not have 'new_solution' field.")
                continue

            # Count \boxed occurrences in new_solution
            new_solution = data['new_solution']
            boxed_count = count_boxed_occurrences(new_solution)
            answer = ExtractAnswerMixin().extract_boxed_answer(new_solution)

            if boxed_count != 1 or answer == '':
                files_to_delete.append(json_file)
                logger.debug(f"File {json_file.name}: Found {boxed_count} \\boxed occurrences - MARKED FOR DELETION")
            else:
                logger.debug(f"File {json_file.name}: Found {boxed_count} \\boxed occurrences - OK")

        except json.JSONDecodeError as e:
            logger.error(f"Failed to parse JSON in {json_file.name}: {e}")
            error_count += 1
        except Exception as e:
            logger.error(f"Failed to process {json_file.name}: {e}")
            error_count += 1

        if lines is not None and total_processed >= lines:
            logger.info(f"Processed {lines} files, stopping early.")
            break

    logger.info(f"Processing complete!")
    logger.info(f"Total files processed: {total_processed}")
    logger.info(f"Files with errors: {error_count}")
    logger.info(f"Files marked for deletion: {len(files_to_delete)}")

    if files_to_delete:
        logger.info(f"\nFiles to be deleted ({len(files_to_delete)}):")
        for file_path in files_to_delete:
            logger.debug(f"  - {file_path.name}")

        # Ask for confirmation before deletion

        if confirm_deletion:
            response = input(f"\nDo you want to delete these {len(files_to_delete)} files? (y/N): ").strip().lower()
        else:
            response = 'y'

        if response == 'y' or response == 'yes':
            deleted_count = 0
            for file_path in files_to_delete:
                try:
                    os.remove(file_path)
                    logger.debug(f"Deleted: {file_path.name}")
                    deleted_count += 1
                except Exception as e:
                    logger.error(f"Error deleting {file_path.name}: {e}")

            logger.info(f"\nDeletion complete! Successfully deleted {deleted_count} files.")
        else:
            logger.info("Deletion cancelled.")
    else:
        logger.info("\nNo files need to be deleted.")

if __name__ == "__main__":
    parser = argparse.ArgumentParser(description="Process solution files to check for multiple boxed answers.")
    parser.add_argument('--no_confirm', action='store_false', help="Don't ask for confirmation before deleting files.")
    parser.add_argument('--lines', type=int, default=None, help="Number of files to process (default: all).")
    parser.add_argument('--solution_directory', type=str, default='save/solution', help="Directory containing solution JSON files.")
    args = parser.parse_args()
    process_solution_files(args.solution_directory, args.no_confirm, args.lines)
