#!/usr/bin/env python3
"""Script to remove all comments from Python files while preserving strings."""

import os
import re
import sys
from pathlib import Path
import tokenize
import io


def remove_comments_from_python_file(file_path):
    """
    Remove all comments from a Python file while preserving:
    - Shebang lines
    - Strings containing #
    - Functional code
    
    Returns: (modified_content, has_changes)
    """
    try:
        with open(file_path, 'r', encoding='utf-8') as f:
            original_content = f.read()
    except Exception as e:
        print(f"Error reading {file_path}: {e}")
        return None, False
    
    if not original_content.strip():
        return original_content, False
    
    try:
        lines = original_content.splitlines(keepends=True)
        result_lines = []
        tokens = list(tokenize.generate_tokens(io.StringIO(original_content).readline))
        
        comment_positions = set()
        for tok in tokens:
            if tok.type == tokenize.COMMENT:
                line_no = tok.start[0]
                start_col = tok.start[1]
                comment_positions.add((line_no, start_col, tok.string))
        
        for i, line in enumerate(lines, start=1):
            if i == 1 and line.startswith('#!'):
                result_lines.append(line)
                continue
            
            comments_on_line = [(start_col, comment) for (line_no, start_col, comment) in comment_positions if line_no == i]
            
            if not comments_on_line:
                result_lines.append(line)
            else:
                comments_on_line.sort(key=lambda x: x[0])
                first_comment_col = comments_on_line[0][0]
                
                code_before = line[:first_comment_col]
                
                if code_before.strip():
                    result_lines.append(code_before.rstrip() + '\n')
                elif not code_before.strip():
                    pass
        
        modified_content = ''.join(result_lines)
        has_changes = modified_content != original_content
        
        return modified_content, has_changes
    
    except Exception as e:
        print(f"Error processing {file_path}: {e}")
        return None, False


def process_directory(root_dir):
    """Process all Python files in directory."""
    root_path = Path(root_dir)
    py_files = list(root_path.rglob('*.py'))
    
    modified_files = []
    error_files = []
    
    for py_file in py_files:
        print(f"Processing: {py_file}")
        
        modified_content, has_changes = remove_comments_from_python_file(py_file)
        
        if modified_content is None:
            error_files.append(str(py_file))
            continue
        
        if has_changes:
            try:
                with open(py_file, 'w', encoding='utf-8') as f:
                    f.write(modified_content)
                modified_files.append(str(py_file))
                print(f"  ✓ Modified")
            except Exception as e:
                print(f"  ✗ Error writing: {e}")
                error_files.append(str(py_file))
        else:
            print(f"  - No changes needed")
    
    return modified_files, error_files, len(py_files)


if __name__ == '__main__':
    target_dir = r'c:\Users\13113\Downloads\submit\sup-bigym'
    
    print(f"Removing comments from Python files in: {target_dir}\n")
    
    modified_files, error_files, total_files = process_directory(target_dir)
    
    print("\n" + "="*80)
    print("SUMMARY")
    print("="*80)
    print(f"Total files processed: {total_files}")
    print(f"Modified files: {len(modified_files)}")
    print(f"Error files: {len(error_files)}")
    
    if modified_files:
        print("\nModified files:")
        for f in sorted(modified_files):
            print(f"  - {f}")
    
    if error_files:
        print("\nError files:")
        for f in sorted(error_files):
            print(f"  - {f}")
