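# Deletes every file that lacks '_proc' in its name from the top level of each
# directory given on the command line (subdirectories are not entered).
#
# Usage example:
#   python3 clean_procfiles.py /home/miria/CVXDPO/extracted_features/batchsize150/extracted_features_attn_NEG_POS_SFT_distilbert_distilgpt2_ultra/ /home/miria/CVXDPO/extracted_features/batchsize150/extracted_features_attn_NEG_POS_SFT_openai-community_gpt2_ultra/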


import os
import argparse
import sys

def clean_proc_files(directory: str) -> None:
    """
    Delete every file directly inside `directory` whose name lacks '_proc'.

    Only the top level of `directory` is examined; subdirectories and their
    contents are left alone, as is any entry for which `os.path.isfile` is
    false. Each deletion is reported on stdout. Problems (not a directory,
    directory cannot be listed, a file cannot be removed) are reported on
    stderr and never raised, so one bad path does not stop a cleanup run.

    Args:
        directory: Path of the directory to clean.
    """
    if not os.path.isdir(directory):
        print(f"Skipping: {directory} (not a directory)", file=sys.stderr)
        return

    # The directory can still be unreadable (permissions) or disappear between
    # the check above and the listing; report that instead of crashing.
    try:
        names = os.listdir(directory)
    except OSError as e:
        print(f"Failed to list {directory}: {e}", file=sys.stderr)
        return

    for name in names:
        # Names carrying the '_proc' marker are the ones to keep.
        if "_proc" in name:
            continue
        path = os.path.join(directory, name)
        # Only consider files; directories and other entries are untouched.
        if not os.path.isfile(path):
            continue
        try:
            os.remove(path)
        except OSError as e:
            print(f"Failed to delete {path}: {e}", file=sys.stderr)
        else:
            # Reported outside the try so a failing print is never mistaken
            # for a failed deletion.
            print(f"Deleted: {path}")

def main():
    """
    Command-line entry point.

    Takes one or more directory paths as positional arguments, announces each
    one on stdout, and hands it to `clean_proc_files`.
    """
    cli = argparse.ArgumentParser(
        description="Keep only files with '_proc' in the name under each given directory."
    )
    cli.add_argument('dirs', nargs='+', help="One or more directories to clean up")
    targets = cli.parse_args().dirs

    for target in targets:
        print(f"\nCleaning directory: {target}")
        clean_proc_files(target)

# Run the cleanup only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()
