import os
import argparse
from pathlib import Path

# This file is used to fill in the input file parameters of Evaluate_Trajectory_By_Rule/split_traj_by_patch_correctness/trajectory2report-xxx.py.

def classify_traj_files(base_path="data/trajectory_original"):
    """
    Classify the relative path of all subfiles in the result/traj directory
    Args:
        base_path: The base directory path to search for trajectory files (default: "data/trajectory_original")
    Returns 3 lists:
    1. The file name contains the file "openhands"
    2. The file name contains a file with "moatless"
    3. Other documents
    """
    base_path = Path(base_path)
    
    openhands_files = []
    moatless_files = []
    other_files = []
    
    # traverse all subdirectories and files
    for root, dirs, files in os.walk(base_path):
        for file in files:
            file_path = os.path.join(root, file)
            # Generate relative path instead of absolute path
            relative_path = os.path.relpath(file_path)

            # classify according to file name
            if "openhands" in file.lower():
                openhands_files.append(relative_path)
            elif "moatless" in file.lower():
                moatless_files.append(relative_path)
            else:
                other_files.append(relative_path)
    
    return openhands_files, moatless_files, other_files

if __name__ == "__main__":
    parser = argparse.ArgumentParser(description="Classify trajectory files by their names")
    parser.add_argument(
        "--base_path", 
        type=str, 
        default="data/trajectory_original",
        help="Base directory path to search for trajectory files (default: data/trajectory_original)"
    )
    
    args = parser.parse_args()
    
    openhands_list, moatless_list, other_list = classify_traj_files(args.base_path)

    # output three steps according to requirements
    print(" The first list (the file containing 'openhands') :")
    print(sorted(openhands_list))

    print("\n The second list (containing 'moatless' files) :")
    print(sorted(moatless_list))

    print("\n The third list (other files) :")
    print(sorted(other_list))