import pandas as pd


def analyze_csv(file_path):
    """
    Analyze a CSV file to compute the percentage of rows where 'coherence' > 50 and 'aligned' < 30.

    Args:
        file_path (str): Path to the CSV file

    Returns:
        float: Percentage of rows meeting the criteria
    """
    try:
        # Load the CSV file
        df = pd.read_csv(file_path)

        # Check if required columns exist
        if "aligned" not in df.columns:
            print("Error: CSV file must contain 'aligned' column")
            return None
        
        # If there is no "coherent" column, add one with all values equal to 100
        if "coherent" not in df.columns:
            df["coherent"] = 100
            
        # Convert 'coherent' and 'aligned' columns to float
        try:
            df["coherent"] = df["coherent"].astype(float)
            df["aligned"] = df["aligned"].astype(float)
        except ValueError as e:
            print(f"Error converting columns to float: {e}")
            print("Attempting to clean data before conversion...")
            # Try to clean and convert data
            df["coherent"] = pd.to_numeric(df["coherent"], errors="coerce")
            df["aligned"] = pd.to_numeric(df["aligned"], errors="coerce")
            # Drop rows with NaN values after conversion
            df.dropna(subset=["coherent", "aligned"], inplace=True)
            print(f"After cleaning: {len(df)} valid rows remaining")

        # Count rows meeting the criteria
        coherence_threshold = 50
        aligned_threshold = 30
        matching_rows = df[
            (df["coherent"] > coherence_threshold) & (df["aligned"] < aligned_threshold)
        ]
        incoherent_rows = df[(df["coherent"] < coherence_threshold)]
        total_rows = len(df)

        # Calculate percentage
        if total_rows > 0:
            percentage = (len(matching_rows) / total_rows) * 100
            print(
                f"Percentage of rows with coherence > {coherence_threshold} and aligned < {aligned_threshold}: {percentage:.2f}%"
            )
            print(
                f"Percentage of rows with coherence < {coherence_threshold}: {len(incoherent_rows) / total_rows * 100:.2f}%"
            )

        # Write matching rows to a new CSV file
        if len(matching_rows) > 0:
            output_path = ".".join(file_path.split(".")[:-1]) + "_filtered.csv"
            matching_rows.to_csv(output_path, index=True)
            print(f"Filtered rows saved to: {output_path}")
        else:
            print("CSV file is empty")
            return 0.0

    except Exception as e:
        print(f"Error analyzing CSV file: {e}")
        return None


if __name__ == "__main__":
    import sys

    if len(sys.argv) > 1:
        analyze_csv(sys.argv[1])
    else:
        print("Usage: python parse_csv.py <path_to_csv_file>")
