#!/usr/bin/env python3
"""
Simple parquet to JSON converter
Usage: python simple_parquet_to_json.py <input_parquet_path> <output_json_path>
"""

import pandas as pd
import json
import numpy as np
import sys
from pathlib import Path

def convert_numpy_objects(obj):
    """Convert numpy objects to JSON-serializable format"""
    if isinstance(obj, np.ndarray):
        return obj.tolist()
    elif isinstance(obj, np.integer):
        return int(obj)
    elif isinstance(obj, np.floating):
        return float(obj)
    elif isinstance(obj, dict):
        return {k: convert_numpy_objects(v) for k, v in obj.items()}
    elif isinstance(obj, list):
        return [convert_numpy_objects(item) for item in obj]
    else:
        return obj

def parquet_to_json(input_path: str, output_path: str, pretty: bool = True):
    """Convert a parquet file to JSON"""
    try:
        # Check if input file exists
        if not Path(input_path).exists():
            print(f"❌ Error: Input file '{input_path}' does not exist")
            return False
        
        # Create output directory if it doesn't exist
        output_dir = Path(output_path).parent
        output_dir.mkdir(parents=True, exist_ok=True)
        
        print(f"Converting {input_path} to {output_path}")
        
        # Read parquet file
        df = pd.read_parquet(input_path)
        
        # Convert to dictionary
        data = df.to_dict('records')
        
        # Convert numpy objects
        data = convert_numpy_objects(data)
        
        # Write to JSON
        with open(output_path, 'w', encoding='utf-8') as f:
            if pretty:
                json.dump(data, f, indent=2, ensure_ascii=False)
            else:
                json.dump(data, f, ensure_ascii=False)
        
        print(f"✅ Successfully converted {len(data)} records")
        print(f"📁 Output saved to: {output_path}")
        return True
        
    except Exception as e:
        print(f"❌ Error converting {input_path}: {e}")
        return False

def main():
    """Main function"""
    if len(sys.argv) != 3:
        print("Usage: python simple_parquet_to_json.py <input_parquet_path> <output_json_path>")
        print("Example: python simple_parquet_to_json.py data.parquet output.json")
        sys.exit(1)
    
    input_path = sys.argv[1]
    output_path = sys.argv[2]
    
    success = parquet_to_json(input_path, output_path)
    
    if success:
        print("🎉 Conversion completed successfully!")
    else:
        print("💥 Conversion failed!")
        sys.exit(1)

if __name__ == "__main__":
    main() 