package parquet

import (
	"fmt"
	"os"
	"path/filepath"
	"sync"
	"time"

	"github.com/xitongsys/parquet-go-source/local"
	"github.com/xitongsys/parquet-go/parquet"
	"github.com/xitongsys/parquet-go/writer"
)

// BatchWriter handles buffered writing to Parquet files with automatic rotation
type BatchWriter[T any] struct {
	mu            sync.Mutex
	outputDir     string
	batchSize     int
	maxFileSize   int64
	flushInterval time.Duration

	buffer          []T
	currentFilePath string
	parquetWriter   *writer.ParquetWriter
	currentFileSize int64
	fileCounter     int
	lastFlush       time.Time

	flushTicker *time.Ticker
	stopChan    chan struct{}
	wg          sync.WaitGroup

	// Metrics
	totalSize int64
}

// NewBatchWriter creates a new batch writer for the given type
func NewBatchWriter[T any](outputDir string, batchSize int, maxFileSize int64, flushInterval int) (*BatchWriter[T], error) {
	// Create output directory if it doesn't exist
	if err := os.MkdirAll(outputDir, 0755); err != nil {
		return nil, fmt.Errorf("failed to create output directory: %w", err)
	}

	bw := &BatchWriter[T]{
		outputDir:     outputDir,
		batchSize:     batchSize,
		maxFileSize:   maxFileSize,
		flushInterval: time.Duration(flushInterval) * time.Second,
		buffer:        make([]T, 0, batchSize),
		lastFlush:     time.Now(),
		stopChan:      make(chan struct{}),
	}

	// Start periodic flush goroutine
	bw.flushTicker = time.NewTicker(bw.flushInterval)
	bw.wg.Add(1)
	go bw.periodicFlush()

	return bw, nil
}

// GetTotalSize returns the total size of data written in bytes
func (bw *BatchWriter[T]) GetTotalSize() int64 {
	bw.mu.Lock()
	defer bw.mu.Unlock()
	return bw.totalSize
}

// Write adds a record to the buffer
func (bw *BatchWriter[T]) Write(record T) error {
	bw.mu.Lock()
	defer bw.mu.Unlock()

	bw.buffer = append(bw.buffer, record)

	// Check if we need to flush
	if len(bw.buffer) >= bw.batchSize {
		return bw.flushLocked()
	}

	return nil
}

// Flush writes all buffered records to disk
func (bw *BatchWriter[T]) Flush() error {
	bw.mu.Lock()
	defer bw.mu.Unlock()
	return bw.flushLocked()
}

// flushLocked performs the actual flush (must be called with lock held)
func (bw *BatchWriter[T]) flushLocked() error {
	if len(bw.buffer) == 0 {
		return nil
	}

	// Check if we need to rotate file based on actual file size
	if bw.parquetWriter == nil {
		if err := bw.rotateFileLocked(); err != nil {
			return fmt.Errorf("failed to rotate file: %w", err)
		}
	} else if bw.currentFilePath != "" {
		// Check actual file size before writing
		if fileInfo, err := os.Stat(bw.currentFilePath); err == nil {
			newSize := fileInfo.Size()
			delta := newSize - bw.currentFileSize
			if delta > 0 {
				bw.totalSize += delta
			}
			bw.currentFileSize = newSize

			if bw.currentFileSize >= bw.maxFileSize {
				if err := bw.rotateFileLocked(); err != nil {
					return fmt.Errorf("failed to rotate file: %w", err)
				}
			}
		}
	}

	// Write all buffered records
	for _, record := range bw.buffer {
		if err := bw.parquetWriter.Write(record); err != nil {
			return fmt.Errorf("failed to write record: %w", err)
		}
	}

	// Clear buffer and update flush time
	bw.buffer = bw.buffer[:0]
	bw.lastFlush = time.Now()

	return nil
}

// rotateFileLocked closes current file and opens a new one
func (bw *BatchWriter[T]) rotateFileLocked() error {
	// Close existing writer
	if bw.parquetWriter != nil {
		if err := bw.parquetWriter.WriteStop(); err != nil {
			return fmt.Errorf("failed to close parquet writer: %w", err)
		}

		// Update total size with final file size
		if bw.currentFilePath != "" {
			if info, err := os.Stat(bw.currentFilePath); err == nil {
				newSize := info.Size()
				delta := newSize - bw.currentFileSize
				if delta > 0 {
					bw.totalSize += delta
				}
			}
		}
	}

	// Create new file
	bw.fileCounter++
	filename := filepath.Join(bw.outputDir, fmt.Sprintf("part-%04d.parquet", bw.fileCounter))

	// Create local file writer
	fw, err := local.NewLocalFileWriter(filename)
	if err != nil {
		return fmt.Errorf("failed to create file %s: %w", filename, err)
	}

	// Create parquet writer
	pw, err := writer.NewParquetWriter(fw, new(T), 4)
	if err != nil {
		fw.Close()
		return fmt.Errorf("failed to create parquet writer: %w", err)
	}

	pw.CompressionType = parquet.CompressionCodec_SNAPPY

	bw.currentFilePath = filename
	bw.parquetWriter = pw
	bw.currentFileSize = 0

	fmt.Printf("[INFO] Created new parquet file: %s\n", filename)

	return nil
}

// periodicFlush runs in background to flush based on time
func (bw *BatchWriter[T]) periodicFlush() {
	defer bw.wg.Done()

	for {
		select {
		case <-bw.flushTicker.C:
			bw.mu.Lock()
			if len(bw.buffer) > 0 && time.Since(bw.lastFlush) >= bw.flushInterval {
				if err := bw.flushLocked(); err != nil {
					fmt.Printf("[ERROR] Periodic flush failed: %v\n", err)
				}
			}
			bw.mu.Unlock()

		case <-bw.stopChan:
			return
		}
	}
}

// Close flushes remaining data and closes the writer
func (bw *BatchWriter[T]) Close() error {
	// Stop periodic flush
	close(bw.stopChan)
	bw.flushTicker.Stop()
	bw.wg.Wait()

	// Final flush
	if err := bw.Flush(); err != nil {
		return err
	}

	// Close parquet writer
	bw.mu.Lock()
	defer bw.mu.Unlock()

	if bw.parquetWriter != nil {
		if err := bw.parquetWriter.WriteStop(); err != nil {
			return err
		}
	}

	return nil
}
