package tasks

import (
	"bytes"
	"context"
	"errors"
	"fmt"
	"strings"
	"sync"
	"text/template"
	"time"

	"github.com/reposurvey/pipeline/client"
	"github.com/reposurvey/pipeline/config"
	"github.com/reposurvey/pipeline/models"
	"github.com/reposurvey/pipeline/parquet"
)

// truncatePatch truncates a patch string to maxLen characters
func truncatePatch(patch string, maxLen int) string {
	if len(patch) > maxLen {
		return patch[:maxLen] + "\n... (truncated)"
	}
	return patch
}

// enhancePRJob represents a single PR to enhance with LLM
type enhancePRJob struct {
	pr models.EnrichedPRData
}

// enhanceThroughputMonitor tracks and reports enhancement pipeline throughput
type enhanceThroughputMonitor struct {
	mu           sync.Mutex
	prsProcessed int64
	prsEnhanced  int64
	prsFailed    int64
	startTime    time.Time
	writer       *parquet.ParallelBatchWriter[models.LLMEnhancedPRData]
	llmClient    *client.LLMClient
}

func newEnhanceThroughputMonitor(writer *parquet.ParallelBatchWriter[models.LLMEnhancedPRData], llmClient *client.LLMClient) *enhanceThroughputMonitor {
	return &enhanceThroughputMonitor{
		startTime: time.Now(),
		writer:    writer,
		llmClient: llmClient,
	}
}

func (m *enhanceThroughputMonitor) addPRsProcessed(count int) {
	m.mu.Lock()
	defer m.mu.Unlock()
	m.prsProcessed += int64(count)
}

func (m *enhanceThroughputMonitor) addPRsEnhanced(count int) {
	m.mu.Lock()
	defer m.mu.Unlock()
	m.prsEnhanced += int64(count)
}

func (m *enhanceThroughputMonitor) addPRsFailed(count int) {
	m.mu.Lock()
	defer m.mu.Unlock()
	m.prsFailed += int64(count)
}

func (m *enhanceThroughputMonitor) report() {
	m.mu.Lock()
	defer m.mu.Unlock()

	elapsed := time.Since(m.startTime).Seconds()
	processRate := float64(m.prsProcessed) / elapsed
	enhanceRate := float64(m.prsEnhanced) / elapsed

	// Get data written size
	totalBytes := m.writer.GetTotalSize()
	totalGB := float64(totalBytes) / (1024 * 1024 * 1024)
	mbps := float64(totalBytes) / (1024 * 1024) / elapsed

	// Get LLM throughput statistics
	llmStats := m.llmClient.GetStats()
	llmReqRate := float64(llmStats.FinishedRequests) / elapsed
	promptTokenRate := float64(llmStats.TotalPromptTokens) / elapsed
	completionTokenRate := float64(llmStats.TotalCompletionTokens) / elapsed

	fmt.Printf("[THROUGHPUT] PRs: %d (%.1f/s) | Enhanced: %d (%.1f/s) | Failed: %d | Data: %.2f GB (%.2f MB/s) | Elapsed: %.1fs\n",
		m.prsProcessed, processRate, m.prsEnhanced, enhanceRate, m.prsFailed, totalGB, mbps, elapsed)
	fmt.Printf("[LLM STATS]  Requests: %d (%.1f/s) | Prompt: %d (%.1f/s) | Completion: %d (%.1f/s) | Total: %d\n",
		llmStats.FinishedRequests, llmReqRate, llmStats.TotalPromptTokens, promptTokenRate, llmStats.TotalCompletionTokens, completionTokenRate, llmStats.TotalTokens)
}

// Task4LLMEnhance implements LLM-based PR enhancement
type Task4LLMEnhance struct {
	cfg       *config.Config
	llmClient *client.LLMClient
	writer    *parquet.ParallelBatchWriter[models.LLMEnhancedPRData]

	// Channel for piping jobs from reader to workers (1 PR = 1 job)
	jobChan chan enhancePRJob

	// Throughput monitoring
	monitor *enhanceThroughputMonitor

	// Templates for LLM prompts
	summaryTmpl      *template.Template
	commitRefineTmpl *template.Template
}

// Hardcoded LLM generation parameters
const (
	// Max tokens for PR summary generation
	llmSummaryMaxTokens = 512
	// Max tokens for commit message refinement
	llmCommitRefineMaxTokens = 256
)

// NewTask4LLMEnhance creates a new LLM enhancement task
func NewTask4LLMEnhance(cfg *config.Config) (*Task4LLMEnhance, error) {
	// Create LLM client with configurable timeout
	llmCfg := client.LLMConfig{
		BaseURL:        cfg.LLMBaseURL,
		APIKey:         cfg.LLMAPIKey,
		Model:          cfg.LLMModel,
		TimeoutSeconds: cfg.LLMTimeoutSeconds,
	}
	llmClient := client.NewLLMClient(llmCfg)

	// Create enhanced PR writer
	writer, err := parquet.NewParallelBatchWriter[models.LLMEnhancedPRData](
		cfg.LLMEnhancedPRsDir,
		cfg.PRBatchSize,
		cfg.MaxFileSize,
		cfg.FlushInterval,
		32, // 32 concurrent writers
	)
	if err != nil {
		return nil, fmt.Errorf("failed to create LLM enhanced PR writer: %w", err)
	}

	// Template functions
	funcMap := template.FuncMap{
		"truncatePatch": truncatePatch,
	}

	// Parse templates
	summaryTmpl, err := template.New("summary").Parse(prSummaryPromptTemplate)
	if err != nil {
		return nil, fmt.Errorf("failed to parse summary template: %w", err)
	}

	commitRefineTmpl, err := template.New("commit_refine").Funcs(funcMap).Parse(commitRefinePromptTemplate)
	if err != nil {
		return nil, fmt.Errorf("failed to parse commit refine template: %w", err)
	}

	return &Task4LLMEnhance{
		cfg:              cfg,
		llmClient:        llmClient,
		writer:           writer,
		jobChan:          make(chan enhancePRJob, cfg.LLMConcurrency),
		monitor:          newEnhanceThroughputMonitor(writer, llmClient),
		summaryTmpl:      summaryTmpl,
		commitRefineTmpl: commitRefineTmpl,
	}, nil
}

// Run starts the LLM enhancement process
func (t *Task4LLMEnhance) Run(ctx context.Context) error {
	fmt.Println("[INFO] Starting Task 4: LLM Enhancement")

	// Create batch reader for Enriched PR data (from Task 3)
	reader, err := parquet.NewParallelBatchReader[models.EnrichedPRData](t.cfg.EnrichedPRsDir, t.cfg.PRBatchSize, t.cfg.OfflineConcurrency, 2)
	if err != nil {
		return fmt.Errorf("failed to create enriched PR reader: %w", err)
	}

	fmt.Printf("[INFO] Found %d enriched PR parquet files to process\n", reader.GetFileCount())

	// Start throughput monitor
	monitorCtx, monitorCancel := context.WithCancel(ctx)
	defer monitorCancel()
	go t.runThroughputMonitor(monitorCtx)

	// Start worker pool
	workersDone := make(chan error, 1)
	go func() {
		if err := t.runWorkers(ctx); err != nil {
			workersDone <- fmt.Errorf("workers error: %w", err)
		}
		close(workersDone)
	}()

	// Read and dispatch PR jobs (1 PR = 1 job)
	for {
		select {
		case <-ctx.Done():
			close(t.jobChan)
			return ctx.Err()
		default:
		}

		batch, hasMore, err := reader.ReadBatch()
		if err != nil {
			close(t.jobChan)
			return fmt.Errorf("failed to read enriched PR batch: %w", err)
		}

		// Dispatch each PR as an individual job
		for _, pr := range batch {
			job := enhancePRJob{pr: pr}

			select {
			case t.jobChan <- job:
			case <-ctx.Done():
				close(t.jobChan)
				return ctx.Err()
			}

			t.monitor.addPRsProcessed(1)
		}

		if !hasMore {
			break
		}
	}

	// Signal workers that no more jobs will be sent
	close(t.jobChan)

	// Wait for workers to complete
	if err := <-workersDone; err != nil {
		return err
	}

	// Final report
	t.monitor.report()
	fmt.Println("[INFO] Task 4 completed successfully")
	return nil
}

// runThroughputMonitor reports throughput statistics every 30 seconds
func (t *Task4LLMEnhance) runThroughputMonitor(ctx context.Context) {
	ticker := time.NewTicker(30 * time.Second)
	defer ticker.Stop()

	for {
		select {
		case <-ctx.Done():
			t.monitor.report()
			return
		case <-ticker.C:
			t.monitor.report()
		}
	}
}

// runWorkers implements the worker pool for enhancing PRs
func (t *Task4LLMEnhance) runWorkers(ctx context.Context) error {
	workerCount := t.cfg.LLMConcurrency
	fmt.Printf("[INFO] Starting %d workers for LLM enhancement\n", workerCount)

	errChan := make(chan error, workerCount)

	for i := 0; i < workerCount; i++ {
		go func(workerID int) {
			for job := range t.jobChan {
				if err := t.processJob(ctx, job); err != nil {
					// Don't log errors during graceful shutdown (context canceled or writer closed)
					if !errors.Is(err, context.Canceled) && !errors.Is(err, parquet.ErrWriterClosed) {
						fmt.Printf("[ERROR] Worker %d failed to process PR %s#%d: %v\n", workerID, job.pr.RepoName, job.pr.PRID, err)
					}
					t.monitor.addPRsFailed(1)
				}
			}
			errChan <- nil
		}(i)
	}

	// Wait for all workers to complete
	for i := 0; i < workerCount; i++ {
		if err := <-errChan; err != nil {
			return err
		}
	}

	return nil
}

// processJob enhances a single PR with LLM
func (t *Task4LLMEnhance) processJob(ctx context.Context, job enhancePRJob) error {
	pr := job.pr

	// Step 1: Generate PR summary
	summary, err := t.generatePRSummary(ctx, pr)
	if err != nil {
		return fmt.Errorf("failed to generate summary: %w", err)
	}

	// Step 2: Refine each commit message
	enhancedCommits := make([]models.EnhancedCommitInfo, 0, len(pr.Commits))
	for _, commit := range pr.Commits {
		refinedMessage, err := t.refineCommitMessage(ctx, pr, summary, commit)
		if err != nil {
			// Skip logging if context was cancelled (graceful shutdown)
			if !errors.Is(err, context.Canceled) {
				fmt.Printf("[WARN] Failed to refine commit %s for PR %s#%d: %v\n", commit.SHA[:8], pr.RepoName, pr.PRID, err)
			}
			refinedMessage = commit.Message
		}

		enhancedCommits = append(enhancedCommits, models.EnhancedCommitInfo{
			SHA:            commit.SHA,
			Author:         commit.Author,
			Timestamp:      commit.Timestamp,
			Diffs:          commit.Diffs,
			Message:        commit.Message,
			RefinedMessage: refinedMessage,
		})
	}

	// Step 3: Build enhanced PR data
	enhancedPR := models.LLMEnhancedPRData{
		PRID:              pr.PRID,
		RepoID:            pr.RepoID,
		RepoName:          pr.RepoName,
		RepoDesc:          pr.RepoDesc,
		Title:             pr.Title,
		Body:              pr.Body,
		Issue:             pr.Issue,
		RelatedIssueCount: pr.RelatedIssueCount,
		ChangedPyFiles:    pr.ChangedPyFiles,
		RelevantFiles:     pr.RelevantFiles,
		Commits:           enhancedCommits,
		PRSummary:         summary,
	}

	// Step 4: Write enhanced data
	if err := t.writer.Write(enhancedPR); err != nil {
		// Don't wrap ErrWriterClosed - it's expected during graceful shutdown
		if errors.Is(err, parquet.ErrWriterClosed) {
			return err
		}
		return fmt.Errorf("failed to write enhanced PR: %w", err)
	}

	t.monitor.addPRsEnhanced(1)
	return nil
}

// generatePRSummary generates a summary of the entire PR using LLM
func (t *Task4LLMEnhance) generatePRSummary(ctx context.Context, pr models.EnrichedPRData) (string, error) {
	// Build prompt from template
	var buf bytes.Buffer
	if err := t.summaryTmpl.Execute(&buf, pr); err != nil {
		return "", fmt.Errorf("failed to execute summary template: %w", err)
	}

	prompt := buf.String()

	// Call LLM with summary-specific max tokens
	summary, err := t.llmClient.Generate(ctx, prompt, llmSummaryMaxTokens)
	if err != nil {
		return "", err
	}

	return strings.TrimSpace(summary), nil
}

// refineCommitMessage refines a commit message using LLM with PR context
func (t *Task4LLMEnhance) refineCommitMessage(ctx context.Context, pr models.EnrichedPRData, summary string, commit models.CommitInfo) (string, error) {
	// Build template data
	data := struct {
		Summary string
		Commit  models.CommitInfo
	}{
		Summary: summary,
		Commit:  commit,
	}

	// Build prompt from template
	var buf bytes.Buffer
	if err := t.commitRefineTmpl.Execute(&buf, data); err != nil {
		return "", fmt.Errorf("failed to execute commit refine template: %w", err)
	}

	prompt := buf.String()

	// Call LLM with commit-refine-specific max tokens
	refined, err := t.llmClient.Generate(ctx, prompt, llmCommitRefineMaxTokens)
	if err != nil {
		return "", err
	}

	return strings.TrimSpace(refined), nil
}

// Close closes all writers and resources
func (t *Task4LLMEnhance) Close() error {
	if err := t.writer.Close(); err != nil {
		return fmt.Errorf("failed to close LLM enhanced PR writer: %w", err)
	}
	return nil
}

// PR Summary Prompt Template
const prSummaryPromptTemplate = `Summarize this pull request in 1-4 clear sentences:

Repository: {{.RepoName}}
Description: {{.RepoDesc}}

PR Title: {{.Title}}
PR Description:
{{.Body}}

{{if .Issue}}Related Issue: {{.Issue.Title}}
{{.Issue.Body}}

{{end}}Changed Files:
{{range .ChangedPyFiles}}- {{.}}
{{end}}

Commits:
{{range .Commits}}
## Message: {{.Message}}

Changes:
{{range .Diffs}}
File: {{.Path}}
{{.Patch}}
{{end}}
{{end}}

Please provide a clear and concise summary (1-4 sentences) of this Pull Request, focusing on:
1. What problem does it solve or what feature does it add?
2. What are the key changes made?
3. Any important implementation details?

Summary:`

// Commit Message Refinement Prompt Template
const commitRefinePromptTemplate = `Optimize this commit message for clarity and educational value while keeping it concise.

PR Context Summary: {{.Summary}}

Original commit message:
{{.Commit.Message}}

Diff Context:
{{range .Commit.Diffs}}File: {{.Path}}
{{truncatePatch .Patch 2000}}

{{end}}
Provide an optimized version that:
1. The subject is clear and descriptive
2. If the commit is trivial and the changes are minimal, don't add the footer
3. Otherwise, keep the footer in one sentence

Refined commit message:`
