package tasks

import (
	"bytes"
	"context"
	"errors"
	"fmt"
	"strings"
	"sync"
	"text/template"
	"time"
	"unicode/utf8"

	"github.com/reposurvey/pipeline/client"
	"github.com/reposurvey/pipeline/config"
	"github.com/reposurvey/pipeline/diff"
	"github.com/reposurvey/pipeline/models"
	"github.com/reposurvey/pipeline/parquet"
)

// TranslatedCommit represents a commit with its diffs translated to edits
type TranslatedCommit struct {
	SHA            string
	Message        string
	RefinedMessage string
	// Original diffs (for old format)
	Diffs []models.DiffPatch
	// Translated edits (for new format)
	Edits []diff.Edit
	// Translation errors (if any)
	TranslationErrors []string
}

// TranslatedPRData wraps LLMEnhancedPRData with translated commits
type TranslatedPRData struct {
	models.LLMEnhancedPRData
	TranslatedCommits []TranslatedCommit
}

// DefaultMaxContextExpand is the default maximum number of lines to expand for context uniqueness.
// Higher values improve success rate but increase search string size.
// Testing shows: maxExpand=10 -> 99.5%, maxExpand=20 -> 99.8%, maxExpand=30 -> 99.9%
const DefaultMaxContextExpand = 20

// TranslatePRDiffs translates all diffs in a PR to structured edits.
// It maintains a running state of file contents, updating them after each commit
// to ensure context expansion works correctly for sequential commits on the same file.
func TranslatePRDiffs(pr models.LLMEnhancedPRData) TranslatedPRData {
	return TranslatePRDiffsWithMaxExpand(pr, DefaultMaxContextExpand)
}

// TranslatePRDiffsWithMaxExpand translates all diffs in a PR to structured edits with custom maxExpand.
func TranslatePRDiffsWithMaxExpand(pr models.LLMEnhancedPRData, maxExpand int) TranslatedPRData {
	result := TranslatedPRData{
		LLMEnhancedPRData: pr,
		TranslatedCommits: make([]TranslatedCommit, 0, len(pr.Commits)),
	}

	// Build a map of file paths to their current content for context expansion.
	// This map is updated after each commit to reflect the state after applying edits.
	fileContentMap := make(map[string]string)
	for _, f := range pr.RelevantFiles {
		fileContentMap[f.Path] = f.Content
	}

	for _, commit := range pr.Commits {
		tc := TranslatedCommit{
			SHA:            commit.SHA,
			Message:        commit.Message,
			RefinedMessage: commit.RefinedMessage,
			Diffs:          commit.Diffs,
			Edits:          []diff.Edit{},
		}

		for _, d := range commit.Diffs {
			// Get current file content (may have been updated by previous commits)
			currentContent := fileContentMap[d.Path]

			// Translate with context expansion if we have the file content
			var translationResult diff.TranslationResult
			if currentContent != "" {
				translationResult = diff.TranslatePatchToEditsWithContext(d.Patch, d.Path, currentContent, maxExpand)
			} else {
				translationResult = diff.TranslatePatchToEdits(d.Patch, d.Path)
			}

			if translationResult.Success {
				tc.Edits = append(tc.Edits, translationResult.Edits...)

				// Update the file content map by applying the edits sequentially
				// This ensures subsequent commits see the updated file state
				for _, edit := range translationResult.Edits {
					if edit.Type == diff.EditTypeStrReplace && currentContent != "" {
						// Apply the edit to update the file content
						newContent, err := diff.ApplyEdit(&diff.EditCommand{
							Command: "str_replace",
							Path:    edit.Path,
							OldStr:  edit.OldContent,
							NewStr:  edit.NewContent,
						}, currentContent)
						if err == nil {
							fileContentMap[d.Path] = newContent
							currentContent = newContent // Update for next edit in same file
						}
						// If apply fails, keep the old content (best effort)
					}
				}
			} else {
				fmt.Printf("Translation Error on %s#%d: %s:%s\n", pr.RepoName, pr.PRID, d.Path, translationResult.Error)
				tc.TranslationErrors = append(tc.TranslationErrors,
					fmt.Sprintf("%s: %s", d.Path, translationResult.Error))
			}
		}

		result.TranslatedCommits = append(result.TranslatedCommits, tc)
	}

	return result
}

// renderTextJob represents a batch of LLM enhanced PRs to render
type renderTextJob struct {
	prs []models.LLMEnhancedPRData
}

// renderThroughputMonitor tracks and reports rendering pipeline throughput
type renderThroughputMonitor struct {
	mu           sync.Mutex
	prsProcessed int64
	prsRendered  int64
	startTime    time.Time
	writer       *parquet.ParallelBatchWriter[models.RenderedPRText]
}

func newRenderThroughputMonitor(writer *parquet.ParallelBatchWriter[models.RenderedPRText]) *renderThroughputMonitor {
	return &renderThroughputMonitor{
		startTime: time.Now(),
		writer:    writer,
	}
}

func (m *renderThroughputMonitor) addPRsProcessed(count int) {
	m.mu.Lock()
	defer m.mu.Unlock()
	m.prsProcessed += int64(count)
}

func (m *renderThroughputMonitor) addPRsRendered(count int) {
	m.mu.Lock()
	defer m.mu.Unlock()
	m.prsRendered += int64(count)
}

func (m *renderThroughputMonitor) report() {
	m.mu.Lock()
	defer m.mu.Unlock()

	elapsed := time.Since(m.startTime).Seconds()
	processRate := float64(m.prsProcessed) / elapsed
	renderRate := float64(m.prsRendered) / elapsed

	// Get data written size
	totalBytes := m.writer.GetTotalSize()
	totalGB := float64(totalBytes) / (1024 * 1024 * 1024)
	mbps := float64(totalBytes) / (1024 * 1024) / elapsed

	fmt.Printf("[THROUGHPUT] PRs Processed: %d (%.1f/s) | PRs Rendered: %d (%.1f/s) | Data Written: %.2f GB (%.2f MB/s) | Elapsed: %.1fs\n",
		m.prsProcessed, processRate, m.prsRendered, renderRate, totalGB, mbps, elapsed)
}

// Task5RenderText implements PR text rendering
type Task5RenderText struct {
	cfg    *config.Config
	writer *parquet.ParallelBatchWriter[models.RenderedPRText]

	// Channel for piping jobs from reader to workers
	jobChan chan renderTextJob

	// Throughput monitoring
	monitor *renderThroughputMonitor

	// Template for rendering
	tmpl *template.Template
}

// NewTask5RenderText creates a new PR text rendering task
func NewTask5RenderText(cfg *config.Config, client *client.GithubClient) (*Task5RenderText, error) {
	// Create rendered text writer
	writer, err := parquet.NewParallelBatchWriter[models.RenderedPRText](
		cfg.RenderedTextDir,
		cfg.PRBatchSize,
		cfg.MaxFileSize,
		cfg.FlushInterval,
		32, // 32 concurrent writers, 1 for debugging
	)
	if err != nil {
		return nil, fmt.Errorf("failed to create rendered text writer: %w", err)
	}

	// Parse template
	tmpl, err := template.New("pr_text").Parse(llmEnhancedDebugTemplate)
	if err != nil {
		return nil, fmt.Errorf("failed to parse template: %w", err)
	}

	return &Task5RenderText{
		cfg:     cfg,
		writer:  writer,
		jobChan: make(chan renderTextJob, cfg.OfflineConcurrency),
		monitor: newRenderThroughputMonitor(writer),
		tmpl:    tmpl,
	}, nil
}

// Run starts the PR text rendering process
func (t *Task5RenderText) Run(ctx context.Context) error {
	fmt.Println("[INFO] Starting Task 5: PR Text Rendering")

	// Create batch reader for LLM Enhanced PR data (from Task 4)
	reader, err := parquet.NewParallelBatchReader[models.LLMEnhancedPRData](t.cfg.LLMEnhancedPRsDir, t.cfg.PRBatchSize, t.cfg.OfflineConcurrency, 2)
	if err != nil {
		return fmt.Errorf("failed to create LLM enhanced PR reader: %w", err)
	}

	fmt.Printf("[INFO] Found %d LLM enhanced PR parquet files to process\n", reader.GetFileCount())

	// Start throughput monitor
	monitorCtx, monitorCancel := context.WithCancel(ctx)
	defer monitorCancel()
	go t.runThroughputMonitor(monitorCtx)

	// Start worker pool
	workersDone := make(chan error, 1)
	go func() {
		if err := t.runWorkers(ctx); err != nil {
			workersDone <- fmt.Errorf("workers error: %w", err)
		}
		close(workersDone)
	}()

	// Read and dispatch PR batches
	for {
		select {
		case <-ctx.Done():
			close(t.jobChan)
			return ctx.Err()
		default:
		}

		batch, hasMore, err := reader.ReadBatch()
		if err != nil {
			close(t.jobChan)
			return fmt.Errorf("failed to read enriched PR batch: %w", err)
		}

		if len(batch) > 0 {
			job := renderTextJob{
				prs: batch,
			}

			select {
			case t.jobChan <- job:
			case <-ctx.Done():
				close(t.jobChan)
				return ctx.Err()
			}

			t.monitor.addPRsProcessed(len(batch))
		}

		if !hasMore {
			break
		}

	}

	// Signal workers that no more jobs will be sent
	close(t.jobChan)

	// Wait for workers to complete
	if err := <-workersDone; err != nil {
		return err
	}

	// Final report
	t.monitor.report()
	fmt.Println("[INFO] Task 5 completed successfully")
	return nil
}

// runThroughputMonitor reports throughput statistics every 30 seconds
func (t *Task5RenderText) runThroughputMonitor(ctx context.Context) {
	ticker := time.NewTicker(30 * time.Second)
	defer ticker.Stop()

	for {
		select {
		case <-ctx.Done():
			t.monitor.report()
			return
		case <-ticker.C:
			t.monitor.report()
		}
	}
}

// runWorkers implements the worker pool for rendering PRs
func (t *Task5RenderText) runWorkers(ctx context.Context) error {
	workerCount := t.cfg.OfflineConcurrency
	fmt.Printf("[INFO] Starting %d workers for PR rendering\n", workerCount)

	errChan := make(chan error, workerCount)

	for i := 0; i < workerCount; i++ {
		go func(workerID int) {
			for job := range t.jobChan {
				if err := t.processJobBatch(ctx, job); err != nil {
					// Don't log errors during graceful shutdown (context canceled or writer closed)
					if !errors.Is(err, context.Canceled) && !errors.Is(err, parquet.ErrWriterClosed) {
						fmt.Printf("[ERROR] Worker %d failed to process batch: %v\n", workerID, err)
					}
				}
			}
			errChan <- nil
		}(i)
	}

	// Wait for all workers to complete
	for i := 0; i < workerCount; i++ {
		if err := <-errChan; err != nil {
			return err
		}
	}

	return nil
}

// processJobBatch renders a batch of PRs
func (t *Task5RenderText) processJobBatch(ctx context.Context, job renderTextJob) error {
	for _, pr := range job.prs {
		select {
		case <-ctx.Done():
			return ctx.Err()
		default:
		}

		// Render this PR
		renderedText, err := t.renderPR(pr)
		if err != nil {
			fmt.Printf("[WARN] Failed to render PR %s#%d: %v\n", pr.RepoName, pr.PRID, err)
			continue
		}

		// Write rendered data
		if err := t.writer.Write(models.RenderedPRText{
			PRID:     pr.PRID,
			RepoID:   pr.RepoID,
			RepoName: pr.RepoName,
			Text:     renderedText,
		}); err != nil {
			// Don't log errors during graceful shutdown (context canceled or writer closed)
			if !errors.Is(err, context.Canceled) && !errors.Is(err, parquet.ErrWriterClosed) {
				fmt.Printf("[ERROR] Failed to write rendered text for PR %s#%d: %v\n",
					pr.RepoName, pr.PRID, err)
			}
			continue
		}

		t.monitor.addPRsRendered(1)
	}

	return nil
}

// renderPR renders a single LLM enhanced PR to text using the template
func (t *Task5RenderText) renderPR(pr models.LLMEnhancedPRData) (string, error) {
	return RenderWithEdits(pr)
}

// Close closes all writers and resources
func (t *Task5RenderText) Close() error {
	if err := t.writer.Close(); err != nil {
		return fmt.Errorf("failed to close rendered text writer: %w", err)
	}
	return nil
}

// RenderPRText renders a PR to text
// and ensures the output contains only valid UTF-8
func RenderPRText(pr models.LLMEnhancedPRData) (string, error) {
	tmpl, err := template.New("pr_text").Parse(prTextTemplate)
	if err != nil {
		return "", err
	}
	var buf bytes.Buffer
	if err := tmpl.Execute(&buf, pr); err != nil {
		return "", err
	}

	// Sanitize text to ensure valid UTF-8
	text := buf.String()
	return sanitizeUTF8(text), nil
}

// RenderLLMEnhancement renders the LLM enhancement of a PR to text for manual inspection
func RenderLLMEnhancement(pr models.LLMEnhancedPRData) (string, error) {
	tmpl, err := template.New("pr_text").Parse(llmEnhancedDebugTemplate)
	if err != nil {
		return "", err
	}
	var buf bytes.Buffer
	if err := tmpl.Execute(&buf, pr); err != nil {
		return "", err
	}

	// Sanitize text to ensure valid UTF-8
	text := buf.String()
	return sanitizeUTF8(text), nil
}

// RenderWithEdits renders a PR with both old (patch) and new (edits) formats for comparison
func RenderWithEdits(pr models.LLMEnhancedPRData) (string, error) {
	// Translate diffs to edits
	translated := TranslatePRDiffs(pr)

	// Parse template with custom functions
	funcMap := template.FuncMap{
		"formatEdit": formatEditForTemplate,
		"joinLines": func(lines []string) string {
			const maxLines = 50
			if len(lines) > maxLines {
				truncated := lines[:maxLines]
				return strings.Join(truncated, "\n") + fmt.Sprintf("\n... (truncated, showing %d of %d files)", maxLines, len(lines))
			}
			return strings.Join(lines, "\n")
		},
	}

	tmpl, err := template.New("pr_with_edits").Funcs(funcMap).Parse(prWithEditsTemplate)
	if err != nil {
		return "", err
	}

	var buf bytes.Buffer
	if err := tmpl.Execute(&buf, translated); err != nil {
		return "", err
	}

	return sanitizeUTF8(buf.String()), nil
}

// formatEditForTemplate formats a single edit for template rendering.
// The format is designed to be readable and directly mappable to str_replace_editor commands.
func formatEditForTemplate(edit diff.Edit) string {
	var sb strings.Builder

	switch edit.Type {
	case diff.EditTypeStrReplace:
		sb.WriteString(fmt.Sprintf("Edit: %s\n", edit.Path))
		sb.WriteString("\nSearch:\n```\n")
		sb.WriteString(edit.OldContent)
		if !strings.HasSuffix(edit.OldContent, "\n") {
			sb.WriteString("\n")
		}
		sb.WriteString("```\n")
		sb.WriteString("\nReplace:\n```\n")
		// Use empty string directly for deletions (no placeholder text)
		if edit.NewContent != "" {
			sb.WriteString(edit.NewContent)
			if !strings.HasSuffix(edit.NewContent, "\n") {
				sb.WriteString("\n")
			}
		}
		sb.WriteString("```\n")

	case diff.EditTypeInsert:
		sb.WriteString(fmt.Sprintf("Insert: %s\n", edit.Path))
		sb.WriteString(fmt.Sprintf("\nInsert after line %d:\n```\n", edit.InsertLine))
		sb.WriteString(edit.NewContent)
		if !strings.HasSuffix(edit.NewContent, "\n") {
			sb.WriteString("\n")
		}
		sb.WriteString("```\n")

	case diff.EditTypeCreate:
		sb.WriteString(fmt.Sprintf("Create file: %s\n", edit.Path))
		sb.WriteString("\nContent:\n```\n")
		if edit.NewContent != "" {
			sb.WriteString(edit.NewContent)
			if !strings.HasSuffix(edit.NewContent, "\n") {
				sb.WriteString("\n")
			}
		}
		sb.WriteString("```\n")

	case diff.EditTypeDelete:
		sb.WriteString(fmt.Sprintf("Remove file: %s\n", edit.Path))

	case diff.EditTypeRename:
		sb.WriteString(fmt.Sprintf("Rename: %s\n", edit.OldPath))
		sb.WriteString(fmt.Sprintf("\nTo: %s\n", edit.Path))
	}

	return sb.String()
}

// sanitizeUTF8 ensures the string contains only valid UTF-8 by replacing invalid sequences
// with the Unicode replacement character (U+FFFD)
func sanitizeUTF8(s string) string {
	// Fast path: if already valid UTF-8, return as-is
	if utf8.ValidString(s) {
		return s
	}

	// Slow path: rebuild string with valid UTF-8
	var builder strings.Builder
	builder.Grow(len(s))

	for len(s) > 0 {
		r, size := utf8.DecodeRuneInString(s)
		builder.WriteRune(r)
		s = s[size:]
	}

	return builder.String()
}

const prTextTemplate = `# Repository Context

Name: {{.RepoName}}
Description: {{.RepoDesc}}

{{if .Issue}}# Issue

## {{.Issue.Title}}
{{.Issue.Body}}

{{range .Issue.Comments}}{{.Body}}
{{end}}
{{end}}# Pull Request

## {{.Title}}
{{.Body}}

# Relevant Files Found

{{range .RelevantFiles}}## {{.Path}}

` + "```" + `
{{.Content}}
` + "```" + `

{{end}}

# Commits

{{.PRSummary}}

{{range .Commits}}{{.RefinedMessage}}

patch
{{range .Diffs}}
File: {{.Path}}
{{.Patch}}
{{end}}

{{end}}`

// llmEnhancedDebugTemplate is the template for rendering LLM enhancement of a PR for manual inspection
const llmEnhancedDebugTemplate = `# Repository Context

Name: {{.RepoName}}
Description: {{.RepoDesc}}

# PR Summary
{{.PRSummary}}

{{if .Issue}}# Issue

## {{.Issue.Title}}
{{.Issue.Body}}

{{range .Issue.Comments}}{{.Body}}
{{end}}
{{end}}# Pull Request

## {{.Title}}
{{.Body}}

# Commits

{{range .Commits}}## Commit Message (Refined)
{{.RefinedMessage}}

## Original Message
{{.Message}}

patch
{{range .Diffs}}
File: {{.Path}}
{{.Patch}}
{{end}}

{{end}}`

// prWithEditsTemplate renders both old (patch) and new (edits) formats for comparison
const prWithEditsTemplate = `# Repository Context

Name: {{.RepoName}}
Description: {{.RepoDesc}}

{{if .Issue}}# Issue

## {{.Issue.Title}}
{{.Issue.Body}}

{{range .Issue.Comments}}{{.Body}}
{{end}}
{{end}}# Pull Request

## {{.Title}}
{{.Body}}

# Relevant Files Found

{{range .RelevantFiles}}## {{.Path}}

` + "```" + `
{{.Content}}
` + "```" + `

{{end}}

# Edits

{{.PRSummary}}

{{range .TranslatedCommits}}
{{.RefinedMessage}}

{{if .TranslationErrors}}{{range .TranslationErrors}}- {{.}}
{{end}}
{{end}}{{range .Edits}}{{formatEdit .}}
{{end}}

{{end}}`
