"""
Grading comparison views for analyzing consistency between multiple graders.

Provides admin-only views to:
- List questions with multiple grading sessions
- Compare gradings side-by-side
- View statistical agreement metrics
- Export comparison data as CSV
"""

from django.views.generic import ListView, DetailView, View
from django.contrib.auth.mixins import LoginRequiredMixin
from django.shortcuts import get_object_or_404
from django.http import HttpResponse, JsonResponse
from django.db.models import Count, Q
import csv
from collections import defaultdict

from .models import Question
from model_evaluation.models import (
    ModelGradingSession, ModelGrading, ModelGradingAlias
)
from accounts.permissions import AdminRequiredMixin
from .grading_statistics import calculate_agreement


def sanitize_csv_value(value):
    """
    Sanitize a value for safe CSV export.

    Prevents CSV injection attacks by prefixing potentially dangerous
    values with a single quote, which Excel treats as a text indicator.

    Dangerous characters that can trigger formula execution:
    - = (formula)
    - + (formula)
    - - (formula/negative)
    - @ (function)
    - \\t (tab - can be used in injection)
    - \\r (carriage return - can be used in injection)
    """
    if value is None:
        return value

    str_value = str(value)
    if str_value and str_value[0] in ('=', '+', '-', '@', '\t', '\r'):
        return "'" + str_value
    return str_value


class GradingComparisonListView(AdminRequiredMixin, ListView):
    """
    List all questions that have multiple grading sessions.

    Shows:
    - Question title and author
    - Number of graders
    - Number of grading sessions
    - Quick agreement metrics (if 2 sessions)
    - Links to detailed comparison
    """
    template_name = 'questions/grading_comparison_list.html'
    context_object_name = 'questions'
    paginate_by = 20

    def get_queryset(self):
        """Get questions with 2+ finalized grading sessions."""
        # Annotate questions with count of finalized sessions
        questions = Question.objects.annotate(
            finalized_session_count=Count(
                'modelgradingsession',
                filter=Q(modelgradingsession__session_status='finalized'),
                distinct=True
            ),
            grader_count=Count(
                'modelgradingsession__grader',
                filter=Q(modelgradingsession__session_status='finalized'),
                distinct=True
            )
        ).filter(
            finalized_session_count__gte=2  # Only questions with 2+ finalized sessions
        ).select_related('author').order_by('-id')

        return questions

    def get_context_data(self, **kwargs):
        context = super().get_context_data(**kwargs)

        # Add session details for each question (only finalized sessions)
        questions_with_sessions = []
        for question in context['questions']:
            sessions = ModelGradingSession.objects.filter(
                question=question,
                session_status='finalized'
            ).select_related('grader').order_by('created_at')

            # Get grader names
            graders = []
            for session in sessions:
                grader_name = session.grader.get_full_name() or session.grader.email
                graders.append({
                    'name': grader_name,
                    'session_id': session.id,
                    'status': session.session_status,
                    'is_finalized': session.is_finalized,
                })

            # Calculate quick agreement if exactly 2 sessions
            quick_agreement = None
            progress_exact_agreement = None
            progress_within1_agreement = None
            progress_mean_diff = None

            if sessions.count() == 2:
                s1_gradings = ModelGrading.objects.filter(session=sessions[0])
                s2_gradings = ModelGrading.objects.filter(session=sessions[1])

                if s1_gradings.exists() and s2_gradings.exists():
                    stats = calculate_agreement(s1_gradings, s2_gradings)
                    quick_agreement = stats.get('overall_agreement')

                    # Get progress grade agreement
                    prog_agreement = stats.get('progress_agreement', {})
                    if prog_agreement:
                        progress_exact_agreement = prog_agreement.get('exact_agreement_pct')
                        progress_within1_agreement = prog_agreement.get('within_1_agreement_pct')
                        progress_mean_diff = prog_agreement.get('mean_absolute_difference')

            questions_with_sessions.append({
                'question': question,
                'graders': graders,
                'session_count': sessions.count(),
                'quick_agreement': quick_agreement,
                'progress_exact_agreement': progress_exact_agreement,
                'progress_within1_agreement': progress_within1_agreement,
                'progress_mean_diff': progress_mean_diff,
            })

        context['questions_with_sessions'] = questions_with_sessions

        # Category labels for display
        context['category_labels'] = {
            'error_incorrect_logic': 'Incorrect Logic',
            'error_hallucinated': 'Hallucinated Facts',
            'error_calculation': 'Calculation Error',
            'error_conceptual': 'Conceptual Error',
            'achievement_understanding': 'Problem Understanding',
            'achievement_correct_result': 'Correct End Result',
            'achievement_insight': 'Mathematical Insight',
            'achievement_usefulness': 'Useful Progress',
        }

        # Calculate global statistics across ALL questions (not just paginated ones)
        # Get the full unpaginated queryset for global statistics
        all_questions = self.get_queryset()

        if all_questions.exists():
            total_questions = all_questions.count()

            # Calculate global statistics from ALL questions
            overall_agreements = []
            progress_diffs = []
            category_aggregates = defaultdict(lambda: {'total_agreements': 0, 'total_comparisons': 0})
            total_exact_matches = 0
            total_within1_matches = 0
            total_progress_comparisons = 0
            difference_distribution = {0: 0, 1: 0, 2: 0, 3: 0}

            for question in all_questions:
                sessions = ModelGradingSession.objects.filter(
                    question=question,
                    session_status='finalized'
                ).order_by('created_at')

                if sessions.count() == 2:
                    s1_gradings = ModelGrading.objects.filter(session=sessions[0])
                    s2_gradings = ModelGrading.objects.filter(session=sessions[1])

                    if s1_gradings.exists() and s2_gradings.exists():
                        stats = calculate_agreement(s1_gradings, s2_gradings)

                        # Collect overall agreement
                        overall_agreements.append(stats['overall_agreement'])

                        # Collect category agreements
                        for cat_key, cat_stats in stats['category_agreements'].items():
                            category_aggregates[cat_key]['total_agreements'] += cat_stats['agreements']
                            category_aggregates[cat_key]['total_comparisons'] += cat_stats['total']

                        # Collect progress grade statistics
                        prog_agreement = stats.get('progress_agreement', {})
                        if prog_agreement and prog_agreement.get('n_compared', 0) > 0:
                            n_compared = prog_agreement['n_compared']
                            total_progress_comparisons += n_compared

                            mean_diff = prog_agreement.get('mean_absolute_difference')
                            if mean_diff is not None:
                                progress_diffs.append(mean_diff)

                            # Calculate exact counts
                            exact_count = round(prog_agreement['exact_agreement_pct'] / 100 * n_compared)
                            within1_count = round(prog_agreement['within_1_agreement_pct'] / 100 * n_compared)

                            total_exact_matches += exact_count
                            total_within1_matches += within1_count

                            # Calculate actual difference distribution
                            # We need to look at individual answer pairs to get accurate distribution
                            s1_map = {g.model_answer_id: g for g in s1_gradings}
                            s2_map = {g.model_answer_id: g for g in s2_gradings}
                            common_ids = set(s1_map.keys()) & set(s2_map.keys())

                            for answer_id in common_ids:
                                g1 = s1_map[answer_id]
                                g2 = s2_map[answer_id]

                                if g1.progress_grade is not None and g2.progress_grade is not None:
                                    diff = abs(g1.progress_grade - g2.progress_grade)
                                    difference_distribution[diff] += 1

            # Only create global stats if we have data
            if overall_agreements:
                # 1. Summary Dashboard
                context['global_stats'] = {
                    'total_questions': total_questions,
                    'avg_overall_agreement': round(sum(overall_agreements) / len(overall_agreements), 1),
                    'avg_progress_diff': round(sum(progress_diffs) / len(progress_diffs), 2) if progress_diffs else None,
                    'median_progress_diff': round(sorted(progress_diffs)[len(progress_diffs) // 2], 2) if progress_diffs else None,
                }

                # 2. Agreement Distribution
                high_agreement = sum(1 for a in overall_agreements if a >= 80)
                moderate_agreement = sum(1 for a in overall_agreements if 60 <= a < 80)
                low_agreement = sum(1 for a in overall_agreements if a < 60)

                context['agreement_distribution'] = {
                    'high': {'count': high_agreement, 'pct': round(high_agreement / len(overall_agreements) * 100, 1)},
                    'moderate': {'count': moderate_agreement, 'pct': round(moderate_agreement / len(overall_agreements) * 100, 1)},
                    'low': {'count': low_agreement, 'pct': round(low_agreement / len(overall_agreements) * 100, 1)},
                }

                # 3. Category-Level Analysis
                category_stats = {}
                for cat_key, agg in category_aggregates.items():
                    if agg['total_comparisons'] > 0:
                        category_stats[cat_key] = round(agg['total_agreements'] / agg['total_comparisons'] * 100, 1)
                    else:
                        category_stats[cat_key] = None

                # Sort by agreement (lowest first to highlight problem areas)
                sorted_categories = sorted(category_stats.items(), key=lambda x: x[1] if x[1] is not None else 0)
                context['category_stats'] = sorted_categories

                # 4. Progress Grade Statistics
                context['progress_grade_stats'] = {
                    'exact_match_pct': round(total_exact_matches / total_progress_comparisons * 100, 1) if total_progress_comparisons > 0 else None,
                    'within1_match_pct': round(total_within1_matches / total_progress_comparisons * 100, 1) if total_progress_comparisons > 0 else None,
                    'total_comparisons': total_progress_comparisons,
                    'difference_distribution': difference_distribution,
                }

        return context


class GradingComparisonDetailView(AdminRequiredMixin, DetailView):
    """
    Detailed comparison of grading sessions for a specific question.

    Shows:
    - Side-by-side comparison of all grading sessions
    - Agreement statistics per category
    - Overall reliability metrics
    - Highlighting of disagreements
    """
    template_name = 'questions/grading_comparison_detail.html'
    context_object_name = 'question'
    model = Question
    pk_url_kwarg = 'question_id'

    def get_context_data(self, **kwargs):
        context = super().get_context_data(**kwargs)

        # Get all finalized sessions for this question
        sessions = ModelGradingSession.objects.filter(
            question=self.object,
            session_status='finalized'
        ).select_related('grader').order_by('created_at')

        context['sessions'] = sessions

        # Get all gradings organized by session
        sessions_data = []
        for session in sessions:
            gradings = ModelGrading.objects.filter(
                session=session
            ).select_related('model_answer__model')

            aliases = ModelGradingAlias.objects.filter(
                session=session
            ).select_related('model_answer')

            # Create alias lookup
            alias_map = {a.model_answer_id: a for a in aliases}

            sessions_data.append({
                'session': session,
                'grader_name': session.grader.get_full_name() or session.grader.email,
                'gradings': gradings,
                'alias_map': alias_map,
            })

        context['sessions_data'] = sessions_data

        # Build comparison matrix (answer x grader)
        # Get all unique model answers that have been graded
        all_answer_ids = set()
        for session_data in sessions_data:
            all_answer_ids.update(g.model_answer_id for g in session_data['gradings'])

        # Build matrix data
        comparison_matrix = []
        for answer_id in sorted(all_answer_ids):
            row = {'answer_id': answer_id}

            # Get model name from first session that has this answer
            for session_data in sessions_data:
                for grading in session_data['gradings']:
                    if grading.model_answer_id == answer_id:
                        row['model_name'] = grading.model_answer.model.display_name or grading.model_answer.model.model_name
                        break
                if 'model_name' in row:
                    break

            # Get gradings from each session
            row['session_gradings'] = []
            for session_data in sessions_data:
                grading = next((g for g in session_data['gradings'] if g.model_answer_id == answer_id), None)
                alias = session_data['alias_map'].get(answer_id)

                row['session_gradings'].append({
                    'grading': grading,
                    'alias': alias.alias if alias else None,
                })

            comparison_matrix.append(row)

        context['comparison_matrix'] = comparison_matrix

        # Calculate pairwise statistics between all session pairs
        pairwise_stats = []
        for i in range(len(sessions_data)):
            for j in range(i + 1, len(sessions_data)):
                s1_data = sessions_data[i]
                s2_data = sessions_data[j]

                stats = calculate_agreement(s1_data['gradings'], s2_data['gradings'])

                pairwise_stats.append({
                    'grader1': s1_data['grader_name'],
                    'grader2': s2_data['grader_name'],
                    'session1_id': s1_data['session'].id,
                    'session2_id': s2_data['session'].id,
                    'stats': stats,
                })

        context['pairwise_stats'] = pairwise_stats

        # Category labels for display
        context['category_labels'] = {
            'error_incorrect_logic': 'Incorrect Logic',
            'error_hallucinated': 'Hallucinated Facts',
            'error_calculation': 'Calculation Error',
            'error_conceptual': 'Conceptual Error',
            'achievement_understanding': 'Problem Understanding',
            'achievement_correct_result': 'Correct End Result',
            'achievement_insight': 'Mathematical Insight',
            'achievement_usefulness': 'Useful Progress',
        }

        return context


class GradingComparisonExportView(AdminRequiredMixin, View):
    """Export grading comparison data as CSV."""

    def get(self, request, question_id):
        """Generate CSV export of grading comparison."""
        question = get_object_or_404(Question, pk=question_id)

        # Create HTTP response with CSV header
        response = HttpResponse(content_type='text/csv')
        response['Content-Disposition'] = f'attachment; filename="grading_comparison_q{question_id}.csv"'

        writer = csv.writer(response)

        # Get all finalized sessions
        sessions = ModelGradingSession.objects.filter(
            question=question,
            session_status='finalized'
        ).select_related('grader').order_by('created_at')

        if sessions.count() < 2:
            writer.writerow(['Error: Question must have at least 2 finalized grading sessions'])
            return response

        # Write header
        header = ['Model Answer', 'Model Name']

        # Categories
        categories = [
            'error_incorrect_logic',
            'error_hallucinated',
            'error_calculation',
            'error_conceptual',
            'achievement_understanding',
            'achievement_correct_result',
            'achievement_insight',
            'achievement_usefulness',
            'progress_grade',
        ]

        category_labels = {
            'error_incorrect_logic': 'Incorrect Logic',
            'error_hallucinated': 'Hallucinated Facts',
            'error_calculation': 'Calculation Error',
            'error_conceptual': 'Conceptual Error',
            'achievement_understanding': 'Problem Understanding',
            'achievement_correct_result': 'Correct End Result',
            'achievement_insight': 'Mathematical Insight',
            'achievement_usefulness': 'Useful Progress',
            'progress_grade': 'Progress Grade',
        }

        # Add columns for each grader and each category
        for session in sessions:
            grader_id = f'User {session.grader.id}'
            header.append(f'{grader_id} - Alias')
            for cat in categories:
                header.append(f'{grader_id} - {category_labels[cat]}')

        writer.writerow(header)

        # Get all answer IDs
        all_answer_ids = set()
        sessions_data = {}

        for session in sessions:
            gradings = ModelGrading.objects.filter(session=session).select_related('model_answer__model')
            aliases = ModelGradingAlias.objects.filter(session=session)

            alias_map = {a.model_answer_id: a.alias for a in aliases}
            grading_map = {g.model_answer_id: g for g in gradings}

            sessions_data[session.id] = {
                'alias_map': alias_map,
                'grading_map': grading_map,
            }

            all_answer_ids.update(alias_map.keys())

        # Write data rows
        for answer_id in sorted(all_answer_ids):
            row = [answer_id]

            # Get model name
            model_name = None
            for session_id, data in sessions_data.items():
                if answer_id in data['grading_map']:
                    grading = data['grading_map'][answer_id]
                    model_name = grading.model_answer.model.display_name or grading.model_answer.model.model_name
                    break

            row.append(sanitize_csv_value(model_name) or 'Unknown')

            # Add grading data for each session
            for session in sessions:
                data = sessions_data[session.id]

                # Alias
                alias = data['alias_map'].get(answer_id, 'N/A')
                row.append(alias)

                # Grading values
                if answer_id in data['grading_map']:
                    grading = data['grading_map'][answer_id]

                    for cat in categories:
                        if cat == 'progress_grade':
                            value = grading.progress_grade if grading.progress_grade is not None else 'N/A'
                        else:
                            state = getattr(grading, cat)
                            if state is None:
                                value = 'N/A'
                            else:
                                value = state.state_code

                        row.append(value)
                else:
                    # No grading for this answer in this session
                    row.extend(['N/A'] * len(categories))

            writer.writerow(row)

        return response


class AgreementDistributionExportView(AdminRequiredMixin, View):
    """Export per-question overall agreement as clean CSV."""

    def get(self, request):
        """Generate CSV with one row per question comparison."""
        response = HttpResponse(content_type='text/csv')
        response['Content-Disposition'] = 'attachment; filename="agreement_distribution.csv"'

        writer = csv.writer(response)

        # Header
        writer.writerow(['Question ID', 'Title', 'Grader 1', 'Grader 2', 'Overall Agreement %',
                        'Progress Correlation', 'Progress Mean Diff', 'Answers Compared'])

        # Get all questions with 2+ finalized sessions
        all_questions = Question.objects.annotate(
            finalized_session_count=Count(
                'modelgradingsession',
                filter=Q(modelgradingsession__session_status='finalized'),
                distinct=True
            )
        ).filter(finalized_session_count__gte=2)

        for question in all_questions:
            sessions = ModelGradingSession.objects.filter(
                question=question,
                session_status='finalized'
            ).select_related('grader').order_by('created_at')

            if sessions.count() == 2:
                s1 = sessions[0]
                s2 = sessions[1]
                s1_gradings = ModelGrading.objects.filter(session=s1)
                s2_gradings = ModelGrading.objects.filter(session=s2)

                if s1_gradings.exists() and s2_gradings.exists():
                    stats = calculate_agreement(s1_gradings, s2_gradings)

                    grader1_id = s1.grader.id
                    grader2_id = s2.grader.id

                    prog_agreement = stats.get('progress_agreement', {})

                    writer.writerow([
                        question.id,
                        sanitize_csv_value(question.title),
                        grader1_id,
                        grader2_id,
                        stats['overall_agreement'],
                        stats.get('progress_correlation') or 'N/A',
                        prog_agreement.get('mean_absolute_difference') or 'N/A',
                        stats['n_compared']
                    ])

        return response


class AgreementDistributionSummaryExportView(AdminRequiredMixin, View):
    """Export agreement distribution summary (high/moderate/low) as clean CSV."""

    def get(self, request):
        """Generate CSV with agreement level distribution."""
        response = HttpResponse(content_type='text/csv')
        response['Content-Disposition'] = 'attachment; filename="agreement_distribution_summary.csv"'

        writer = csv.writer(response)

        # Header
        writer.writerow(['Agreement Level', 'Count', 'Percentage'])

        # Get all questions with 2+ finalized sessions
        all_questions = Question.objects.annotate(
            finalized_session_count=Count(
                'modelgradingsession',
                filter=Q(modelgradingsession__session_status='finalized'),
                distinct=True
            )
        ).filter(finalized_session_count__gte=2)

        question_agreements = []

        for question in all_questions:
            sessions = ModelGradingSession.objects.filter(
                question=question,
                session_status='finalized'
            ).order_by('created_at')

            if sessions.count() == 2:
                s1_gradings = ModelGrading.objects.filter(session=sessions[0])
                s2_gradings = ModelGrading.objects.filter(session=sessions[1])

                if s1_gradings.exists() and s2_gradings.exists():
                    stats = calculate_agreement(s1_gradings, s2_gradings)
                    question_agreements.append(stats['overall_agreement'])

        if question_agreements:
            high_agreement = sum(1 for a in question_agreements if a >= 80)
            moderate_agreement = sum(1 for a in question_agreements if 60 <= a < 80)
            low_agreement = sum(1 for a in question_agreements if a < 60)
            total = len(question_agreements)

            writer.writerow(['High (≥80%)', high_agreement, round(high_agreement / total * 100, 1)])
            writer.writerow(['Moderate (60-79%)', moderate_agreement, round(moderate_agreement / total * 100, 1)])
            writer.writerow(['Low (<60%)', low_agreement, round(low_agreement / total * 100, 1)])

        return response


class CategoryAggregatesExportView(AdminRequiredMixin, View):
    """Export category-level aggregated statistics as clean CSV."""

    def get(self, request):
        """Generate CSV with aggregated category agreement stats."""
        response = HttpResponse(content_type='text/csv')
        response['Content-Disposition'] = 'attachment; filename="category_aggregates.csv"'

        writer = csv.writer(response)

        # Header
        writer.writerow(['Category', 'Total Agreements', 'Total Comparisons', 'Agreement %'])

        # Category labels
        category_labels = {
            'error_incorrect_logic': 'Incorrect Logic',
            'error_hallucinated': 'Hallucinated Facts',
            'error_calculation': 'Calculation Error',
            'error_conceptual': 'Conceptual Error',
            'achievement_understanding': 'Problem Understanding',
            'achievement_correct_result': 'Correct End Result',
            'achievement_insight': 'Mathematical Insight',
            'achievement_usefulness': 'Useful Progress',
        }

        # Get all questions with 2+ finalized sessions
        all_questions = Question.objects.annotate(
            finalized_session_count=Count(
                'modelgradingsession',
                filter=Q(modelgradingsession__session_status='finalized'),
                distinct=True
            )
        ).filter(finalized_session_count__gte=2)

        category_aggregates = defaultdict(lambda: {'total_agreements': 0, 'total_comparisons': 0})

        for question in all_questions:
            sessions = ModelGradingSession.objects.filter(
                question=question,
                session_status='finalized'
            ).order_by('created_at')

            if sessions.count() == 2:
                s1_gradings = ModelGrading.objects.filter(session=sessions[0])
                s2_gradings = ModelGrading.objects.filter(session=sessions[1])

                if s1_gradings.exists() and s2_gradings.exists():
                    stats = calculate_agreement(s1_gradings, s2_gradings)

                    for cat_key, cat_stats in stats['category_agreements'].items():
                        category_aggregates[cat_key]['total_agreements'] += cat_stats['agreements']
                        category_aggregates[cat_key]['total_comparisons'] += cat_stats['total']

        # Sort by agreement percentage (lowest first)
        category_stats_list = []
        for cat_key, agg in category_aggregates.items():
            if agg['total_comparisons'] > 0:
                agreement_pct = round(agg['total_agreements'] / agg['total_comparisons'] * 100, 1)
            else:
                agreement_pct = None
            category_stats_list.append((cat_key, agg, agreement_pct))

        category_stats_list.sort(key=lambda x: x[2] if x[2] is not None else 0)

        for cat_key, agg, agreement_pct in category_stats_list:
            writer.writerow([
                category_labels.get(cat_key, cat_key),
                agg['total_agreements'],
                agg['total_comparisons'],
                agreement_pct if agreement_pct is not None else 'N/A'
            ])

        return response


class ProgressGradeSummaryExportView(AdminRequiredMixin, View):
    """Export progress grade summary statistics as clean CSV."""

    def get(self, request):
        """Generate CSV with progress grade summary metrics."""
        response = HttpResponse(content_type='text/csv')
        response['Content-Disposition'] = 'attachment; filename="progress_grade_summary.csv"'

        writer = csv.writer(response)

        # Header
        writer.writerow(['Metric', 'Value'])

        # Get all questions with 2+ finalized sessions
        all_questions = Question.objects.annotate(
            finalized_session_count=Count(
                'modelgradingsession',
                filter=Q(modelgradingsession__session_status='finalized'),
                distinct=True
            )
        ).filter(finalized_session_count__gte=2)

        total_exact_matches = 0
        total_within1_matches = 0
        total_progress_comparisons = 0

        for question in all_questions:
            sessions = ModelGradingSession.objects.filter(
                question=question,
                session_status='finalized'
            ).order_by('created_at')

            if sessions.count() == 2:
                s1_gradings = ModelGrading.objects.filter(session=sessions[0])
                s2_gradings = ModelGrading.objects.filter(session=sessions[1])

                if s1_gradings.exists() and s2_gradings.exists():
                    stats = calculate_agreement(s1_gradings, s2_gradings)
                    prog_agreement = stats.get('progress_agreement', {})

                    if prog_agreement and prog_agreement.get('n_compared', 0) > 0:
                        n_compared = prog_agreement['n_compared']
                        total_progress_comparisons += n_compared

                        exact_count = round(prog_agreement['exact_agreement_pct'] / 100 * n_compared)
                        within1_count = round(prog_agreement['within_1_agreement_pct'] / 100 * n_compared)

                        total_exact_matches += exact_count
                        total_within1_matches += within1_count

        # Write summary statistics
        writer.writerow(['Total Comparisons', total_progress_comparisons])
        writer.writerow(['Exact Matches', total_exact_matches])
        writer.writerow(['Exact Match %', round(total_exact_matches / total_progress_comparisons * 100, 1) if total_progress_comparisons > 0 else 0])
        writer.writerow(['Within 1 Point', total_within1_matches])
        writer.writerow(['Within 1 Point %', round(total_within1_matches / total_progress_comparisons * 100, 1) if total_progress_comparisons > 0 else 0])

        return response


class ProgressGradeDifferenceDistributionExportView(AdminRequiredMixin, View):
    """Export progress grade difference distribution as clean CSV."""

    def get(self, request):
        """Generate CSV with difference distribution table."""
        response = HttpResponse(content_type='text/csv')
        response['Content-Disposition'] = 'attachment; filename="progress_grade_difference_distribution.csv"'

        writer = csv.writer(response)

        # Header
        writer.writerow(['Difference (points)', 'Count', 'Percentage'])

        # Get all questions with 2+ finalized sessions
        all_questions = Question.objects.annotate(
            finalized_session_count=Count(
                'modelgradingsession',
                filter=Q(modelgradingsession__session_status='finalized'),
                distinct=True
            )
        ).filter(finalized_session_count__gte=2)

        total_progress_comparisons = 0
        difference_distribution = {0: 0, 1: 0, 2: 0, 3: 0}

        for question in all_questions:
            sessions = ModelGradingSession.objects.filter(
                question=question,
                session_status='finalized'
            ).order_by('created_at')

            if sessions.count() == 2:
                s1_gradings = ModelGrading.objects.filter(session=sessions[0])
                s2_gradings = ModelGrading.objects.filter(session=sessions[1])

                if s1_gradings.exists() and s2_gradings.exists():
                    stats = calculate_agreement(s1_gradings, s2_gradings)
                    prog_agreement = stats.get('progress_agreement', {})

                    if prog_agreement and prog_agreement.get('n_compared', 0) > 0:
                        n_compared = prog_agreement['n_compared']
                        total_progress_comparisons += n_compared

                        # Calculate actual difference distribution
                        s1_map = {g.model_answer_id: g for g in s1_gradings}
                        s2_map = {g.model_answer_id: g for g in s2_gradings}
                        common_ids = set(s1_map.keys()) & set(s2_map.keys())

                        for answer_id in common_ids:
                            g1 = s1_map[answer_id]
                            g2 = s2_map[answer_id]

                            if g1.progress_grade is not None and g2.progress_grade is not None:
                                diff = abs(g1.progress_grade - g2.progress_grade)
                                difference_distribution[diff] += 1

        # Write difference distribution
        for diff in [0, 1, 2, 3]:
            count = difference_distribution[diff]
            pct = round(count / total_progress_comparisons * 100, 1) if total_progress_comparisons > 0 else 0
            writer.writerow([diff, count, pct])

        return response


class PerQuestionCategoryExportView(AdminRequiredMixin, View):
    """Export per-question category breakdown as clean CSV."""

    def get(self, request):
        """Generate CSV with category agreement per question."""
        response = HttpResponse(content_type='text/csv')
        response['Content-Disposition'] = 'attachment; filename="per_question_category_breakdown.csv"'

        writer = csv.writer(response)

        # Category labels
        category_labels = {
            'error_incorrect_logic': 'Incorrect Logic',
            'error_hallucinated': 'Hallucinated Facts',
            'error_calculation': 'Calculation Error',
            'error_conceptual': 'Conceptual Error',
            'achievement_understanding': 'Problem Understanding',
            'achievement_correct_result': 'Correct End Result',
            'achievement_insight': 'Mathematical Insight',
            'achievement_usefulness': 'Useful Progress',
        }

        # Header
        header = ['Question ID', 'Title'] + [category_labels[cat] for cat in category_labels.keys()] + ['Progress Mean Diff']
        writer.writerow(header)

        # Get all questions with 2+ finalized sessions
        all_questions = Question.objects.annotate(
            finalized_session_count=Count(
                'modelgradingsession',
                filter=Q(modelgradingsession__session_status='finalized'),
                distinct=True
            )
        ).filter(finalized_session_count__gte=2)

        for question in all_questions:
            sessions = ModelGradingSession.objects.filter(
                question=question,
                session_status='finalized'
            ).order_by('created_at')

            if sessions.count() == 2:
                s1_gradings = ModelGrading.objects.filter(session=sessions[0])
                s2_gradings = ModelGrading.objects.filter(session=sessions[1])

                if s1_gradings.exists() and s2_gradings.exists():
                    stats = calculate_agreement(s1_gradings, s2_gradings)

                    row = [question.id, sanitize_csv_value(question.title)]

                    # Add category agreement percentages
                    for cat_key in category_labels.keys():
                        cat_stats = stats['category_agreements'].get(cat_key, {})
                        agreement_pct = cat_stats.get('agreement_pct', 'N/A')
                        row.append(agreement_pct if agreement_pct != 'N/A' else 'N/A')

                    # Add progress grade mean diff
                    prog_agreement = stats.get('progress_agreement', {})
                    mean_diff = prog_agreement.get('mean_absolute_difference', 'N/A')
                    row.append(mean_diff)

                    writer.writerow(row)

        return response
