{% extends 'base.html' %}
{% load static %}

{% block title %}Model Scores - IMProofBench{% endblock %}

{% block extra_css %}
<!-- Chart.js CDN -->
<script src="https://cdn.jsdelivr.net/npm/chart.js@4.4.0/dist/chart.umd.min.js"></script>
<style>
    .sortable {
        cursor: pointer;
        user-select: none;
        position: relative;
    }
    
    .sortable:hover {
        background-color: rgba(0, 0, 0, 0.03);
    }
    
    .sort-icon {
        display: inline-block;
        margin-left: 5px;
        vertical-align: middle;
    }
    
    .sort-icon i {
        font-size: 0.8em;
        display: block;
        line-height: 0.5;
    }
    
    .sortable.sorted-asc .bi-chevron-up {
        color: var(--bs-primary) !important;
    }
    
    .sortable.sorted-desc .bi-chevron-down {
        color: var(--bs-primary) !important;
    }
    
    /* Export button styles */
    .chart-container {
        position: relative;
    }
    
    .export-buttons {
        position: absolute;
        top: -35px;
        right: 0px;
        z-index: 10;
    }
    
    .export-buttons .btn {
        margin-left: 5px;
    }
    
    /* Pairwise comparison table styles */
    .pairwise-table {
        font-size: 0.9rem;
    }
    
    .pairwise-table th {
        background-color: #f8f9fa;
        font-weight: 600;
        text-align: center;
        vertical-align: middle;
        padding: 8px;
    }
    
    .pairwise-table td {
        text-align: center;
        vertical-align: middle;
        padding: 6px;
        border: 1px solid #dee2e6;
    }
    
    .pairwise-table .model-header {
        background-color: #f8f9fa;
        font-weight: 600;
        text-align: left;
        white-space: nowrap;
    }
    
    .pairwise-table .diagonal {
        background-color: #e9ecef;
        color: #6c757d;
    }
    
    .pairwise-table td {
        transition: transform 0.2s ease;
    }
    
    .pairwise-table td:hover:not(.diagonal):not(.model-header) {
        transform: scale(1.1);
        box-shadow: 0 2px 5px rgba(0,0,0,0.2);
        position: relative;
        z-index: 10;
    }
    
    .tier-badge {
        font-size: 0.75rem;
        padding: 2px 6px;
        margin-left: 4px;
    }
    
    .tab-content {
        padding-top: 20px;
    }
</style>
{% endblock %}

{% block content %}
<div class="container mt-4">
    <h1>Model Evaluation Statistics</h1>
    <p class="text-muted">Comprehensive evaluation results and performance metrics for benchmark models</p>
    
    <!-- Navigation Tabs -->
    <ul class="nav nav-tabs" id="statisticsTab" role="tablist">
        <li class="nav-item" role="presentation">
            <button class="nav-link active" id="overview-tab" data-bs-toggle="tab" data-bs-target="#overview" type="button" role="tab" aria-controls="overview" aria-selected="true">
                Overview
            </button>
        </li>
        <li class="nav-item" role="presentation">
            <button class="nav-link" id="pairwise-tab" data-bs-toggle="tab" data-bs-target="#pairwise" type="button" role="tab" aria-controls="pairwise" aria-selected="false">
                Pairwise Comparisons
            </button>
        </li>
        <li class="nav-item" role="presentation">
            <button class="nav-link" id="grading-tab" data-bs-toggle="tab" data-bs-target="#grading" type="button" role="tab" aria-controls="grading" aria-selected="false">
                Author Grading
            </button>
        </li>
        <li class="nav-item" role="presentation">
            <button class="nav-link" id="progress-tab" data-bs-toggle="tab" data-bs-target="#progress" type="button" role="tab" aria-controls="progress" aria-selected="false">
                Progress Grades
            </button>
        </li>
        <li class="nav-item" role="presentation">
            <button class="nav-link" id="wordcloud-tab" data-bs-toggle="tab" data-bs-target="#wordcloud" type="button" role="tab" aria-controls="wordcloud" aria-selected="false">
                Question Tags
            </button>
        </li>
        <li class="nav-item" role="presentation">
            <button class="nav-link" id="correlations-tab" data-bs-toggle="tab" data-bs-target="#correlations" type="button" role="tab" aria-controls="correlations" aria-selected="false">
                Correlations
            </button>
        </li>
        <li class="nav-item" role="presentation">
            <button class="nav-link" id="variance-tab" data-bs-toggle="tab" data-bs-target="#variance" type="button" role="tab" aria-controls="variance" aria-selected="false">
                Standard Deviations
            </button>
        </li>
    </ul>
    
    <!-- Tab Content -->
    <div class="tab-content" id="statisticsTabContent">
        
        <!-- Overview Tab -->
        <div class="tab-pane fade show active" id="overview" role="tabpanel" aria-labelledby="overview-tab">
            <!-- Questions Section -->
            <div class="card mb-4">
                <div class="card-header">
                    <h3 class="mb-0">Active Questions</h3>
                </div>
                <div class="card-body">
                    <p class="text-muted">Select which questions to include in benchmark scoring calculations:</p>
                    
                    <div class="table-responsive">
                        <table class="table table-hover">
                            <thead>
                                <tr>
                                    <th width="60">Include</th>
                                    <th>Question</th>
                                    <th width="150">Evaluations</th>
                                    <th width="120">Grading Released</th>
                                    <th width="120">Gradings</th>
                                </tr>
                            </thead>
                            <tbody>
                                {% for q_data in questions %}
                                <tr data-question-id="{{ q_data.question.id }}">
                                    <td class="text-center">
                                        <input type="checkbox" 
                                               class="form-check-input benchmark-inclusion-checkbox"
                                               data-question-id="{{ q_data.question.id }}"
                                               {% if q_data.question.benchmark_inclusion %}checked{% endif %}>
                                    </td>
                                    <td>
                                        <strong>Q{{ q_data.question.id }}:</strong> {{ q_data.question.title }}
                                        {% if not q_data.has_subquestions %}
                                        <span class="badge bg-secondary ms-2">No subquestions</span>
                                        {% endif %}
                                    </td>
                                    <td>
                                        {{ q_data.completed_evaluations }}/{{ q_data.total_expected }}
                                        {% if q_data.completed_evaluations == q_data.total_expected %}
                                        <span class="text-success">✓</span>
                                        {% endif %}
                                    </td>
                                    <td class="text-center">
                                        {% if q_data.has_released_answers %}
                                        <span class="badge bg-success">Yes</span>
                                        {% else %}
                                        <span class="badge bg-secondary">No</span>
                                        {% endif %}
                                    </td>
                                    <td class="text-center">
                                        {{ q_data.grading_sessions }}
                                    </td>
                                </tr>
                                {% empty %}
                                <tr>
                                    <td colspan="5" class="text-center text-muted">No active questions found</td>
                                </tr>
                                {% endfor %}
                            </tbody>
                        </table>
                    </div>
                </div>
            </div>
            
            <!-- Model Scores Section -->
            <div class="card">
                <div class="card-header">
                    <h3 class="mb-0">Subquestion Scores by Model</h3>
                </div>
                <div class="card-body">
                    <p class="text-muted">
                        Average percentage of points earned on subquestions across included questions.
                        Only questions with subquestions and benchmark inclusion enabled are counted.
                    </p>

                    <div class="table-responsive">
                        <table class="table table-hover" id="model-scores-table">
                            <thead>
                                <tr>
                                    <th class="sortable" data-sort="model">
                                        Model
                                        <span class="sort-icon">
                                            <i class="bi bi-chevron-up text-muted"></i>
                                            <i class="bi bi-chevron-down text-muted"></i>
                                        </span>
                                    </th>
                                    <th>Tier</th>
                                    <th>Questions Evaluated</th>
                                    <th class="sortable sorted-desc" data-sort="score">
                                        Average Score
                                        <span class="sort-icon">
                                            <i class="bi bi-chevron-up text-muted"></i>
                                            <i class="bi bi-chevron-down text-primary"></i>
                                        </span>
                                    </th>
                                </tr>
                            </thead>
                            <tbody id="model-scores-tbody">
                                {% for model_data in models %}
                                <tr data-model="{{ model_data.model.display_name }}"
                                    data-score="{{ model_data.score_percentage|default:'-1' }}">
                                    <td class="model-name">
                                        <strong>{{ model_data.model.display_name }}</strong>
                                    </td>
                                    <td>
                                        <span class="badge bg-info">Tier {{ model_data.tier }}</span>
                                    </td>
                                    <td>
                                        {{ model_data.questions_attempted }}/{{ model_data.questions_total }}
                                        {% if model_data.questions_attempted == model_data.questions_total and model_data.questions_total > 0 %}
                                        <span class="text-success">✓</span>
                                        {% endif %}
                                    </td>
                                    <td class="score-cell">
                                        {% if model_data.score_percentage is not None %}
                                            <strong>{{ model_data.score_percentage|floatformat:1 }}%</strong>
                                            <div class="progress mt-1" style="height: 10px;">
                                                <div class="progress-bar" role="progressbar"
                                                     style="width: {{ model_data.score_percentage }}%"
                                                     aria-valuenow="{{ model_data.score_percentage|floatformat:0 }}"
                                                     aria-valuemin="0"
                                                     aria-valuemax="100">
                                                </div>
                                            </div>
                                        {% else %}
                                            <span class="text-muted">N/A</span>
                                        {% endif %}
                                    </td>
                                </tr>
                                {% empty %}
                                <tr class="no-data-row">
                                    <td colspan="4" class="text-center text-muted">No model data available</td>
                                </tr>
                                {% endfor %}
                            </tbody>
                        </table>
                    </div>
                    
                    <div class="alert alert-info mt-3">
                        <strong>Scoring Methodology:</strong> 
                        <ul class="mb-0">
                            <li>Each question's score is calculated as a percentage (0-100%) based on subquestion points earned.</li>
                            <li>The overall score is the average of all per-question percentages (not weighted by points).</li>
                            <li>Tier 1 models have 2 attempts per question; their per-question score is averaged across attempts.</li>
                            <li>Only the latest evaluation is considered when questions have been re-run.</li>
                            <li>Scores only include questions that have subquestions and are marked for benchmark inclusion.</li>
                        </ul>
                    </div>
                </div>
            </div>

            <!-- Subquestion Results Summary -->
            <div class="card">
                <div class="card-header d-flex justify-content-between align-items-center">
                    <h3 class="mb-0">Subquestion Results by Model</h3>
                    <div class="export-buttons">
                        <button class="btn btn-sm btn-outline-primary" onclick="exportChart('subquestionResultsChart', 'subquestion_results', 'png')">📥 PNG</button>
                        <button class="btn btn-sm btn-outline-success" onclick="exportChart('subquestionResultsChart', 'subquestion_results', 'jpg')">📥 JPG</button>
                    </div>
                </div>
                <div class="card-body">
                    <p class="text-muted">Average percentage of points earned on subquestions across included questions, ordered by performance.</p>
                    <div class="chart-container" style="position: relative; height: 600px; width: 100%;">
                        <canvas id="subquestionResultsChart"></canvas>
                    </div>
                </div>
            </div>
        </div>
        
        <!-- Pairwise Comparisons Tab -->
        <div class="tab-pane fade" id="pairwise" role="tabpanel" aria-labelledby="pairwise-tab">
            <div class="card">
                <div class="card-header">
                    <h3 class="mb-0">Pairwise Model Comparisons</h3>
                </div>
                <div class="card-body">
                    <p class="text-muted">
                        Pairwise wins by problem: Each cell (i, j) shows the number of problems where model i (row) outperforms model j (column),
                        using weighted subquestion points. For a problem P with subquestions of point values p<sub>k</sub>, a model’s score is
                        A(M, P) = (sum of p<sub>k</sub> for correctly answered subquestions) / (sum of all p<sub>k</sub> in P), based on the latest first attempt.
                        A win is counted when A(i, P) > A(j, P). 
                        <strong>Color coding (method b):</strong> background is based on wins(i,j) − wins(j,i) with a red–white–green spectrum centered at 0
                        (white = no advantage, green = i has advantage, red = j has advantage). The table is color‑antisymmetric.
                    </p>
                    
                    {% if pairwise_data and pairwise_data.models %}
                    <div class="alert alert-info">
                        <strong>Total Questions:</strong> {{ pairwise_data.total_questions }} questions<br>
                        <strong>Total Subquestions:</strong> {{ pairwise_data.total_subquestions }} subquestions
                    </div>
                    
                    <div class="d-flex justify-content-end mb-3">
                        <button class="btn btn-sm btn-outline-danger" onclick="exportPairwiseTable()">📥 Export as PDF</button>
                    </div>
                    
                    <div class="table-responsive" id="pairwise-table-container">
                        <!-- Table will be rendered by JavaScript -->
                    </div>
                    
                    <div class="alert alert-warning mt-3">
                        <strong>How to read this table:</strong>
                        <ul class="mb-0">
                            <li>Each row represents the "wins" of that model against others</li>
                            <li>Each cell (i,j) counts problems where A(i,P) > A(j,P) using weighted subquestion points</li>
                            <li>Higher numbers indicate better relative performance across problems</li>
                            <li>Color shading uses wins(i,j) − wins(j,i) centered at 0 (red–white–green)</li>
                            <li>Only the first attempt is considered for all models (including Tier 1); missing answers count as incorrect</li>
                        </ul>
                    </div>
                    {% else %}
                    <div class="alert alert-warning">
                        No pairwise comparison data available. Please ensure there are questions with subquestions 
                        marked for benchmark inclusion and that models have been evaluated.
                    </div>
                    {% endif %}
                </div>
            </div>
        </div>
        
        <!-- Author Grading Tab -->
        <div class="tab-pane fade" id="grading" role="tabpanel" aria-labelledby="grading-tab">
            <div class="card">
                <div class="card-header">
                    <h3 class="mb-0">Author Grading Analysis</h3>
                </div>
                <div class="card-body">
                    <p class="text-muted">
                        Distribution of author grading responses for each evaluation category.
                        Based on finalized grading sessions for questions with benchmark inclusion enabled.
                    </p>
                    
                    {% if grading_stats %}
                    <!-- Error Categories -->
                    <h4 class="mt-4 mb-3">Error Indicators</h4>
                    
                    {% if grading_stats.error_incorrect_logic %}
                    <div class="mb-5">
                        <h5>{{ grading_stats.error_incorrect_logic.display_name }}</h5>
                        <div class="chart-container" style="position: relative; height:400px; width:100%;">
                            <div class="export-buttons">
                                <button class="btn btn-sm btn-outline-primary" onclick="exportChart('incorrectLogicChart', 'incorrect_logic', 'png')">📥 PNG</button>
                                <button class="btn btn-sm btn-outline-success" onclick="exportChart('incorrectLogicChart', 'incorrect_logic', 'jpg')">📥 JPG</button>
                            </div>
                            <canvas id="incorrectLogicChart"></canvas>
                        </div>
                        <div class="mt-2 text-muted small">
                            <strong>Note:</strong> Bar segments show percentage of answers graded as 
                            <span style="color: #dc3545;">Yes (Red = Has Error)</span>, 
                            <span style="color: #6c757d;">Not Sure (Gray)</span>, and 
                            <span style="color: #28a745;">No (Green = No Error)</span>.
                            Models are ordered by their subquestion performance score.
                        </div>
                    </div>
                    {% endif %}
                    
                    {% if grading_stats.error_hallucinated %}
                    <div class="mb-5">
                        <h5>{{ grading_stats.error_hallucinated.display_name }}</h5>
                        <div class="chart-container" style="position: relative; height:400px; width:100%;">
                            <div class="export-buttons">
                                <button class="btn btn-sm btn-outline-primary" onclick="exportChart('hallucinatedChart', 'hallucinated', 'png')">📥 PNG</button>
                                <button class="btn btn-sm btn-outline-success" onclick="exportChart('hallucinatedChart', 'hallucinated', 'jpg')">📥 JPG</button>
                            </div>
                            <canvas id="hallucinatedChart"></canvas>
                        </div>
                    </div>
                    {% endif %}
                    
                    {% if grading_stats.error_calculation %}
                    <div class="mb-5">
                        <h5>{{ grading_stats.error_calculation.display_name }}</h5>
                        <div class="chart-container" style="position: relative; height:400px; width:100%;">
                            <div class="export-buttons">
                                <button class="btn btn-sm btn-outline-primary" onclick="exportChart('calculationErrorChart', 'calculation_error', 'png')">📥 PNG</button>
                                <button class="btn btn-sm btn-outline-success" onclick="exportChart('calculationErrorChart', 'calculation_error', 'jpg')">📥 JPG</button>
                            </div>
                            <canvas id="calculationErrorChart"></canvas>
                        </div>
                    </div>
                    {% endif %}
                    
                    {% if grading_stats.error_conceptual %}
                    <div class="mb-5">
                        <h5>{{ grading_stats.error_conceptual.display_name }}</h5>
                        <div class="chart-container" style="position: relative; height:400px; width:100%;">
                            <div class="export-buttons">
                                <button class="btn btn-sm btn-outline-primary" onclick="exportChart('conceptualErrorChart', 'conceptual_error', 'png')">📥 PNG</button>
                                <button class="btn btn-sm btn-outline-success" onclick="exportChart('conceptualErrorChart', 'conceptual_error', 'jpg')">📥 JPG</button>
                            </div>
                            <canvas id="conceptualErrorChart"></canvas>
                        </div>
                    </div>
                    {% endif %}
                    
                    <!-- Achievement Categories -->
                    <h4 class="mt-5 mb-3">Achievement Indicators</h4>
                    
                    {% if grading_stats.achievement_understanding %}
                    <div class="mb-5">
                        <h5>{{ grading_stats.achievement_understanding.display_name }}</h5>
                        <div class="chart-container" style="position: relative; height:400px; width:100%;">
                            <div class="export-buttons">
                                <button class="btn btn-sm btn-outline-primary" onclick="exportChart('understandingChart', 'understanding', 'png')">📥 PNG</button>
                                <button class="btn btn-sm btn-outline-success" onclick="exportChart('understandingChart', 'understanding', 'jpg')">📥 JPG</button>
                            </div>
                            <canvas id="understandingChart"></canvas>
                        </div>
                        <div class="mt-2 text-muted small">
                            <strong>Note:</strong> For achievement indicators: 
                            <span style="color: #28a745;">Yes (Green = Achievement Present)</span>, 
                            <span style="color: #6c757d;">Not Sure (Gray)</span>, and 
                            <span style="color: #dc3545;">No (Red = Achievement Absent)</span>.
                        </div>
                    </div>
                    {% endif %}
                    
                    {% if grading_stats.achievement_correct_result %}
                    <div class="mb-5">
                        <h5>{{ grading_stats.achievement_correct_result.display_name }}</h5>
                        <div class="chart-container" style="position: relative; height:400px; width:100%;">
                            <div class="export-buttons">
                                <button class="btn btn-sm btn-outline-primary" onclick="exportChart('correctResultChart', 'correct_result', 'png')">📥 PNG</button>
                                <button class="btn btn-sm btn-outline-success" onclick="exportChart('correctResultChart', 'correct_result', 'jpg')">📥 JPG</button>
                            </div>
                            <canvas id="correctResultChart"></canvas>
                        </div>
                    </div>
                    {% endif %}
                    
                    {% if grading_stats.achievement_insight %}
                    <div class="mb-5">
                        <h5>{{ grading_stats.achievement_insight.display_name }}</h5>
                        <div class="chart-container" style="position: relative; height:400px; width:100%;">
                            <div class="export-buttons">
                                <button class="btn btn-sm btn-outline-primary" onclick="exportChart('insightChart', 'insight', 'png')">📥 PNG</button>
                                <button class="btn btn-sm btn-outline-success" onclick="exportChart('insightChart', 'insight', 'jpg')">📥 JPG</button>
                            </div>
                            <canvas id="insightChart"></canvas>
                        </div>
                    </div>
                    {% endif %}
                    
                    {% if grading_stats.achievement_usefulness %}
                    <div class="mb-5">
                        <h5>{{ grading_stats.achievement_usefulness.display_name }}</h5>
                        <div class="chart-container" style="position: relative; height:400px; width:100%;">
                            <div class="export-buttons">
                                <button class="btn btn-sm btn-outline-primary" onclick="exportChart('usefulnessChart', 'usefulness', 'png')">📥 PNG</button>
                                <button class="btn btn-sm btn-outline-success" onclick="exportChart('usefulnessChart', 'usefulness', 'jpg')">📥 JPG</button>
                            </div>
                            <canvas id="usefulnessChart"></canvas>
                        </div>
                    </div>
                    {% endif %}
                    
                    {% else %}
                    <div class="alert alert-warning">
                        No grading data available. Please ensure grading has been completed for benchmark questions.
                    </div>
                    {% endif %}
                </div>
            </div>
        </div>
        
        <!-- Progress Grades Tab -->
        <div class="tab-pane fade" id="progress" role="tabpanel" aria-labelledby="progress-tab">
            <div class="card">
                <div class="card-header">
                    <h3 class="mb-0">Overall Progress Grades</h3>
                </div>
                <div class="card-body">
                    <p class="text-muted">
                        Distribution of overall progress grades (0-3) assigned by authors.
                    </p>
                    
                    {% if progress_stats and progress_stats.models %}
                    <div class="chart-container" style="position: relative; height:400px; width:100%;">
                        <div class="export-buttons">
                            <button class="btn btn-sm btn-outline-primary" onclick="exportChart('progressGradeChart', 'progress_grades', 'png')">📥 PNG</button>
                            <button class="btn btn-sm btn-outline-success" onclick="exportChart('progressGradeChart', 'progress_grades', 'jpg')">📥 JPG</button>
                        </div>
                        <canvas id="progressGradeChart"></canvas>
                    </div>
                    <div class="mt-2 text-muted small">
                        <strong>Progress Grade Scale:</strong>
                        <span style="color: #dc3545;">0 = No Progress</span>,
                        <span style="color: #ffc107;">1 = Minor Progress</span>,
                        <span style="color: #17a2b8;">2 = Major Progress</span>,
                        <span style="color: #28a745;">3 = Complete Solution</span>
                    </div>
                    {% else %}
                    <div class="alert alert-warning">
                        No progress grade data available. Please ensure grading has been completed for benchmark questions.
                    </div>
                    {% endif %}
                </div>
            </div>
        </div>
        
        <!-- Word Cloud Tab -->
        <div class="tab-pane fade" id="wordcloud" role="tabpanel" aria-labelledby="wordcloud-tab">
            <div class="card">
                <div class="card-header">
                    <h3 class="mb-0">Question Tags Word Cloud</h3>
                </div>
                <div class="card-body">
                    <p class="text-muted">
                        Visualization of tags associated with active questions. Larger text indicates more frequent tags.
                    </p>
                    
                    {% if word_cloud_data %}
                    <div class="position-relative">
                        <div class="export-buttons" style="position: absolute; top: -35px; right: 0; z-index: 10;">
                            <button class="btn btn-sm btn-outline-primary" onclick="exportWordCloud('png')">📥 PNG</button>
                            <button class="btn btn-sm btn-outline-success" onclick="exportWordCloud('jpg')">📥 JPG</button>
                            <button class="btn btn-sm btn-outline-danger" onclick="exportWordCloudAsPDF()">📥 PDF</button>
                        </div>
                        <div id="wordCloudContainer" style="position: relative; min-height: 600px; width: 100%; padding: 20px 0;">
                        </div>
                    </div>
                    
                    <div class="alert alert-info mt-3">
                        <strong>Tag Statistics:</strong>
                        <ul class="mb-0">
                            <li>Total unique tags: {{ word_cloud_data|length }}</li>
                            <li>Most common tags: 
                                {% for tag in word_cloud_data|slice:":5" %}
                                    {{ tag.text }} ({{ tag.count }}){% if not forloop.last %}, {% endif %}
                                {% endfor %}
                            </li>
                        </ul>
                    </div>
                    {% else %}
                    <div class="alert alert-warning">
                        No tags available for active questions. Please ensure questions have tags assigned.
                    </div>
                    {% endif %}
                </div>
            </div>
        </div>
        
        <!-- Correlations Tab -->
        <div class="tab-pane fade" id="correlations" role="tabpanel" aria-labelledby="correlations-tab">
            <div class="card">
                <div class="card-header">
                    <h3 class="mb-0">Metric Correlations</h3>
                </div>
                <div class="card-body">
                    <p class="text-muted">
                        Statistical correlations between different evaluation metrics.
                    </p>
                    
                    {% if correlation_data and correlation_data.progress_vs_subquestion %}
                    <div class="card mb-4">
                        <div class="card-header">
                            <h4 class="mb-0">Total Progress Grade vs. Subquestion Percentage</h4>
                        </div>
                        <div class="card-body">
                            <p class="text-muted">
                                Correlation between the average Total Progress grade (0-3 scale) assigned by graders
                                and the percentage of subquestion points earned by the model.
                            </p>
                            
                            {% with corr_data=correlation_data.progress_vs_subquestion %}
                            <div class="row">
                                <div class="col-md-6">
                                    <div class="alert {% if corr_data.correlation %}alert-info{% else %}alert-warning{% endif %}">
                                        <h5>Correlation Coefficient</h5>
                                        {% if corr_data.correlation %}
                                            <h2 class="mb-2">{{ corr_data.correlation }}</h2>
                                            {% if corr_data.p_value %}
                                            <p class="mb-0">p-value: {{ corr_data.p_value }}</p>
                                            {% endif %}
                                        {% else %}
                                            <p class="mb-0">Not enough data to calculate correlation</p>
                                        {% endif %}
                                    </div>
                                </div>
                                <div class="col-md-6">
                                    <div class="alert alert-secondary">
                                        <h5>Sample Information</h5>
                                        <ul class="mb-0">
                                            <li>Number of graded model answers: <strong>{{ corr_data.n_samples }}</strong></li>
                                            <li>Questions included: Only those with at least one grading</li>
                                            <li>Data points: Each represents one graded model answer</li>
                                        </ul>
                                    </div>
                                </div>
                            </div>
                            
                            {% if corr_data.correlation %}
                            <div class="mt-4">
                                <h5>Interpretation</h5>
                                <p>
                                    {% if corr_data.correlation >= 0.7 %}
                                        <span class="badge bg-success">Strong Positive Correlation</span>
                                        The Total Progress grade strongly correlates with subquestion performance,
                                        suggesting that models performing better on subquestions tend to receive higher progress grades.
                                    {% elif corr_data.correlation >= 0.4 %}
                                        <span class="badge bg-info">Moderate Positive Correlation</span>
                                        The Total Progress grade moderately correlates with subquestion performance,
                                        indicating a noticeable relationship between these metrics.
                                    {% elif corr_data.correlation >= 0.2 %}
                                        <span class="badge bg-warning">Weak Positive Correlation</span>
                                        The Total Progress grade shows a weak positive correlation with subquestion performance.
                                    {% elif corr_data.correlation >= -0.2 %}
                                        <span class="badge bg-secondary">No Clear Correlation</span>
                                        There is little to no linear relationship between Total Progress grade and subquestion performance.
                                    {% elif corr_data.correlation >= -0.4 %}
                                        <span class="badge bg-warning">Weak Negative Correlation</span>
                                        The Total Progress grade shows a weak negative correlation with subquestion performance.
                                    {% elif corr_data.correlation >= -0.7 %}
                                        <span class="badge bg-info">Moderate Negative Correlation</span>
                                        The Total Progress grade moderately negatively correlates with subquestion performance.
                                    {% else %}
                                        <span class="badge bg-danger">Strong Negative Correlation</span>
                                        The Total Progress grade strongly negatively correlates with subquestion performance,
                                        suggesting an inverse relationship between these metrics.
                                    {% endif %}
                                </p>
                                
                                {% if corr_data.p_value %}
                                <p>
                                    Statistical significance: 
                                    {% if corr_data.p_value < 0.001 %}
                                        <strong>Highly significant (p < 0.001)</strong>
                                    {% elif corr_data.p_value < 0.01 %}
                                        <strong>Very significant (p < 0.01)</strong>
                                    {% elif corr_data.p_value < 0.05 %}
                                        <strong>Significant (p < 0.05)</strong>
                                    {% else %}
                                        <strong>Not statistically significant (p ≥ 0.05)</strong>
                                    {% endif %}
                                </p>
                                {% endif %}
                            </div>
                            {% endif %}
                            
                            <div class="alert alert-light mt-3">
                                <strong>Methodology:</strong>
                                <ul class="mb-0">
                                    <li>For each graded model answer, we calculate:
                                        <ul>
                                            <li>The average Total Progress grade across all graders who evaluated it</li>
                                            <li>The percentage of subquestion points earned in that specific model attempt</li>
                                        </ul>
                                    </li>
                                    <li>Only questions with both grading data and subquestions are included</li>
                                    <li>Pearson correlation coefficient is used to measure linear relationship</li>
                                </ul>
                            </div>
                            {% endwith %}
                        </div>
                    </div>

                    <!-- NEW: Binary Correlation: All Subquestions Correct vs. Progress Grade = 3 -->
                    {% if correlation_data.all_correct_vs_progress_3 %}
                    <div class="card mb-4">
                        <div class="card-header">
                            <h4 class="mb-0">All Subquestions Correct vs. Progress Grade = 3</h4>
                        </div>
                        <div class="card-body">
                            <p class="text-muted">
                                Correlation between getting ALL subquestions correct (binary: 0 or 1)
                                and receiving a progress grade of 3 (Complete Solution) from all graders (binary: 0 or 1).
                            </p>

                            {% with corr_data=correlation_data.all_correct_vs_progress_3 %}
                            <div class="row">
                                <div class="col-md-6">
                                    <div class="alert {% if corr_data.correlation %}alert-info{% else %}alert-warning{% endif %}">
                                        <h5>Correlation Coefficient</h5>
                                        {% if corr_data.correlation %}
                                            <h2 class="mb-2">{{ corr_data.correlation }}</h2>
                                            {% if corr_data.p_value %}
                                            <p class="mb-0">p-value: {{ corr_data.p_value }}</p>
                                            {% endif %}
                                        {% else %}
                                            <p class="mb-0">Not enough data to calculate correlation</p>
                                        {% endif %}
                                    </div>
                                </div>
                                <div class="col-md-6">
                                    <div class="alert alert-secondary">
                                        <h5>Sample Information</h5>
                                        <ul class="mb-0">
                                            <li>Number of graded model answers: <strong>{{ corr_data.n_samples }}</strong></li>
                                            <li>Questions included: Only those with subquestions and at least one grading</li>
                                            <li>Data points: Each represents one graded model answer</li>
                                        </ul>
                                    </div>
                                </div>
                            </div>

                            {% if corr_data.correlation %}
                            <div class="mt-4">
                                <h5>Interpretation</h5>
                                <p>
                                    {% if corr_data.correlation >= 0.7 %}
                                        <span class="badge bg-success">Strong Positive Correlation</span>
                                        Getting all subquestions correct strongly correlates with receiving a Complete Solution grade (3),
                                        suggesting that automatic subquestion evaluation is highly aligned with human grading.
                                    {% elif corr_data.correlation >= 0.4 %}
                                        <span class="badge bg-info">Moderate Positive Correlation</span>
                                        Getting all subquestions correct moderately correlates with receiving a Complete Solution grade (3),
                                        indicating a noticeable relationship between these metrics.
                                    {% elif corr_data.correlation >= 0.2 %}
                                        <span class="badge bg-warning">Weak Positive Correlation</span>
                                        Getting all subquestions correct shows a weak positive correlation with receiving a Complete Solution grade (3).
                                    {% elif corr_data.correlation >= -0.2 %}
                                        <span class="badge bg-secondary">No Clear Correlation</span>
                                        There is little to no linear relationship between getting all subquestions correct and receiving a Complete Solution grade.
                                    {% elif corr_data.correlation >= -0.4 %}
                                        <span class="badge bg-warning">Weak Negative Correlation</span>
                                        Getting all subquestions correct shows a weak negative correlation with receiving a Complete Solution grade (3).
                                    {% elif corr_data.correlation >= -0.7 %}
                                        <span class="badge bg-info">Moderate Negative Correlation</span>
                                        Getting all subquestions correct moderately negatively correlates with receiving a Complete Solution grade (3).
                                    {% else %}
                                        <span class="badge bg-danger">Strong Negative Correlation</span>
                                        Getting all subquestions correct strongly negatively correlates with receiving a Complete Solution grade (3).
                                    {% endif %}
                                </p>

                                {% if corr_data.p_value %}
                                <p>
                                    Statistical significance:
                                    {% if corr_data.p_value < 0.001 %}
                                        <strong>Highly significant (p < 0.001)</strong>
                                    {% elif corr_data.p_value < 0.01 %}
                                        <strong>Very significant (p < 0.01)</strong>
                                    {% elif corr_data.p_value < 0.05 %}
                                        <strong>Significant (p < 0.05)</strong>
                                    {% else %}
                                        <strong>Not statistically significant (p ≥ 0.05)</strong>
                                    {% endif %}
                                </p>
                                {% endif %}
                            </div>
                            {% endif %}

                            <div class="alert alert-light mt-3">
                                <strong>Methodology:</strong>
                                <ul class="mb-0">
                                    <li>For each graded model answer with subquestions:
                                        <ul>
                                            <li><strong>All subquestions correct:</strong> 1 if all subquestions were answered correctly, 0 otherwise</li>
                                            <li><strong>Progress grade = 3:</strong> 1 if ALL graders gave a grade of 3 (Complete Solution), 0 otherwise</li>
                                        </ul>
                                    </li>
                                    <li>Only questions with both grading data and subquestions are included</li>
                                    <li>For Tier 1 models with 2 attempts, only the graded attempt is considered</li>
                                    <li>Pearson correlation coefficient is used to measure linear relationship between the binary variables</li>
                                </ul>
                            </div>
                            {% endwith %}
                        </div>
                    </div>
                    {% endif %}

                    {% else %}
                    <div class="alert alert-warning">
                        No correlation data available. Please ensure:
                        <ul class="mb-0">
                            <li>Questions have been graded by authors</li>
                            <li>Questions have subquestions with point values</li>
                            <li>At least 2 model answers have both grading and subquestion data</li>
                        </ul>
                    </div>
                    {% endif %}
                </div>
            </div>
        </div>

        <!-- Standard Deviations Tab -->
        <div class="tab-pane fade" id="variance" role="tabpanel" aria-labelledby="variance-tab">
            <div class="card">
                <div class="card-header">
                    <h3 class="mb-0">Standard Deviations of Subquestion Scores</h3>
                </div>
                <div class="card-body">
                    <p class="text-muted">
                        For models with multiple evaluations, we estimate the standard deviation of their average subquestion scores.
                        This helps quantify the uncertainty in model performance measurements.
                    </p>

                    {% if variance_data %}
                    <!-- Methodology Explanation -->
                    <div class="alert alert-info mb-4">
                        <h5>Methodology</h5>
                        <p>For each model M and question Q with subquestions:</p>
                        <ol class="mb-2">
                            <li>Calculate the weighted subquestion score for each evaluation: <code>score = (points_earned / points_possible) × 100</code></li>
                            <li>Calculate the sample variance V(M,Q) across all evaluations for that question</li>
                            <li>Estimate the overall standard deviation using: <strong>σ(M) = (1/N) × √(V(M,Q₁) + ... + V(M,Qₙ))</strong></li>
                        </ol>
                        <p class="mb-0">
                            <strong>Note:</strong> Only models with at least 2 evaluations for at least one question are included.
                            Currently, this primarily includes Tier 1 models which have 2 attempts per question.
                        </p>
                    </div>

                    <!-- Summary Table -->
                    <h4 class="mt-4 mb-3">Model Statistics</h4>
                    <div class="table-responsive mb-4">
                        <table class="table table-hover">
                            <thead>
                                <tr>
                                    <th>Model</th>
                                    <th>Tier</th>
                                    <th>Average Score (%)</th>
                                    <th>Standard Deviation (σ)</th>
                                    <th>Questions</th>
                                    <th>Total Evaluations</th>
                                </tr>
                            </thead>
                            <tbody>
                                {% for data in variance_data %}
                                <tr>
                                    <td><strong>{{ data.model.display_name }}</strong></td>
                                    <td><span class="badge bg-info">Tier {{ data.tier }}</span></td>
                                    <td>{{ data.average_score|floatformat:1 }}%</td>
                                    <td>{{ data.sigma|floatformat:2 }}</td>
                                    <td>{{ data.num_questions }}</td>
                                    <td>{{ data.num_total_evaluations }}</td>
                                </tr>
                                {% endfor %}
                            </tbody>
                        </table>
                    </div>

                    <!-- Chart with Error Bars -->
                    <h4 class="mt-5 mb-3">Subquestion Scores with Error Bars (±1σ)</h4>
                    <div class="chart-container" style="position: relative; height:600px; width:100%;">
                        <div class="export-buttons">
                            <button class="btn btn-sm btn-outline-primary" onclick="exportChart('varianceChart', 'variance_chart', 'png')">📥 PNG</button>
                            <button class="btn btn-sm btn-outline-success" onclick="exportChart('varianceChart', 'variance_chart', 'jpg')">📥 JPG</button>
                        </div>
                        <canvas id="varianceChart"></canvas>
                    </div>

                    <div class="mt-2 text-muted small">
                        <strong>Interpretation:</strong> The error bars show ±1 standard deviation (σ) around the average score.
                        Larger error bars indicate more variability in model performance across different evaluations.
                    </div>

                    {% else %}
                    <div class="alert alert-warning">
                        No variance data available. Please ensure:
                        <ul class="mb-0">
                            <li>Questions are marked for benchmark inclusion</li>
                            <li>Questions have subquestions with point values</li>
                            <li>At least one model has 2 or more evaluations for at least one question</li>
                        </ul>
                    </div>
                    {% endif %}
                </div>
            </div>
        </div>
    </div>
</div>

<!-- Include D3.js and D3-cloud for word cloud -->
<script src="https://d3js.org/d3.v7.min.js"></script>
<script src="https://cdn.jsdelivr.net/gh/jasondavies/d3-cloud/build/d3.layout.cloud.js"></script>

<script>
// Initialize pairwise comparison table
document.addEventListener('DOMContentLoaded', function() {
    // Restore the last active tab from localStorage
    const lastActiveTab = localStorage.getItem('modelScoresActiveTab');
    if (lastActiveTab) {
        // Find the tab button and activate it
        const tabButton = document.querySelector(`button[data-bs-target="${lastActiveTab}"]`);
        if (tabButton) {
            // Remove active class from current tab
            document.querySelector('.nav-link.active').classList.remove('active');
            document.querySelector('.tab-pane.active').classList.remove('active', 'show');
            
            // Add active class to stored tab
            tabButton.classList.add('active');
            const tabPane = document.querySelector(lastActiveTab);
            if (tabPane) {
                tabPane.classList.add('active', 'show');
            }
        }
    }
    
    // Save tab state when tabs are clicked
    const allTabButtons = document.querySelectorAll('button[data-bs-toggle="tab"]');
    allTabButtons.forEach(button => {
        button.addEventListener('click', function() {
            const target = this.getAttribute('data-bs-target');
            localStorage.setItem('modelScoresActiveTab', target);
        });
    });
    
    {% if pairwise_data_json %}
    const pairwiseData = {{ pairwise_data_json|safe }};
    
    // Create the pairwise comparison table dynamically
    const tableContainer = document.querySelector('#pairwise-table-container');
    if (tableContainer && pairwiseData && pairwiseData.models && pairwiseData.matrix) {
        // Compute maximum absolute pairwise advantage for scaling: diff = wins(i,j) - wins(j,i)
        let maxAbsDiff = 0;
        for (let i = 0; i < pairwiseData.matrix.length; i++) {
            for (let j = 0; j < pairwiseData.matrix.length; j++) {
                if (i === j) continue;
                const vij = (pairwiseData.matrix[i][j] ?? 0);
                const vji = (pairwiseData.matrix[j][i] ?? 0);
                const diff = vij - vji;
                const ad = Math.abs(diff);
                if (ad > maxAbsDiff) maxAbsDiff = ad;
            }
        }
        
        // Color interpolation function for a given diff value centered at 0
        function getHeatmapColorForDiff(diff) {
            // Normalize to [0,1] with 0.5 at diff=0
            const normalized = maxAbsDiff > 0 ? (diff + maxAbsDiff) / (2 * maxAbsDiff) : 0.5;
            
            // Create color gradient from red (negative) through white (0) to green (positive)
            let r, g, b;
            if (normalized < 0.5) {
                // Red to white
                const intensity = normalized * 2;  // 0 to 1
                r = 255;
                g = Math.round(150 + (255 - 150) * intensity);  // 150 to 255
                b = Math.round(150 + (255 - 150) * intensity);  // 150 to 255
            } else {
                // White to green
                const intensity = (normalized - 0.5) * 2;  // 0 to 1
                r = Math.round(255 - (255 - 150) * intensity);  // 255 to 150
                g = 255;
                b = Math.round(255 - (255 - 150) * intensity);  // 255 to 150
            }
            
            return `rgba(${r}, ${g}, ${b}, 0.6)`;
        }
        
        let tableHtml = '<table class="table pairwise-table"><thead><tr>';
        tableHtml += '<th style="width: 200px;">Model ↓ vs Model →</th>';
        
        // Add column headers
        pairwiseData.models.forEach(model => {
            tableHtml += `<th style="writing-mode: vertical-rl; text-orientation: mixed; height: 150px;">
                ${model.name}
                <span class="badge tier-badge bg-info">T${model.tier}</span>
            </th>`;
        });
        tableHtml += '</tr></thead><tbody>';
        
        // Add rows
        pairwiseData.models.forEach((model, rowIdx) => {
            tableHtml += '<tr>';
            tableHtml += `<td class="model-header">
                ${model.name}
                <span class="badge tier-badge bg-info">T${model.tier}</span>
            </td>`;
            
            pairwiseData.matrix[rowIdx].forEach((value, colIdx) => {
                if (rowIdx === colIdx) {
                    tableHtml += '<td class="diagonal">—</td>';
                } else {
                    const symmetric = (pairwiseData.matrix[colIdx][rowIdx] ?? 0);
                    const diff = (value ?? 0) - symmetric;
                    const bgColor = getHeatmapColorForDiff(diff);
                    const textStyle = (maxAbsDiff > 0 && Math.abs(diff) / maxAbsDiff > 0.7) ? 'font-weight: bold;' : '';
                    tableHtml += `<td style="background-color: ${bgColor}; ${textStyle}">${value !== null ? value : 0}</td>`;
                }
            });
            tableHtml += '</tr>';
        });
        tableHtml += '</tbody></table>';
        
        tableContainer.innerHTML = tableHtml;
    }
    {% endif %}
    
    // Initialize other charts and features as needed
    
    // Handle benchmark inclusion checkboxes
    const checkboxes = document.querySelectorAll('.benchmark-inclusion-checkbox');
    checkboxes.forEach(checkbox => {
        checkbox.addEventListener('change', function() {
            const questionId = this.dataset.questionId;
            const isChecked = this.checked;
            
            fetch(`{% url 'model_evaluation:toggle_benchmark_inclusion' 0 %}`.replace('0', questionId), {
                method: 'POST',
                headers: {
                    'X-CSRFToken': '{{ csrf_token }}',
                    'Content-Type': 'application/json'
                },
            })
            .then(response => response.json())
            .then(data => {
                if (!data.success) {
                    console.error('Failed to update benchmark inclusion:', data.error);
                    this.checked = !isChecked; // Revert on failure
                }
            })
            .catch(error => {
                console.error('Error updating benchmark inclusion:', error);
                this.checked = !isChecked; // Revert on error
            });
        });
    });
    
    // Track which charts have been initialized
    let chartsInitialized = {
        grading: false,
        progress: false,
        wordcloud: false,
        variance: false
    };

    // Map grading datasets by chart id for PDF export fallback
    const gradingDataById = {
        {% if grading_stats_json.error_incorrect_logic %}
        'incorrectLogicChart': {{ grading_stats_json.error_incorrect_logic|safe }},
        {% endif %}
        {% if grading_stats_json.error_hallucinated %}
        'hallucinatedChart': {{ grading_stats_json.error_hallucinated|safe }},
        {% endif %}
        {% if grading_stats_json.error_calculation %}
        'calculationErrorChart': {{ grading_stats_json.error_calculation|safe }},
        {% endif %}
        {% if grading_stats_json.error_conceptual %}
        'conceptualErrorChart': {{ grading_stats_json.error_conceptual|safe }},
        {% endif %}
        {% if grading_stats_json.achievement_understanding %}
        'understandingChart': {{ grading_stats_json.achievement_understanding|safe }},
        {% endif %}
        {% if grading_stats_json.achievement_correct_result %}
        'correctResultChart': {{ grading_stats_json.achievement_correct_result|safe }},
        {% endif %}
        {% if grading_stats_json.achievement_insight %}
        'insightChart': {{ grading_stats_json.achievement_insight|safe }},
        {% endif %}
        {% if grading_stats_json.achievement_usefulness %}
        'usefulnessChart': {{ grading_stats_json.achievement_usefulness|safe }},
        {% endif %}
    };
    
    // Initialize charts when tabs are clicked
    const gradingTabButton = document.querySelector('#grading-tab');
    const progressTabButton = document.querySelector('#progress-tab');
    const wordcloudTabButton = document.querySelector('#wordcloud-tab');
    const varianceTabButton = document.querySelector('#variance-tab');

    if (gradingTabButton) {
        gradingTabButton.addEventListener('click', function () {
            setTimeout(function() {
                if (!chartsInitialized.grading) {
                    initializeGradingCharts();
                    chartsInitialized.grading = true;
                }
            }, 200);
        });
    }

    if (progressTabButton) {
        progressTabButton.addEventListener('click', function () {
            setTimeout(function() {
                if (!chartsInitialized.progress) {
                    initializeProgressChart();
                    chartsInitialized.progress = true;
                }
            }, 200);
        });
    }

    if (wordcloudTabButton) {
        wordcloudTabButton.addEventListener('click', function () {
            setTimeout(function() {
                if (!chartsInitialized.wordcloud) {
                    initializeWordCloud();
                    chartsInitialized.wordcloud = true;
                }
            }, 200);
        });
    }

    if (varianceTabButton) {
        varianceTabButton.addEventListener('click', function () {
            setTimeout(function() {
                if (!chartsInitialized.variance) {
                    initializeVarianceChart();
                    chartsInitialized.variance = true;
                }
            }, 200);
        });
    }
    
    // Function to initialize grading charts (Chart.js, original look)
    function initializeGradingCharts() {
        // Error category charts (Red = Has Error, Green = No Error)
        {% if grading_stats_json.error_incorrect_logic %}
        createGradingChart('incorrectLogicChart', {{ grading_stats_json.error_incorrect_logic|safe }}, 'error');
        {% endif %}
        {% if grading_stats_json.error_hallucinated %}
        createGradingChart('hallucinatedChart', {{ grading_stats_json.error_hallucinated|safe }}, 'error');
        {% endif %}
        {% if grading_stats_json.error_calculation %}
        createGradingChart('calculationErrorChart', {{ grading_stats_json.error_calculation|safe }}, 'error');
        {% endif %}
        {% if grading_stats_json.error_conceptual %}
        createGradingChart('conceptualErrorChart', {{ grading_stats_json.error_conceptual|safe }}, 'error');
        {% endif %}

        // Achievement category charts (Green = Achievement Present, Red = Achievement Absent)
        {% if grading_stats_json.achievement_understanding %}
        createGradingChart('understandingChart', {{ grading_stats_json.achievement_understanding|safe }}, 'achievement');
        {% endif %}
        {% if grading_stats_json.achievement_correct_result %}
        createGradingChart('correctResultChart', {{ grading_stats_json.achievement_correct_result|safe }}, 'achievement');
        {% endif %}
        {% if grading_stats_json.achievement_insight %}
        createGradingChart('insightChart', {{ grading_stats_json.achievement_insight|safe }}, 'achievement');
        {% endif %}
        {% if grading_stats_json.achievement_usefulness %}
        createGradingChart('usefulnessChart', {{ grading_stats_json.achievement_usefulness|safe }}, 'achievement');
        {% endif %}
    }
    
    // Function to initialize progress chart
    function initializeProgressChart() {
        {% if progress_stats_json %}
        createProgressGradeChart('progressGradeChart', {{ progress_stats_json|safe }});
        {% endif %}
    }
    
    // Function to initialize variance chart
    function initializeVarianceChart() {
        {% if variance_data_json %}
        createVarianceChart('varianceChart', {{ variance_data_json|safe }});
        {% endif %}
    }

    // Function to initialize word cloud
    function initializeWordCloud() {
        {% if word_cloud_json %}
        const wordCloudData = {{ word_cloud_json|safe }};
        const container = document.getElementById('wordCloudContainer');
        
        if (container && wordCloudData && wordCloudData.length > 0) {
            // Clear any existing content
            container.innerHTML = '';
            
            // Get container dimensions
            const width = container.offsetWidth;
            const height = 560;
            
            // Create SVG element
            const svg = d3.select(container)
                .append('svg')
                .attr('width', width)
                .attr('height', height);
            
            const g = svg.append('g')
                .attr('transform', `translate(${width/2},${height/2})`);
            
            // Calculate font sizes deterministically based on count
            const maxCount = Math.max(...wordCloudData.map(d => d.count));
            const minCount = Math.min(...wordCloudData.map(d => d.count));
            const sizeScale = d3.scaleLinear()
                .domain([minCount, maxCount])
                .range([16, 80]);  // Min and max font sizes
            
            // Prepare words with deterministic sizes
            const words = wordCloudData.map(d => ({
                text: d.text,
                size: sizeScale(d.count),
                count: d.count,
                weight: d.weight
            }));
            
            // Color scale based on count
            const colorScale = d3.scaleLinear()
                .domain([minCount, maxCount])
                .range(['#66b3ff', '#004080']);
            
            // Create the layout with fixed random seed for consistency
            const layout = d3.layout.cloud()
                .size([width, height])
                .words(words)
                .padding(5)
                .rotate(() => 0)  // No rotation for better readability
                .font('-apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif')
                .fontSize(d => d.size)
                .random(() => 0.5)  // Fixed seed for deterministic layout
                .on('end', draw);
            
            layout.start();
            
            // Draw function
            function draw(words) {
                const text = g.selectAll('text')
                    .data(words)
                    .enter().append('text')
                    .style('font-size', d => `${d.size}px`)
                    .style('font-family', '-apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif')
                    .style('font-weight', d => d.size > 40 ? 'bold' : 'normal')
                    .style('fill', d => colorScale(d.count))
                    .style('cursor', 'pointer')
                    .attr('text-anchor', 'middle')
                    .attr('transform', d => `translate(${d.x},${d.y})`)
                    .text(d => d.text);
                
                // Add hover effect
                text.on('mouseover', function(event, d) {
                    d3.select(this)
                        .transition()
                        .duration(200)
                        .style('opacity', 0.7)
                        .style('font-size', d => `${d.size * 1.1}px`);
                    
                    // Add tooltip
                    const tooltip = d3.select('body').append('div')
                        .attr('class', 'wordcloud-tooltip')
                        .style('position', 'absolute')
                        .style('background', 'rgba(0, 0, 0, 0.8)')
                        .style('color', 'white')
                        .style('padding', '5px 10px')
                        .style('border-radius', '5px')
                        .style('font-size', '12px')
                        .style('pointer-events', 'none')
                        .style('z-index', '1000')
                        .html(`${d.text}: ${d.count} ${d.count === 1 ? 'occurrence' : 'occurrences'}`);
                    
                    tooltip.style('left', (event.pageX + 10) + 'px')
                        .style('top', (event.pageY - 25) + 'px');
                })
                .on('mouseout', function(event, d) {
                    d3.select(this)
                        .transition()
                        .duration(200)
                        .style('opacity', 1)
                        .style('font-size', d => `${d.size}px`);
                    
                    // Remove tooltip
                    d3.selectAll('.wordcloud-tooltip').remove();
                })
                .on('click', function(event, d) {
                    console.log(`Tag: ${d.text}, Count: ${d.count}`);
                });
            }
        }
        {% endif %}
    }
    
    // Check if any tab is active on load and initialize its charts
    setTimeout(function() {
        const activeGradingTab = document.querySelector('#grading.active, #grading.show');
        const activeProgressTab = document.querySelector('#progress.active, #progress.show');
        const activeWordcloudTab = document.querySelector('#wordcloud.active, #wordcloud.show');
        const activeVarianceTab = document.querySelector('#variance.active, #variance.show');

        if (activeGradingTab && !chartsInitialized.grading) {
            initializeGradingCharts();
            chartsInitialized.grading = true;
        }

        if (activeProgressTab && !chartsInitialized.progress) {
            initializeProgressChart();
            chartsInitialized.progress = true;
        }

        if (activeWordcloudTab && !chartsInitialized.wordcloud) {
            initializeWordCloud();
            chartsInitialized.wordcloud = true;
        }

        if (activeVarianceTab && !chartsInitialized.variance) {
            initializeVarianceChart();
            chartsInitialized.variance = true;
        }
    }, 300);
    
    // Subquestion Results Chart (from benchmark_results)
    {% if models_json %}
    createSubquestionResultsChart('subquestionResultsChart', {{ models_json|safe }});
    {% endif %}
    
    function createSubquestionResultsChart(canvasId, modelsData) {
        const canvas = document.getElementById(canvasId);
        if (!canvas) return;
        
        // Prepare data for horizontal bar chart
        const modelNames = [];
        const scores = [];
        const backgroundColors = [];
        
        // Process each model (already sorted by score)
        modelsData.forEach(model => {
            // Use display name without tier label for cleaner view
            modelNames.push(model.model.display_name);
            
            // Use score percentage or 0 for N/A
            const score = model.score_percentage !== null ? model.score_percentage : 0;
            scores.push(score.toFixed(1));
            
            // Use uniform professional color for all bars
            // Only distinguish N/A values with gray
            const color = model.score_percentage === null ? '#6c757d' : '#0d6efd';  // Gray for N/A, Bootstrap primary blue for data
            backgroundColors.push(color);
        });
        
        // Create the chart
        const ctx = canvas.getContext('2d');
        new Chart(ctx, {
            type: 'bar',
            data: {
                labels: modelNames,
                datasets: [{
                    label: 'Average Score (%)',
                    data: scores,
                    backgroundColor: backgroundColors,
                    borderColor: backgroundColors,
                    borderWidth: 1
                }]
            },
            options: {
                indexAxis: 'y',  // Horizontal bars
                responsive: true,
                maintainAspectRatio: false,
                plugins: {
                    title: {
                        display: false
                    },
                    legend: {
                        display: false  // Hide legend since we only have one dataset
                    },
                    tooltip: {
                        callbacks: {
                            label: function(context) {
                                const modelData = modelsData[context.dataIndex];
                                const score = context.parsed.x;
                                const questionsText = `${modelData.questions_attempted}/${modelData.questions_total} questions`;
                                
                                if (modelData.score_percentage === null) {
                                    return `No subquestions evaluated`;
                                }
                                
                                return `Score: ${score}% (${questionsText})`;
                            }
                        }
                    }
                },
                scales: {
                    x: {
                        title: {
                            display: true,
                            text: 'Average Score (%)'
                        },
                        min: 0,
                        max: 100,
                        ticks: {
                            callback: function(value) {
                                return value + '%';
                            }
                        }
                    },
                    y: {
                        title: {
                            display: true,
                            text: 'Models'
                        }
                    }
                }
            }
        });
    }
    
    // Chart creation function for variance/error bars
    function createVarianceChart(canvasId, varianceData) {
        const canvas = document.getElementById(canvasId);
        if (!canvas) return;

        // Prepare data for horizontal bar chart with error bars
        const modelNames = [];
        const scores = [];
        const sigmas = [];
        const errorBarsLower = [];
        const errorBarsUpper = [];
        const backgroundColors = [];

        // Process each model
        varianceData.forEach(model => {
            modelNames.push(model.model);

            const score = model.average_score !== null ? model.average_score : 0;
            const sigma = model.sigma !== null ? model.sigma : 0;

            scores.push(score.toFixed(1));
            sigmas.push(sigma);

            // Calculate error bar bounds (ensuring they don't go below 0 or above 100)
            const lower = Math.max(0, score - sigma);
            const upper = Math.min(100, score + sigma);
            errorBarsLower.push(lower.toFixed(1));
            errorBarsUpper.push(upper.toFixed(1));

            // Use tier-based colors
            const tierColors = {
                1: '#0d6efd',  // Bootstrap primary blue
                2: '#6610f2',  // Bootstrap indigo
                3: '#6f42c1',  // Bootstrap purple
                4: '#d63384',  // Bootstrap pink
            };
            const color = tierColors[model.tier] || '#6c757d';
            backgroundColors.push(color);
        });

        // Create the chart
        const ctx = canvas.getContext('2d');
        new Chart(ctx, {
            type: 'bar',
            data: {
                labels: modelNames,
                datasets: [{
                    label: 'Average Score (%)',
                    data: scores,
                    backgroundColor: backgroundColors,
                    borderColor: backgroundColors,
                    borderWidth: 1,
                    // Error bars configuration
                    errorBars: {
                        'Average Score (%)': {
                            plus: sigmas,
                            minus: sigmas
                        }
                    }
                }]
            },
            options: {
                indexAxis: 'y',  // Horizontal bars
                responsive: true,
                maintainAspectRatio: false,
                plugins: {
                    title: {
                        display: false
                    },
                    legend: {
                        display: false
                    },
                    tooltip: {
                        callbacks: {
                            label: function(context) {
                                const score = parseFloat(context.parsed.x);
                                const sigma = sigmas[context.dataIndex];
                                const lower = errorBarsLower[context.dataIndex];
                                const upper = errorBarsUpper[context.dataIndex];
                                const numQuestions = varianceData[context.dataIndex].num_questions;
                                const numEvals = varianceData[context.dataIndex].num_evaluations;

                                return [
                                    `Score: ${score.toFixed(1)}%`,
                                    `σ: ${sigma.toFixed(2)}`,
                                    `Range: [${lower}, ${upper}]`,
                                    `Questions: ${numQuestions}`,
                                    `Total evaluations: ${numEvals}`
                                ];
                            }
                        }
                    }
                },
                scales: {
                    x: {
                        title: {
                            display: true,
                            text: 'Average Score (%)'
                        },
                        min: 0,
                        max: 100,
                        ticks: {
                            callback: function(value) {
                                return value + '%';
                            }
                        }
                    },
                    y: {
                        title: {
                            display: true,
                            text: 'Models'
                        }
                    }
                }
            },
            plugins: [{
                // Custom plugin to draw error bars
                afterDatasetsDraw: function(chart) {
                    const ctx = chart.ctx;
                    const yAxis = chart.scales.y;
                    const xAxis = chart.scales.x;

                    chart.data.datasets.forEach((dataset, datasetIndex) => {
                        const meta = chart.getDatasetMeta(datasetIndex);

                        meta.data.forEach((bar, index) => {
                            const score = parseFloat(scores[index]);
                            const sigma = sigmas[index];
                            const lower = Math.max(0, score - sigma);
                            const upper = Math.min(100, score + sigma);

                            // Get pixel positions
                            const y = bar.y;
                            const xCenter = bar.x;
                            const xLower = xAxis.getPixelForValue(lower);
                            const xUpper = xAxis.getPixelForValue(upper);

                            // Draw horizontal error bar line
                            ctx.save();
                            ctx.strokeStyle = '#000000';
                            ctx.lineWidth = 2;
                            ctx.beginPath();
                            ctx.moveTo(xLower, y);
                            ctx.lineTo(xUpper, y);
                            ctx.stroke();

                            // Draw left cap (|)
                            ctx.beginPath();
                            ctx.moveTo(xLower, y - 5);
                            ctx.lineTo(xLower, y + 5);
                            ctx.stroke();

                            // Draw right cap (|)
                            ctx.beginPath();
                            ctx.moveTo(xUpper, y - 5);
                            ctx.lineTo(xUpper, y + 5);
                            ctx.stroke();

                            ctx.restore();
                        });
                    });
                }
            }]
        });
    }

    // Chart creation functions (Chart.js, original)
    function createGradingChart(canvasId, categoryData, categoryType = 'error') {
        // Persist data for vector export
        window.gradingChartData = window.gradingChartData || {};
        // Skip if no canvas element
        const canvas = document.getElementById(canvasId);
        if (!canvas) return;
        
        // Prepare data for Chart.js
        const modelNames = [];
        const yesData = [];
        const notSureData = [];
        const noData = [];
        const naData = [];
        
        // Extract data from each model
        categoryData.models.forEach(model => {
            // Add tier label to model name
            const tierLabel = `[T${model.tier}]`;
            const displayName = `${model.model_name} ${tierLabel}`;
            modelNames.push(displayName);
            
            // Add percentages (rounded to 1 decimal)
            yesData.push(model.percentages.yes.toFixed(1));
            notSureData.push(model.percentages.not_sure.toFixed(1));
            noData.push(model.percentages.no.toFixed(1));
            naData.push((model.percentages.na || 0).toFixed(1));
        });
        
        // Define colors based on category type
        let yesColor, noColor;
        if (categoryType === 'error') {
            // For error categories: Yes = Red (error present), No = Green (no error)
            yesColor = '#dc3545';
            noColor = '#28a745';
        } else {
            // For achievement categories: Yes = Green (achievement present), No = Red (no achievement)
            yesColor = '#28a745';
            noColor = '#dc3545';
        }
        // Store for PDF export
        window.gradingChartData[canvasId] = {
            names: modelNames,
            yes: yesData.map(parseFloat),
            not_sure: notSureData.map(parseFloat),
            no: noData.map(parseFloat),
            na: naData.map(parseFloat),
            colors: { yes: yesColor, no: noColor, not_sure: '#6c757d', na: '#000000' }
        };
        
        // Create the chart
        const ctx = canvas.getContext('2d');
        new Chart(ctx, {
            type: 'bar',
            data: {
                labels: modelNames,
                datasets: [
                    {
                        label: 'Yes',
                        data: yesData,
                        backgroundColor: yesColor,
                        borderColor: yesColor,
                        borderWidth: 1
                    },
                    {
                        label: 'Not Sure',
                        data: notSureData,
                        backgroundColor: '#6c757d',  // Gray for "Not Sure" (always the same)
                        borderColor: '#6c757d',
                        borderWidth: 1
                    },
                    {
                        label: 'No',
                        data: noData,
                        backgroundColor: noColor,
                        borderColor: noColor,
                        borderWidth: 1
                    },
                    {
                        label: 'N/A',
                        data: naData,
                        backgroundColor: '#000000',  // Black for N/A (better visibility)
                        borderColor: '#000000',
                        borderWidth: 1
                    }
                ]
            },
            options: {
                indexAxis: 'y',  // Horizontal bars
                responsive: true,
                maintainAspectRatio: false,
                plugins: {
                    title: {
                        display: false
                    },
                    legend: {
                        position: 'top',
                    },
                    tooltip: {
                        callbacks: {
                            label: function(context) {
                                const label = context.dataset.label || '';
                                const value = context.parsed.x || 0;
                                const modelIndex = context.dataIndex;
                                const modelData = categoryData.models[modelIndex];
                                
                                // Get averaged count for this response type
                                let avgCount = 0;
                                if (label === 'Yes') avgCount = modelData.averaged_counts.yes;
                                else if (label === 'Not Sure') avgCount = modelData.averaged_counts.not_sure;
                                else if (label === 'No') avgCount = modelData.averaged_counts.no;
                                else if (label === 'N/A') avgCount = modelData.averaged_counts.na || 0;
                                
                                // Show questions instead of responses
                                const questionsText = modelData.total_questions === 1 ? 'question' : 'questions';
                                return `${label}: ${value}% (${avgCount} avg across ${modelData.total_questions} ${questionsText})`;
                            }
                        }
                    }
                },
                scales: {
                    x: {
                        stacked: true,
                        title: {
                            display: true,
                            text: 'Percentage of Responses'
                        },
                        min: 0,
                        max: 100,
                        ticks: {
                            callback: function(value) {
                                return value + '%';
                            }
                        }
                    },
                    y: {
                        stacked: true,
                        title: {
                            display: true,
                            text: 'Models (ordered by subquestion score)'
                        }
                    }
                }
            }
        });
    }

    // Vector PDF export via browser print of off-screen SVG
    window.exportGradingChartPDF = async function(chartId, filename) {
        // Prefer stored data from rendered Chart.js; fallback to server-provided JSON map
        let data = (window.gradingChartData || {})[chartId];
        const container = document.getElementById(chartId);
        if (!container) { alert('Chart container not found.'); return; }
        if (!data) {
            const cat = gradingDataById[chartId];
            if (!cat) { alert('No data available for export yet. Try clicking the tab first.'); return; }
            const names = cat.models.map(m => `${m.model_name} [T${m.tier}]`);
            const yes = cat.models.map(m => +m.percentages.yes || 0);
            const not_sure = cat.models.map(m => +m.percentages.not_sure || 0);
            const no = cat.models.map(m => +m.percentages.no || 0);
            const na = cat.models.map(m => +(m.percentages.na || 0));
            data = { names, yes, not_sure, no, na, colors: { yes: '#dc3545', no: '#28a745', not_sure: '#6c757d', na: '#000000' } };
        }
        const width = Math.max(container.clientWidth || 1000, 1000);
        const margin = { top: 16, right: 24, bottom: 32, left: 220 };
        const plotW = width - margin.left - margin.right;
        const rowH = 20;
        const gap = 6;
        const n = data.names.length;
        const svgH = margin.top + margin.bottom + n * (rowH + gap) + 40;

        // Build SVG markup as string
        const x = d3.scaleLinear().domain([0, 100]).range([0, plotW]);
        let svgParts = [];
        svgParts.push(`<svg xmlns=\"http://www.w3.org/2000/svg\" width=\"${width}\" height=\"${svgH}\" style=\"font-family:-apple-system,BlinkMacSystemFont,'Segoe UI',Roboto,sans-serif;font-size:12px\">`);
        svgParts.push(`<g transform=\"translate(${margin.left},${margin.top})\">`);
        // X axis ticks (0..100 in 20% steps)
        for (let t = 0; t <= 100; t += 20) {
            const tx = x(t);
            svgParts.push(`<line x1=\"${tx}\" y1=\"0\" x2=\"${tx}\" y2=\"${svgH - margin.top - margin.bottom}\" stroke=\"#eee\"/>`);
            svgParts.push(`<text x=\"${tx}\" y=\"${svgH - margin.top - margin.bottom + 20}\" text-anchor=\"middle\">${t}%</text>`);
        }
        // Bars
        const parts = [
            { key: 'yes', color: data.colors.yes, label: 'Yes' },
            { key: 'not_sure', color: data.colors.not_sure, label: 'Not Sure' },
            { key: 'no', color: data.colors.no, label: 'No' },
            { key: 'na', color: data.colors.na, label: 'N/A' },
        ];
        for (let i = 0; i < n; i++) {
            let acc = 0;
            for (const p of parts) {
                const value = (data[p.key][i] || 0);
                const w = x(value);
                const x0 = x(acc);
                const y0 = i * (rowH + gap);
                svgParts.push(`<rect x=\"${x0}\" y=\"${y0}\" width=\"${w}\" height=\"${rowH}\" fill=\"${p.color}\"/>`);
                acc += value;
            }
        }
        svgParts.push(`</g>`);
        // Labels
        svgParts.push(`<g transform=\"translate(${margin.left - 10},${margin.top})\">`);
        for (let i = 0; i < n; i++) {
            const yLbl = i * (rowH + gap) + rowH * 0.7;
            svgParts.push(`<text x=\"-10\" y=\"${yLbl}\" text-anchor=\"end\">${data.names[i]}</text>`);
        }
        svgParts.push(`</g>`);
        svgParts.push(`</svg>`);
        const svgHTML = `<!doctype html><html><head><title>${filename}</title><style>@page{size:landscape;margin:10mm;}body{margin:0;}</style></head><body>${svgParts.join('')}</body></html>`;

        // Print via hidden iframe (user can save as PDF)
        const iframe = document.createElement('iframe');
        iframe.style.position = 'absolute';
        iframe.style.top = '-10000px';
        iframe.style.left = '-10000px';
        iframe.width = '0';
        iframe.height = '0';
        document.body.appendChild(iframe);
        const doc = iframe.contentWindow.document;
        doc.open();
        doc.write(svgHTML);
        doc.close();
        iframe.onload = function(){
            iframe.contentWindow.focus();
            iframe.contentWindow.print();
            setTimeout(() => document.body.removeChild(iframe), 1000);
        };
    }
    
    function createProgressGradeChart(canvasId, progressData) {
        // Skip if no canvas element
        const canvas = document.getElementById(canvasId);
        if (!canvas) return;
        
        // Prepare data for Chart.js
        const modelNames = [];
        const noProgressData = [];      // Grade 0
        const minorProgressData = [];   // Grade 1
        const majorProgressData = [];   // Grade 2
        const completeData = [];        // Grade 3
        
        // Extract data from each model
        progressData.models.forEach(model => {
            // Add tier label to model name
            const tierLabel = `[T${model.tier}]`;
            const displayName = `${model.model_name} ${tierLabel}`;
            modelNames.push(displayName);
            
            // Add percentages (rounded to 1 decimal)
            noProgressData.push(model.percentages[0].toFixed(1));
            minorProgressData.push(model.percentages[1].toFixed(1));
            majorProgressData.push(model.percentages[2].toFixed(1));
            completeData.push(model.percentages[3].toFixed(1));
        });
        
        // Create the chart with reversed order (Complete Solution first)
        const ctx = canvas.getContext('2d');
        new Chart(ctx, {
            type: 'bar',
            data: {
                labels: modelNames,
                datasets: [
                    {
                        label: 'Complete Solution (3)',
                        data: completeData,
                        backgroundColor: '#28a745',  // Green
                        borderColor: '#28a745',
                        borderWidth: 1
                    },
                    {
                        label: 'Major Progress (2)',
                        data: majorProgressData,
                        backgroundColor: '#17a2b8',  // Cyan/Info Blue
                        borderColor: '#17a2b8',
                        borderWidth: 1
                    },
                    {
                        label: 'Minor Progress (1)',
                        data: minorProgressData,
                        backgroundColor: '#ffc107',  // Yellow/Amber
                        borderColor: '#ffc107',
                        borderWidth: 1
                    },
                    {
                        label: 'No Progress (0)',
                        data: noProgressData,
                        backgroundColor: '#dc3545',  // Red
                        borderColor: '#dc3545',
                        borderWidth: 1
                    }
                ]
            },
            options: {
                indexAxis: 'y',  // Horizontal bars
                responsive: true,
                maintainAspectRatio: false,
                plugins: {
                    title: {
                        display: false
                    },
                    legend: {
                        position: 'top',
                    },
                    tooltip: {
                        callbacks: {
                            label: function(context) {
                                const label = context.dataset.label || '';
                                const value = context.parsed.x || 0;
                                const modelIndex = context.dataIndex;
                                const modelData = progressData.models[modelIndex];
                                
                                // Get grade number from label
                                const gradeMatch = label.match(/\((\d)\)/);
                                const grade = gradeMatch ? parseInt(gradeMatch[1]) : 0;

                                // Get count for this grade
                                const count = modelData.counts[grade];

                                // Show questions and average progress
                                const questionsText = modelData.total_questions === 1 ? 'question' : 'questions';
                                const avgProgress = modelData.average_progress !== null ?
                                    ` | Avg: ${modelData.average_progress.toFixed(2)}` : '';

                                return `${label}: ${value}% (${count} of ${modelData.total_questions} ${questionsText}${avgProgress})`;
                            }
                        }
                    }
                },
                scales: {
                    x: {
                        stacked: true,
                        title: {
                            display: true,
                            text: 'Percentage of Responses'
                        },
                        min: 0,
                        max: 100,
                        ticks: {
                            callback: function(value) {
                                return value + '%';
                            }
                        }
                    },
                    y: {
                        stacked: true,
                        title: {
                            display: true,
                            text: 'Models (ordered by subquestion score)'
                        }
                    }
                }
            }
        });
    }
    
    // Export functions for PNG and JPG
    window.exportChart = function(chartId, filename, format) {
        const chart = Chart.getChart(chartId);
        if (!chart) {
            alert('Chart not found');
            return;
        }
        
        if (format === 'png') {
            exportChartAsPNG(chart, filename);
        } else if (format === 'jpg') {
            exportChartAsJPG(chart, filename);
        }
    }
    
    function exportChartAsPNG(chart, filename) {
        // Save current device pixel ratio
        const originalRatio = window.devicePixelRatio;
        
        // Increase resolution for export (8x ~ 800 DPI equivalent on most displays)
        // Be mindful that very large charts may consume more memory
        window.devicePixelRatio = 8;
        
        // Force chart to update with new pixel ratio
        chart.resize();
        
        // Wait for chart to redraw at higher resolution
        setTimeout(() => {
            // Get the high-resolution image
            const url = chart.toBase64Image();
            
            // Create download link
            const a = document.createElement('a');
            a.href = url;
            a.download = filename + '_hires.png';
            document.body.appendChild(a);
            a.click();
            document.body.removeChild(a);
            
            // Restore original pixel ratio
            window.devicePixelRatio = originalRatio;
            chart.resize();
        }, 150);
    }
    
    function exportChartAsJPG(chart, filename) {
        // Save current device pixel ratio
        const originalRatio = window.devicePixelRatio;
        
        // Increase resolution for JPG export (6x)
        // JPG compression will reduce file size while keeping quality
        window.devicePixelRatio = 6;
        
        // Force chart to update with new pixel ratio
        chart.resize();
        
        // Wait for chart to redraw at higher resolution
        setTimeout(() => {
            // Get the canvas element
            const canvas = chart.canvas;
            
            // Create a temporary canvas with white background for JPG
            const tempCanvas = document.createElement('canvas');
            tempCanvas.width = canvas.width;
            tempCanvas.height = canvas.height;
            const tempCtx = tempCanvas.getContext('2d');
            
            // Fill with white background (JPG doesn't support transparency)
            tempCtx.fillStyle = '#FFFFFF';
            tempCtx.fillRect(0, 0, tempCanvas.width, tempCanvas.height);
            
            // Draw the chart on top
            tempCtx.drawImage(canvas, 0, 0);
            
            // Convert to JPG with higher quality setting
            const url = tempCanvas.toDataURL('image/jpeg', 0.98);
            
            // Create download link
            const a = document.createElement('a');
            a.href = url;
            a.download = filename + '.jpg';
            document.body.appendChild(a);
            a.click();
            document.body.removeChild(a);
            
            // Restore original pixel ratio
            window.devicePixelRatio = originalRatio;
            chart.resize();
        }, 150);
    }
    
    // Export Word Cloud
    window.exportWordCloud = function(format) {
        const svg = document.querySelector('#wordCloudContainer svg');
        if (!svg) {
            alert('Word cloud not found');
            return;
        }
        
        // Get SVG dimensions
        const width = svg.getAttribute('width');
        const height = svg.getAttribute('height');
        
        // Create a canvas element
        const canvas = document.createElement('canvas');
        canvas.width = width * 4; // 4x resolution for better quality
        canvas.height = height * 4;
        const ctx = canvas.getContext('2d');
        
        // Scale for higher resolution
        ctx.scale(4, 4);
        
        // White background
        ctx.fillStyle = '#FFFFFF';
        ctx.fillRect(0, 0, width, height);
        
        // Convert SVG to string
        const svgData = new XMLSerializer().serializeToString(svg);
        const svgBlob = new Blob([svgData], {type: 'image/svg+xml;charset=utf-8'});
        const url = URL.createObjectURL(svgBlob);
        
        // Create image from SVG
        const img = new Image();
        img.onload = function() {
            ctx.drawImage(img, 0, 0, width, height);
            URL.revokeObjectURL(url);
            
            // Export based on format
            let dataUrl;
            let filename;
            if (format === 'png') {
                dataUrl = canvas.toDataURL('image/png');
                filename = 'word_cloud.png';
            } else {
                dataUrl = canvas.toDataURL('image/jpeg', 0.92);
                filename = 'word_cloud.jpg';
            }
            
            // Create download link
            const a = document.createElement('a');
            a.href = dataUrl;
            a.download = filename;
            document.body.appendChild(a);
            a.click();
            document.body.removeChild(a);
        };
        img.src = url;
    };
    
    // Export Word Cloud as PDF (preserves SVG vector format)
    window.exportWordCloudAsPDF = function() {
        const svg = document.querySelector('#wordCloudContainer svg');
        if (!svg) {
            alert('Word cloud not found');
            return;
        }
        
        // Clone the SVG exactly as it is
        const clonedSvg = svg.cloneNode(true);
        
        // Remove any transform on the root SVG that might offset it
        clonedSvg.removeAttribute('transform');
        
        // Ensure SVG has proper attributes for scaling
        const width = clonedSvg.getAttribute('width') || '800';
        const height = clonedSvg.getAttribute('height') || '600';
        clonedSvg.setAttribute('viewBox', `0 0 ${width} ${height}`);
        clonedSvg.setAttribute('preserveAspectRatio', 'xMidYMid meet');
        clonedSvg.removeAttribute('width');
        clonedSvg.removeAttribute('height');
        
        // Create a hidden iframe for printing
        const iframe = document.createElement('iframe');
        iframe.style.position = 'absolute';
        iframe.style.top = '-10000px';
        iframe.style.left = '-10000px';
        iframe.style.width = '0';
        iframe.style.height = '0';
        document.body.appendChild(iframe);
        
        const printWindow = iframe.contentWindow;
        
        // Build HTML content with SVG directly (preserves vector format)
        const styles = `
            <style>
                @page {
                    size: landscape;
                    margin: 0;
                }
                
                * {
                    margin: 0;
                    padding: 0;
                    box-sizing: border-box;
                }
                
                @media print {
                    html, body { 
                        margin: 0;
                        padding: 0;
                        width: 100%;
                        overflow: hidden;
                        background: white;
                    }
                    
                    body { 
                        display: flex;
                        justify-content: center;
                        align-items: center;
                        padding: 5mm;
                        box-sizing: border-box;
                    }
                    
                    svg {
                        display: block;
                        width: calc(297mm - 10mm) !important;  /* A4 landscape width minus margins */
                        height: calc(210mm - 10mm) !important;  /* A4 landscape height minus margins */
                        max-width: calc(297mm - 10mm) !important;
                        max-height: calc(210mm - 10mm) !important;
                    }
                    
                    /* Hide any tooltips */
                    .wordcloud-tooltip {
                        display: none !important;
                    }
                    
                    /* Force single page */
                    body::after {
                        content: "";
                        display: none;
                    }
                }
                
                /* Screen display styles */
                body { 
                    display: flex;
                    justify-content: center;
                    align-items: center;
                    font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
                    background: white;
                    padding: 20px;
                }
                
                svg {
                    max-width: 100%;
                    max-height: 90vh;
                }
                
                /* Ensure text is selectable and searchable */
                text {
                    -webkit-user-select: text;
                    -moz-user-select: text;
                    -ms-user-select: text;
                    user-select: text;
                }
            </style>
        `;
        
        // Get the SVG string with proper namespaces
        clonedSvg.setAttribute('xmlns', 'http://www.w3.org/2000/svg');
        clonedSvg.setAttribute('xmlns:xlink', 'http://www.w3.org/1999/xlink');
        const svgString = new XMLSerializer().serializeToString(clonedSvg);
        
        const content = `<!DOCTYPE html>
<html>
<head>
<meta charset="UTF-8">
<title>Word Cloud</title>
${styles}
</head>
<body>${svgString}</body>
</html>`;
        
        // Write content to iframe
        printWindow.document.write(content);
        printWindow.document.close();
        
        // Trigger print dialog
        setTimeout(function() {
            printWindow.focus();
            printWindow.print();
            
            // Clean up iframe after print dialog closes
            setTimeout(function() {
                document.body.removeChild(iframe);
            }, 1000);
        }, 250);
    };
    
    // Export Pairwise Table as PDF
    window.exportPairwiseTable = function() {
        const table = document.querySelector('#pairwise-table-container table');
        if (!table) {
            alert('Pairwise comparison table not found');
            return;
        }
        
        // Create a hidden iframe for printing
        const iframe = document.createElement('iframe');
        iframe.style.position = 'absolute';
        iframe.style.top = '-10000px';
        iframe.style.left = '-10000px';
        iframe.style.width = '0';
        iframe.style.height = '0';
        document.body.appendChild(iframe);
        
        const printWindow = iframe.contentWindow;
        
        // Build HTML content with table
        const tableHTML = table.outerHTML;
        const styles = `
            <style>
                @media print {
                    @page {
                        size: landscape;
                        margin: 0;
                    }
                    body { 
                        font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
                        font-size: 10pt;
                        margin: 15mm;
                    }
                    table { 
                        width: 100%; 
                        border-collapse: collapse; 
                        page-break-inside: auto;
                    }
                    th, td { 
                        border: 1px solid #ddd; 
                        padding: 4px 8px;
                        font-size: 9pt;
                    }
                    th { 
                        background-color: #f8f9fa !important;
                        font-weight: bold;
                        -webkit-print-color-adjust: exact;
                        print-color-adjust: exact;
                    }
                    td {
                        -webkit-print-color-adjust: exact;
                        print-color-adjust: exact;
                    }
                    .text-center { text-align: center; }
                    .fw-bold { font-weight: bold; }
                }
                body { 
                    font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
                }
                table { 
                    width: 100%; 
                    border-collapse: collapse; 
                }
                th, td { 
                    border: 1px solid #ddd; 
                    padding: 4px 8px;
                }
                th { 
                    background-color: #f8f9fa;
                    font-weight: bold;
                }
                .text-center { text-align: center; }
                .fw-bold { font-weight: bold; }
            </style>
        `;
        
        const content = `
            <!DOCTYPE html>
            <html>
            <head>
                <meta charset="UTF-8">
                <title>Pairwise Model Comparisons</title>
                ${styles}
            </head>
            <body>
                ${tableHTML}
            </body>
            </html>
        `;
        
        // Write content to new window
        printWindow.document.write(content);
        printWindow.document.close();
        
        // Wait for content to load, then trigger print dialog
        setTimeout(function() {
            printWindow.focus();
            printWindow.print();
            
            // Clean up iframe after print dialog closes
            setTimeout(function() {
                document.body.removeChild(iframe);
            }, 1000);
        }, 250);
    };
    
});
</script>
{% endblock %}
