<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>FuseAgent - Visual Results</title>
    <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.0/css/all.min.css">
    <style>
        :root {
            --primary-color: #2c3e50;
            --secondary-color: #3498db;
            --accent-color: #e74c3c;
            --text-color: #333;
            --light-bg: #f8f9fa;
            --dark-bg: #1e272e;
        }
        
        * {
            margin: 0;
            padding: 0;
            box-sizing: border-box;
            font-family: 'Segoe UI', Tahoma, Geneva, Verdana, sans-serif;
        }
        
        body {
            background: linear-gradient(135deg, #f5f7fa 0%, #c3cfe2 100%);
            color: var(--text-color);
            line-height: 1.6;
            overflow-x: hidden;
            min-height: 100vh;
        }
        
        /* Header styling */
        header {
            background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
            color: white;
            padding: 3rem 0;
            text-align: center;
            position: relative;
            overflow: hidden;
        }
        
        .header-container {
            position: relative;
            z-index: 2;
            max-width: 1200px;
            margin: 0 auto;
            padding: 0 2rem;
        }
        
        h1 {
            font-size: 2.2rem;
            margin-bottom: 0;
            line-height: 1.3;
            font-weight: 300;
            font-style: italic;
            display: flex;
            align-items: center;
            justify-content: center;
            gap: 1rem;
        }
        
        .title-icon {
            width: 3rem;
            height: 3rem;
            border-radius: 12px;
            object-fit: contain;
            background-color: rgba(255, 255, 255, 0.2);
            padding: 0.5rem;
            box-shadow: 0 4px 15px rgba(0, 0, 0, 0.1);
        }
        
        .subtitle {
            display: none;
        }
        
        /* Main content */
        main {
            max-width: 1400px;
            margin: 0 auto;
            padding: 3rem 2rem;
            width: 100%;
        }
        
        section {
            margin-bottom: 4rem;
        }
        
        h2 {
            font-size: 2.2rem;
            color: var(--primary-color);
            margin-bottom: 1.5rem;
            position: relative;
            display: inline-block;
        }
        
        h2::after {
            content: '';
            position: absolute;
            bottom: -5px;
            left: 0;
            width: 100%;
            height: 3px;
            background: linear-gradient(120deg, var(--secondary-color), var(--accent-color));
        }
        
        p {
            font-size: 1.1rem;
            margin-bottom: 1.5rem;
            text-align: justify;
        }
        
        /* Fusion Results Carousel - similar to 1.html */
        .fusion-carousel-container {
            position: relative;
            margin-top: 3rem;
            padding-bottom: 0rem;
            overflow: hidden;
            width: 100%;
        }
        
        /* Add gradient masks for carousel */
        .carousel-mask-left,
        .carousel-mask-right {
            position: absolute;
            top: 0;
            height: 100%;
            width: 100px;
            z-index: 10;
            pointer-events: none;
            border-radius: 8px;
        }
        
        .carousel-mask-left {
            left: 0;
            background: linear-gradient(to right, rgba(245,247,250,1) 0%, rgba(245,247,250,0) 100%);
        }
        
        .carousel-mask-right {
            right: 0;
            background: linear-gradient(to left, rgba(245,247,250,1) 0%, rgba(245,247,250,0) 100%);
        }
        
        /* Animation for carousel auto-scroll */
        @keyframes slideCarousel {
            0% { transform: translateX(0); }
            100% { transform: translateX(calc(-100% / 2)); }
        }
        
        .fusion-carousel {
            display: flex;
            overflow-x: hidden;
            scroll-behavior: smooth;
            scroll-snap-type: x mandatory;
            padding: 1rem 0;
            -ms-overflow-style: none;
            scrollbar-width: none;
            width: 200%;
            animation: slideCarousel 40s linear infinite;
            gap: 1rem;
        }
        
        .fusion-carousel:hover {
            animation-play-state: paused;
        }
        
        .fusion-item {
            flex: 0 0 800px;
            min-width: 700px;
            max-width: 900px;
            scroll-snap-align: start;
            border-radius: 12px;
            overflow: hidden;
            box-shadow: 0 6px 20px rgba(0, 0, 0, 0.1);
            background-color: white;
            transition: transform 0.3s ease, box-shadow 0.3s ease;
            position: relative;
            margin-right: 1rem;
        }
        
        .fusion-item:hover {
            transform: translateY(-5px);
            box-shadow: 0 10px 30px rgba(0, 0, 0, 0.15);
        }
        
        /* Three-column layout for inputs and result */
        .fusion-display {
            display: grid;
            grid-template-columns: 1fr 1fr 1fr;
            gap: 1rem;
            padding: 1.5rem;
            height: 350px;
        }
        
        .input-column, .result-column {
            display: flex;
            flex-direction: column;
            align-items: center;
        }
        
        .column-label {
            font-weight: 600;
            color: var(--primary-color);
            margin-bottom: 0.8rem;
            font-size: 1rem;
            text-transform: uppercase;
            letter-spacing: 0.5px;
            background-color: rgba(255, 255, 255, 0.9);
            padding: 0.3rem 0.8rem;
            border-radius: 4px;
            box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);
        }
        
        .image-container {
            width: 100%;
            height: 280px;
            border-radius: 8px;
            overflow: hidden;
            box-shadow: 0 4px 12px rgba(0, 0, 0, 0.15);
            position: relative;
            background-color: #f8f9fa;
        }
        
        .fusion-image {
            width: 100%;
            height: 100%;
            object-fit: contain;
            transition: transform 0.3s ease;
        }
        
        .fusion-image:hover {
            transform: scale(1.02);
        }
        
        .result-column .image-container {
            border: 3px solid var(--secondary-color);
        }
        
        .result-column .column-label {
            background-color: var(--secondary-color);
            color: white;
        }
        
        /* Item info */
        .fusion-info {
            padding: 1rem 1.5rem;
            text-align: center;
            background-color: #f8f9fa;
        }
        
        .fusion-title {
            font-size: 1.1rem;
            font-weight: 600;
            color: var(--primary-color);
            margin-bottom: 0.3rem;
        }
        
        .fusion-description {
            color: #666;
            font-size: 0.9rem;
        }
        
        /* Conversation display */
        .conversation-display {
            background-color: white;
            border-radius: 12px;
            padding: 2rem;
            margin-top: 3rem;
            box-shadow: 0 4px 12px rgba(0, 0, 0, 0.05);
        }
        
        .conversation-container {
            max-width: 1000px;
            margin: 0 auto;
        }
        
        .user-message {
            display: flex;
            justify-content: flex-end;
            align-items: flex-start;
            margin-bottom: 1.5rem;
            gap: 12px;
        }
        
        .user-content {
            background: linear-gradient(135deg, #d299c2 0%, #a8d5e2 100%);
            border-radius: 16px;
            padding: 2rem;
            box-shadow: 0 8px 32px rgba(0, 0, 0, 0.1);
            max-width: 85%;
            backdrop-filter: blur(10px);
            border: 1px solid rgba(255, 255, 255, 0.3);
            color: #2c3e50;
            font-weight: 500;
        }
        
        .user-avatar {
            flex: 0 0 50px;
        }
        
        .user-avatar img {
            width: 50px;
            height: 50px;
            border-radius: 8px;
            object-fit: cover;
        }
        
        .model-message {
            display: flex;
            justify-content: flex-start;
            align-items: flex-start;
            gap: 15px;
        }
        
        .model-avatar {
            flex: 0 0 50px;
        }
        
        .model-avatar img {
            width: 50px;
            height: 50px;
            border-radius: 50%;
            object-fit: contain;
            background-color: #fff;
            padding: 5px;
            box-shadow: 0 2px 8px rgba(0, 0, 0, 0.1);
        }
        
        .model-content {
            background: linear-gradient(135deg, #f5f7fa 0%, #c3cfe2 100%);
            border-radius: 16px;
            padding: 2rem;
            box-shadow: 0 8px 32px rgba(0, 0, 0, 0.1);
            max-width: 87%;
            backdrop-filter: blur(10px);
            border: 1px solid rgba(255, 255, 255, 0.2);
        }
        
        .model-name {
            color: #3498db;
            font-weight: 500;
        }
        
        .highlight-issue {
            color: #e74c3c;
            font-weight: 500;
        }
        
        /* Apple-style step indicators */
        .step-indicator {
            display: inline-flex;
            align-items: center;
            background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
            color: white;
            padding: 0.4rem 1rem;
            border-radius: 20px;
            font-size: 0.9rem;
            font-weight: 600;
            margin-right: 0.8rem;
            margin-bottom: 0.5rem;
            box-shadow: 0 4px 15px rgba(102, 126, 234, 0.3);
            transition: transform 0.2s ease, box-shadow 0.2s ease;
        }
        
        .step-indicator:hover {
            transform: translateY(-2px);
            box-shadow: 0 6px 20px rgba(102, 126, 234, 0.4);
        }
        
        .step-indicator::before {
            content: "🧠";
            margin-right: 0.5rem;
        }
        
        /* Combined task and model button */
        .action-badge {
            display: inline-flex;
            align-items: center;
            background: linear-gradient(135deg, #a8d5e2 0%, #b8dfd0 100%);
            color: #2c3e50;
            padding: 0.6rem 1.4rem;
            border-radius: 25px;
            font-size: 0.9rem;
            font-weight: 500;
            margin: 0.8rem 0 0 0;
            box-shadow: 0 3px 12px rgba(168, 213, 226, 0.3);
            transition: all 0.3s ease;
            border: none;
            cursor: pointer;
            gap: 0.5rem;
            float: right;
        }
        
        .action-badge:hover {
            transform: translateY(-2px) scale(1.02);
            box-shadow: 0 5px 20px rgba(168, 213, 226, 0.4);
            background: linear-gradient(135deg, #9bc9d4 0%, #a8d5ba 100%);
        }
        
        .action-badge::before {
            content: "⚡";
            font-size: 1rem;
        }
        
        /* Task name in the button */
        .task-name {
            font-weight: 600;
            text-transform: uppercase;
            letter-spacing: 0.5px;
        }
        
        /* Model name in the button */
        .model-name {
            font-style: italic;
            font-weight: 400;
            opacity: 0.8;
            font-family: 'SF Mono', Monaco, 'Cascadia Code', monospace;
            background: rgba(255, 255, 255, 0.5);
            padding: 0.2rem 0.5rem;
            border-radius: 8px;
            font-size: 0.8rem;
        }
        
        /* Analysis text styling */
        .analysis-text {
            background: rgba(255, 255, 255, 0.8);
            border-radius: 12px;
            padding: 1.2rem 1.2rem 0.5rem 1.2rem;
            margin: 1rem 0;
            border-left: 4px solid #667eea;
            box-shadow: 0 2px 10px rgba(0, 0, 0, 0.05);
            line-height: 1.6;
            backdrop-filter: blur(5px);
            position: relative;
            overflow: hidden;
        }
        
        .analysis-text::after {
            content: "";
            display: table;
            clear: both;
        }
        
        /* Response container styling */
        .response-content {
            font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, Oxygen, Ubuntu, Cantarell, sans-serif;
            line-height: 1.7;
        }
        
        .response-content p {
            margin: 0;
        }
        
        /* Hidden data */
        .hidden-conversation-data {
            display: none;
        }
        
        /* Responsive */
        @media (max-width: 1024px) {
            .fusion-display {
                grid-template-columns: 1fr;
                gap: 1.5rem;
                height: auto;
            }
            
            .fusion-grid {
                grid-template-columns: 1fr;
            }
        }
        
        @media (max-width: 768px) {
            h1 {
                font-size: 2.2rem;
            }
            
            h2 {
                font-size: 1.8rem;
            }
            
            .fusion-grid {
                grid-template-columns: 1fr;
                gap: 1.5rem;
            }
            
            main {
                padding: 2rem 1rem;
            }
        }
        
        /* Loading placeholder */
        .image-placeholder {
            background: linear-gradient(45deg, #f0f0f0, #e0e0e0);
            display: flex;
            align-items: center;
            justify-content: center;
            color: #999;
            font-style: italic;
        }
    </style>
</head>
<body>
    <header>
        <div class="header-container">
            <h1>
                <img src="imgs/icon.png" alt="FuseAgent" class="title-icon">
                FuseAgent: A VLM-driven Agent for Unified In-the-Wild Image Fusion
            </h1>
        </div>
    </header>
    
    <main>
        <section id="results">
            <h2>Fusion Results</h2>
            <p>Our FuseAgent combines multiple input images to generate enhanced results. Each example shows two input images and their corresponding fusion output.</p>
            
            <!-- Fusion Results Carousel -->
            <div class="fusion-carousel-container">
                <div class="carousel-mask-left"></div>
                <div class="carousel-mask-right"></div>
                <div class="fusion-carousel" id="fusionCarousel">
                    <!-- Fusion items will be dynamically generated here -->
                </div>
            </div>
            
            <!-- Conversation display -->
            <div class="conversation-display">
                <div class="conversation-container">
                    <div class="user-message">
                        <div class="user-content">
                            <p id="userInstruction">Please analyze the two input images and provide a fusion strategy.</p>
                        </div>
                        <div class="user-avatar">
                            <img src="imgs/user-avatar.png" alt="User">
                        </div>
                    </div>
                    
                    <div class="model-message">
                        <div class="model-avatar">
                            <img src="imgs/icon.png" alt="FuseAgent">
                        </div>
                        <div class="model-content">
                            <div id="modelResponse"><strong>Analysis:</strong> Loading fusion analysis...</div>
                        </div>
                    </div>
                </div>
            </div>
        </section>
    </main>
    
    <script>
        document.addEventListener('DOMContentLoaded', function() {
            const fusionCarousel = document.getElementById('fusionCarousel');
            const userInstruction = document.getElementById('userInstruction');
            const modelResponse = document.getElementById('modelResponse');
            
            // Function to check if image exists
            function imageExists(url) {
                return new Promise((resolve) => {
                    const img = new Image();
                    img.onload = () => resolve(true);
                    img.onerror = () => resolve(false);
                    img.src = url;
                });
            }
            
            // Function to get image with fallback extensions
            async function getImageUrl(basePath, extensions = ['png', 'jpg', 'jpeg']) {
                for (let ext of extensions) {
                    const url = `${basePath}.${ext}`;
                    if (await imageExists(url)) {
                        return url;
                    }
                }
                return null;
            }
            
            // Hardcoded response data instead of loading from txt files
            const responseData = {
                '1': `**Step 1 Analysis:** The user has provided a challenging visible-infrared fusion task set in a rainy night scene. My first observation is that the visible light image is significantly degraded by raindrops on the lens and atmospheric rain, which obscures important details. Before any alignment or fusion can occur, I must first restore this image to improve its quality.

**Action:** derain using **IDT** model

**Step 2 Analysis:** Next, I've identified a severe misalignment between the restored visible image and the infrared image. The perspectives are quite different. Due to the significant difference in modality (visible vs. thermal), traditional feature detectors might fail. I need a robust, detector-free registration model that excels at finding correspondences in such challenging cross-modal scenarios.

**Action:** registration using **loftr** model

**Step 3 Analysis:** With the images now cleaned and perfectly aligned, I can proceed to the final step. The goal is to merge the thermal signatures from the infrared image, which clearly highlight the people and the cyclist, with the rich contextual and textural details from the derained visible image, such as the building facade and the wet ground reflections. A versatile and powerful general-purpose fusion model is required to handle these distinct modalities effectively.

**Action:** fusion using **SwinFusion** model`,
                '2': `**Step 1 Analysis:** The user wants to perform multi-exposure fusion on a dynamic scene. I've been given two images, one over-exposed and one under-exposed. I can clearly see motion blur and misalignment between the two frames, indicating camera or object movement during capture. My first priority is to understand and quantify this motion to prevent ghosting artifacts in the final result. I will use an optical flow estimation model to compute a dense motion field between the two images.

**Action:** optical flow using **GMA** model

**Step 2 Analysis:** Upon closer inspection, the under-exposed image suffers from significant motion blur, which degrades the very details I need to extract from it (the scene inside the window). To ensure the final fused image is sharp, I must first apply a deblurring algorithm to this source image to restore its clarity before proceeding with fusion.

**Action:** deblur using **Real-ESRGAN** model

**Step 3 Analysis:** Now that I have estimated the motion field for deghosting and restored the sharpness of the blurry input, I am ready to fuse the images. I will use a specialized multi-exposure fusion model. This model will use the corrected source images and the optical flow information to intelligently blend the well-lit foreground from the over-exposed shot with the clear interior details from the deblurred, under-exposed shot, creating a single, sharp, and artifact-free high-dynamic-range image.

**Action:** fusion using **MEFLUT** model`,
                '3': `**Step 1 Analysis:** Multi-modal fusion combining RGB and thermal imagery for enhanced scene understanding. The visible spectrum image provides rich texture and color information while the thermal image reveals heat signatures invisible to standard cameras.

**Action:** preprocessing using **Normalization** model

**Step 2 Analysis:** Alignment is crucial for accurate fusion as the two modalities may have different viewpoints or sensor positions. Cross-modal registration ensures pixel-level correspondence between the RGB and thermal domains.

**Action:** registration using **Feature-based** model

**Step 3 Analysis:** The final fusion step combines the complementary information from both modalities, preserving important thermal signatures while maintaining the visual quality and detail from the RGB image.

**Action:** fusion using **DenseFuse** model`,
                '4': `**Step 1 Analysis:** Focus stacking scenario where multiple images with different focal planes need to be combined to create an all-in-focus result. Each input image contains sharp regions at different depths.

**Action:** focus detection using **Gradient** model

**Step 2 Analysis:** Edge-preserving fusion to combine the sharp regions from each input while avoiding artifacts at transition boundaries between focused and unfocused areas.

**Action:** fusion using **Multi-focus** model`,
                '5': `**Step 1 Analysis:** Medical image fusion combining structural information from one modality with functional information from another. Precise alignment and information preservation are critical for diagnostic accuracy.

**Action:** preprocessing using **Intensity normalization** model

**Step 2 Analysis:** Anatomical structure alignment to ensure accurate correspondence between different imaging modalities before fusion.

**Action:** registration using **Mutual information** model

**Step 3 Analysis:** Final fusion preserves diagnostic information from both modalities while enhancing overall image quality for clinical interpretation.

**Action:** fusion using **Medical fusion** model`
            };
            
            function loadResponse(imageName) {
                return responseData[imageName] || "Analysis: FuseAgent successfully combines the input images to create an enhanced result with improved detail and clarity.";
            }
            
            // Apple-style response formatting function
            function formatAppleStyleResponse(response) {
                // First collect all analysis and action pairs
                const steps = [];
                const parts = response.split(/(?=\*\*Step \d+ Analysis:\*\*)/);
                
                parts.forEach(part => {
                    if (part.trim()) {
                        const stepMatch = part.match(/\*\*Step (\d+) Analysis:\*\*(.*?)(?:\*\*Action:\*\* (.*?) using \*\*(.*?)\*\* model|$)/s);
                        if (stepMatch) {
                            const [, stepNum, analysis, action, model] = stepMatch;
                            steps.push({
                                stepNum,
                                analysis: analysis.trim(),
                                action: action ? action.trim() : null,
                                model: model ? model.trim() : null
                            });
                        }
                    }
                });
                
                return steps.map(step => {
                    const actionButton = step.action && step.model ? `
                        <span class="action-badge">
                            <span class="task-name">${step.action}</span>
                            <span class="model-name">${step.model}</span>
                        </span>
                    ` : '';
                    
                    return `
                        <div style="margin-bottom: 1.5rem;">
                            <span class="step-indicator">Step ${step.stepNum}</span>
                            <div class="analysis-text">
                                ${step.analysis}
                                ${actionButton}
                            </div>
                        </div>
                    `;
                }).join('');
            }
            
            // Function to create fusion item
            async function createFusionItem(imageName, index) {
                const input1Url = await getImageUrl(`imgs/input1/${imageName}`);
                const input2Url = await getImageUrl(`imgs/input2/${imageName}`);
                const resultUrl = await getImageUrl(`imgs/after/${imageName}`);
                const responseText = loadResponse(imageName);
                
                if (!input1Url || !input2Url || !resultUrl) {
                    return null;
                }
                
                const fusionItem = document.createElement('div');
                fusionItem.className = 'fusion-item';
                fusionItem.innerHTML = `
                    <div class="fusion-display">
                        <div class="input-column">
                            <div class="column-label">Input 1</div>
                            <div class="image-container">
                                <img src="${input1Url}" alt="Input 1" class="fusion-image">
                            </div>
                        </div>
                        <div class="input-column">
                            <div class="column-label">Input 2</div>
                            <div class="image-container">
                                <img src="${input2Url}" alt="Input 2" class="fusion-image">
                            </div>
                        </div>
                        <div class="result-column">
                            <div class="column-label">Fusion Result</div>
                            <div class="image-container">
                                <img src="${resultUrl}" alt="Fusion Result" class="fusion-image">
                            </div>
                        </div>
                    </div>
                    <div class="fusion-info">
                        <div class="fusion-title">Fusion Example ${index + 1}</div>
                        <div class="fusion-description">Multi-modal image fusion result</div>
                    </div>
                    <div class="hidden-conversation-data">
                        <div class="instruction">Please analyze the two input images and provide a fusion strategy for optimal results.</div>
                        <div class="response">${responseText}</div>
                    </div>
                `;
                
                // Note: hover event added in loadFusionResults function
                
                return fusionItem;
            }
            
            // Function to update conversation display
            function updateConversation(item) {
                const data = item.querySelector('.hidden-conversation-data');
                if (!data) return;
                
                const instruction = data.querySelector('.instruction').textContent;
                const response = data.querySelector('.response').textContent;
                
                userInstruction.textContent = instruction;
                // Convert the response to Apple-style formatting
                const formattedResponse = formatAppleStyleResponse(response);
                modelResponse.innerHTML = `<div class="response-content">${formattedResponse}</div>`;
            }
            
            // Function to discover and load images
            async function loadFusionResults() {
                // Image names based on actual files found
                const commonNames = [
                    '1', '2', '3', '4', '5'
                ];
                
                let itemIndex = 0;
                
                const fusionItems = [];
                
                for (let name of commonNames) {
                    const fusionItem = await createFusionItem(name, itemIndex);
                    if (fusionItem) {
                        fusionItems.push(fusionItem);
                        fusionCarousel.appendChild(fusionItem);
                        itemIndex++;
                    }
                }
                
                // Duplicate all carousel items for infinite loop (like 1.html)
                fusionItems.forEach(item => {
                    const clone = item.cloneNode(true);
                    fusionCarousel.appendChild(clone);
                });
                
                // Add hover event to update conversation for all items (including clones)
                const allItems = fusionCarousel.querySelectorAll('.fusion-item');
                allItems.forEach(item => {
                    item.addEventListener('mouseenter', function() {
                        updateConversation(this);
                    });
                });
                
                // Initialize with first item if available
                if (fusionItems.length > 0) {
                    updateConversation(fusionItems[0]);
                }
                
                // If no images found, show placeholder
                if (itemIndex === 0) {
                    fusionCarousel.innerHTML = `
                        <div class="fusion-item">
                            <div class="fusion-display">
                                <div class="input-column">
                                    <div class="column-label">Input 1</div>
                                    <div class="image-container image-placeholder">
                                        No images found in imgs/input1/
                                    </div>
                                </div>
                                <div class="input-column">
                                    <div class="column-label">Input 2</div>
                                    <div class="image-container image-placeholder">
                                        No images found in imgs/input2/
                                    </div>
                                </div>
                                <div class="result-column">
                                    <div class="column-label">Fusion Result</div>
                                    <div class="image-container image-placeholder">
                                        No images found in imgs/after/
                                    </div>
                                </div>
                            </div>
                            <div class="fusion-info">
                                <div class="fusion-title">No Results Found</div>
                                <div class="fusion-description">Please add images to the imgs/ directory</div>
                            </div>
                        </div>
                    `;
                }
            }
            
            // Load fusion results on page load
            loadFusionResults();
        });
    </script>
</body>
</html>