<!DOCTYPE html>
<!-- lang lets screen readers and translation tools pick the right language. -->
<html lang="en">
<head>
  <meta charset="utf-8">
  <meta name="description"
        content="Generating Rich, Localized, and Flexible Captions in Images.">
  <meta name="keywords" content="Flexible, Captions, VQA, Visual Recognition, Visual Dialog">
  <meta name="viewport" content="width=device-width, initial-scale=1">
  <title>FlexCap: Generating Rich, Localized, and Flexible Captions in Images</title>
  <link href="https://fonts.googleapis.com/css?family=Google+Sans|Noto+Sans|Castoro"
        rel="stylesheet">

  <!-- Site styles shared with the parent project page. -->
  <link rel="stylesheet" href="../static/css/bulma.min.css">
  <link rel="stylesheet" href="../static/css/bulma-carousel.min.css">
  <link rel="stylesheet" href="../static/css/bulma-slider.min.css">
  <link rel="stylesheet" href="../static/css/fontawesome.all.min.css">
  <link rel="stylesheet"
        href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css">
  <link rel="stylesheet" href="../static/css/index.css">
  <link rel="icon" href="../static/images/favicon.svg">

  <script src="https://ajax.googleapis.com/ajax/libs/jquery/3.5.1/jquery.min.js"></script>
  <script defer src="../static/js/fontawesome.all.min.js"></script>
  <script src="../static/js/bulma-carousel.min.js"></script>
  <script src="../static/js/bulma-slider.min.js"></script>
  <script src="../static/js/index.js"></script>
  <style>
    /* Centre the demo canvas that the inline script appends to the body. */
    canvas {
      display: block;
      margin: 0 auto;
    }
  </style>
  <script>
  // Demo data consumed by displayBoundingBoxes() in the script at the end of <body>.

  // URL of the image to annotate (relative, so it is resolved against this page).
  var imageUrl = '20.jpg';
// Bounding boxes, one per row, as [x1, y1, x2, y2]: the renderer draws each one
// at (x1, y1) with width x2 - x1 and height y2 - y1, measured from the image's
// top-left corner.
// Order matters: the "Show Top N boxes" buttons display the first N rows.
// NOTE(review): presumably the rows are sorted by model score - confirm.
var  boxes = [[ 22, 218, 162, 308],
       [152, 109, 160, 179],
       [ 84, 111,  91, 181],
       [355, 171, 428, 223],
       [102, 110, 109, 180],
       [287, 154, 351, 198],
       [197,  58, 210, 169],
       [  7,   3, 498, 337],
       [445,   0, 467, 102],
       [  9,   0, 346, 174],
       [  0, 319, 234, 337],
       [423,  89, 499,  99],
       [  2,  76,   7,  93],
       [  0,  97,  84, 130],
       [157, 113, 165, 178],
       [356,   0, 371,  96],
       [ 50,   2, 205, 104],
       [338,   0, 356,  97],
       [118, 101, 131, 180],
       [286,   0, 499, 102],
       [399,   0, 409,  98],
       [ 84, 103, 216, 181],
       [332, 184, 345, 197],
       [378, 170, 425, 190],
       [118,   1, 136, 174],
       [344, 159, 351, 190],
       [ 80, 276, 108, 305],
       [ 85, 107, 113, 180],
       [216,  86, 497, 143],
       [304,  58, 329,  76],
       [  5,   1, 497,  82],
       [ 28, 262,  36, 269],
       [299,  58, 340,  81],
       [418, 204, 426, 220],
       [194,   0, 214, 167],
       [ 65, 278,  81, 306],
       [424,  89, 452,  94],
       [141, 244, 158, 283],
       [332,   0, 408,  98],
       [357, 196, 379, 222],
       [  1,  91, 217, 132],
       [  6,  76,  14,  93],
       [  1, 147,  71, 185],
       [110, 273, 132, 305],
       [ 45, 180,  59, 186],
       [  0, 144, 248, 186],
       [161, 166, 216, 181],
       [307, 180, 347, 198],
       [ 79, 166, 216, 182],
       [407, 207, 415, 221],
       [  0,  71,  60,  92],
       [ 21, 283,  28, 292],
       [468,  95, 499, 101],
       [393,  81, 420,  93],
       [317, 185, 321, 196],
       [154,   1, 215, 169],
       [ 22, 286,  26, 291],
       [382, 200, 425, 221],
       [198, 122, 207, 169],
       [353, 102, 480, 136],
       [385, 209, 390, 221],
       [160, 140, 214, 153],
       [158, 108, 218, 175],
       [375, 177, 381, 179],
       [  5,  76,  24,  92],
       [364, 215, 372, 222],
       [312,  88, 333,  95],
       [215, 152, 280, 168],
       [309, 322, 316, 326],
       [304, 185, 313, 196],
       [  1,  50,  16,  94]];
// Caption text for each box: captions[i] is displayed for boxes[i], so the two
// arrays must stay the same length and in the same order.
var captions = ['a black sheep in a field', 'a wooden fence post', 'a wooden fence post', 'a sheep eating the grass', 'a wooden fence post', 'a black sheep eating grass', 'a tree trunk', 'the scene is daytime', 'a tree trunk', 'a tree with no leaves', 'a patch of dirt in the field', 'a log in the background', 'a wooden post in the ground', 'a patch of dead grass', 'a wooden fence post', 'a tree trunk', 'a tree with red leaves', 'a tree trunk', 'a wooden fence post', 'trees in the background', 'a tree trunk', 'a fence around the tree', 'leg of a sheep', 'the wool on a sheep', 'a tree trunk', 'the tail of a black sheep', 'the leg of a sheep', 'a wooden fence post', 'a small hill of grass', 'a small bush', 'trees in the background', 'the left eye of the black sheep', 'a small bush', 'leg of a sheep', 'a tree trunk', 'the front leg of a sheep', 'a log in the field', 'tail of a black sheep', 'a tree trunk', 'head of a sheep', 'a patch of dirt', 'a wooden post in the ground', 'a patch of dirt', 'the back left leg of a sheep', 'a rock in the ground', 'a patch of dirt in the field', 'a pile of hay on the ground', 'legs of a sheep', 'a small patch of dirt', 'leg of a sheep', 'a small stone wall', 'the nose of a sheep', 'a log in the background', 'a tree stump in the field', 'the front leg of a sheep', 'a tree with no leaves', 'the nose of a sheep', 'the legs of a sheep', 'a tree trunk', 'a small mound of grass', 'the leg of a sheep', 'a wooden fence post', 'a fence around the tree', 'the tail of a sheep', 'a wooden fence post', 'the nose of a sheep', 'a small rock on the ground', 'a patch of dirt in the grass', 'a white rock in the grass', 'the leg of a sheep', 'a tree stump in the background'];

  </script>
  </head>
  <body>
    <section class="hero">
      <div class="hero-body">
        <div class="container is-max-desktop">
          <div class="columns is-centered">
            <div class="column has-text-centered">
              <!-- Page-level heading; the visual size still comes from the Bulma "is-3" class. -->
              <h1 class="is-centered has-text-centered title is-3">Draw a bounding box to see a caption.</h1>
              <h2 class="is-centered has-text-centered title is-4">Or click one of the options below.</h2>
              <div class="column has-text-centered">
                <div class="publication-links">
                  <!-- Overlay controls. The ids are looked up by the inline script
                       at the end of the page, so keep them stable. -->
                  <span class="link-block">
                    <button class="external-link button is-normal is-rounded is-dark"
                            id="button5" type="button">
                      <span>Clear</span>
                    </button>
                  </span>
                  <span class="link-block">
                    <button class="external-link button is-normal is-rounded is-dark"
                            id="button2" type="button">
                      <span>Show Top 5 boxes</span>
                    </button>
                  </span>
                  <span class="link-block">
                    <button class="external-link button is-normal is-rounded is-dark"
                            id="button3" type="button">
                      <span>Show Top 10 boxes</span>
                    </button>
                  </span>
                  <span class="link-block">
                    <button class="external-link button is-normal is-rounded is-dark"
                            id="button4" type="button">
                      <span>Show Top 50 boxes</span>
                    </button>
                  </span>
                  <span class="link-block">
                    <button class="external-link button is-normal is-rounded is-dark"
                            id="button1" type="button">
                      <span>Show all boxes</span>
                    </button>
                  </span>
                </div>
              </div>
            </div>
          </div>
        </div>
      </div>
    </section>

    <script>
      /**
       * Load an image onto a newly created canvas, overlay captioned bounding
       * boxes, and let the user drag a rectangle to look up the stored box that
       * overlaps it best (by intersection-over-union, IoU).
       *
       * Once the image has loaded, the canvas is appended to document.body, the
       * first five boxes are shown, and the buttons with ids button1..button5 are
       * wired to show all / top 5 / top 10 / top 50 boxes and to clear the overlay.
       *
       * @param {string} imageUrl - URL of the image to display.
       * @param {number[][]} boxes - Boxes as [x1, y1, x2, y2] in image pixels.
       * @param {string[]} captions - captions[i] is the text shown for boxes[i].
       */
      function displayBoundingBoxes(imageUrl, boxes, captions) {
        var image = new Image();

        image.onload = function() {
          // Blank margin (canvas pixels) to the left and right of the image;
          // presumably there so long captions are not clipped at the image edge.
          var paddingX = 400;
          // Extra rows below the image for captions of boxes touching the bottom.
          var paddingY = 30;
          var captionFont = '20px Arial';
          // A box is only accepted when its IoU is strictly above this value.
          var minIoU = 0.1;

          var canvas = document.createElement('canvas');
          canvas.width = image.width + paddingX * 2;
          canvas.height = image.height + paddingY;
          var context = canvas.getContext('2d');

          // Corners of the rectangle the user is dragging, in canvas pixels.
          var startX, startY, endX, endY;
          var isDrawing = false;
          // Ids of typewriter timers that have not finished yet.
          var activeTimers = [];

          // Cancel captions that are still being typed so they cannot paint
          // onto a canvas that has just been cleared.
          function stopTypewriters() {
            activeTimers.forEach(function(id) { clearInterval(id); });
            activeTimers = [];
          }

          // Wipe every overlay and repaint the bare image.
          function resetCanvas() {
            stopTypewriters();
            context.clearRect(0, 0, canvas.width, canvas.height);
            context.drawImage(image, paddingX, 0);
          }

          // Random "#rrggbb" colour. The hex value is zero-padded: an unpadded
          // value such as "#a7" is not a valid colour and canvas would silently
          // keep the previous strokeStyle.
          function randomColor() {
            var rgb = Math.floor(Math.random() * 0x1000000);
            return '#' + ('000000' + rgb.toString(16)).slice(-6);
          }

          // Convert a mouse event to canvas pixel coordinates. Using the
          // bounding rect keeps this correct when the page is scrolled or the
          // canvas is scaled by CSS.
          function pointerPosition(e) {
            var rect = canvas.getBoundingClientRect();
            var scaleX = rect.width ? canvas.width / rect.width : 1;
            var scaleY = rect.height ? canvas.height / rect.height : 1;
            return {
              x: (e.clientX - rect.left) * scaleX,
              y: (e.clientY - rect.top) * scaleY
            };
          }

          // Type `text` one character every 10 ms just below `currentBox`
          // ([x1, y1, x2, y2] in image pixels), white on a translucent black strip.
          function typewriter(currentBox, text) {
            if (!text) {
              return; // nothing to type; also avoids a timer that never ends
            }
            var i = 0;
            var x = currentBox[0] + paddingX;
            var y = currentBox[3] + 20;

            var intervalId = setInterval(function() {
              // The font must be set before measuring, otherwise the width is
              // computed with whatever font the context had before.
              context.font = captionFont;
              var charWidth = context.measureText(text[i]).width;

              // Semi-transparent backdrop behind the character.
              context.globalAlpha = 0.75;
              context.fillStyle = 'black';
              context.fillRect(x, currentBox[3] + 6, charWidth, 20);
              context.globalAlpha = 1.0;

              context.fillStyle = 'white';
              context.fillText(text[i], x, y);
              x += charWidth; // advance by the width of the character just drawn
              i++;
              if (i >= text.length) {
                clearInterval(intervalId);
                var index = activeTimers.indexOf(intervalId);
                if (index !== -1) {
                  activeTimers.splice(index, 1);
                }
              }
            }, 10);
            activeTimers.push(intervalId);
          }

          // Outline `bestBox` and type its caption when the match is good
          // enough; otherwise type "No Match" under the user's rectangle.
          function drawbox(bestBox, caption, bestIoU, clearOthers, color="green") {
            if (bestBox && bestIoU > minIoU) {
              if (clearOthers) {
                resetCanvas();
              }
              context.beginPath();
              context.lineWidth = 4;
              context.strokeStyle = color;
              context.rect(bestBox[0] + paddingX, bestBox[1], bestBox[2] - bestBox[0], bestBox[3] - bestBox[1]);
              context.stroke();
              console.log("bestBox:", bestBox, "bestIoU", bestIoU, "text", caption);
              typewriter(bestBox, caption);
            } else {
              // typewriter() adds paddingX back, so subtract it here to land on
              // the user's rectangle, which is already in canvas coordinates.
              typewriter([startX - paddingX, startY, endX, endY], "No Match");
            }
          }

          // Show the first `count` boxes, each in a random colour. The count is
          // clamped so a request for more boxes than exist is harmless.
          function showBoxes(count) {
            resetCanvas();
            var total = Math.min(count, boxes.length, captions.length);
            for (var i = 0; i < total; i++) {
              drawbox(boxes[i], captions[i], 1.0, false, randomColor());
            }
          }

          canvas.addEventListener('mousedown', function(e) {
            var point = pointerPosition(e);
            // Start with an empty rectangle so a click without a drag never
            // leaves the end corner undefined.
            startX = endX = point.x;
            startY = endY = point.y;
            isDrawing = true;
          });

          canvas.addEventListener('mousemove', function(e) {
            if (!isDrawing) {
              return;
            }
            var point = pointerPosition(e);

            // Repaint the image and the rubber-band rectangle.
            resetCanvas();
            context.beginPath();
            context.lineWidth = 4;
            context.strokeStyle = "red";
            context.rect(startX, startY, point.x - startX, point.y - startY);
            context.stroke();

            endX = point.x;
            endY = point.y;
          });

          // Listen on window so releasing the button outside the canvas still
          // ends the drag instead of leaving isDrawing stuck.
          window.addEventListener('mouseup', function() {
            if (!isDrawing) {
              return; // the press did not start on the canvas
            }
            isDrawing = false;

            // Normalise so (startX, startY) is the top-left corner.
            var left = Math.min(startX, endX);
            var top = Math.min(startY, endY);
            var right = Math.max(startX, endX);
            var bottom = Math.max(startY, endY);
            startX = left;
            startY = top;
            endX = right;
            endY = bottom;

            if (right === left || bottom === top) {
              return; // plain click: no area selected, nothing to match
            }

            console.log("Start X:", startX, "Start Y:", startY, "End X:", endX, "End Y:", endY);

            var bestBox = null;
            var bestIoU = 0.0;
            var caption = 'No Match';
            var drawnBoxArea = (endX - startX) * (endY - startY);
            for (var i = 0; i < boxes.length; i++) {
              var box = boxes[i];
              // Stored boxes are in image pixels; shift x by paddingX to compare
              // them with the drawn rectangle in canvas pixels.
              var intersectionX1 = Math.max(box[0] + paddingX, startX);
              var intersectionY1 = Math.max(box[1], startY);
              var intersectionX2 = Math.min(box[2] + paddingX, endX);
              var intersectionY2 = Math.min(box[3], endY);
              var intersectionWidth = Math.max(0, intersectionX2 - intersectionX1);
              var intersectionHeight = Math.max(0, intersectionY2 - intersectionY1);
              var intersectionArea = intersectionWidth * intersectionHeight;
              var boxArea = (box[2] - box[0]) * (box[3] - box[1]);
              var unionArea = boxArea + drawnBoxArea - intersectionArea;
              var iou = intersectionArea / (unionArea + 1e-6); // epsilon avoids 0/0
              if (iou > bestIoU) {
                bestBox = box;
                bestIoU = iou;
                caption = captions[i];
              }
            }
            drawbox(bestBox, caption, bestIoU, true);
          });

          document.body.appendChild(canvas);

          // Button id -> action. A missing button is skipped so it cannot stop
          // the remaining buttons from being wired.
          var buttonActions = {
            button1: function() { showBoxes(boxes.length); },
            button2: function() { showBoxes(5); },
            button3: function() { showBoxes(10); },
            button4: function() { showBoxes(50); },
            button5: function() { resetCanvas(); }
          };
          Object.keys(buttonActions).forEach(function(id) {
            var element = document.getElementById(id);
            if (element) {
              element.addEventListener("click", buttonActions[id]);
            }
          });

          // Initial view: the image with the first five boxes.
          showBoxes(5);
        };

        image.onerror = function() {
          console.error("Could not load image:", imageUrl);
        };

        // Assign src last so both handlers are attached before loading starts.
        image.src = imageUrl;
      }
      // Start the demo using the image URL, boxes and captions declared by the
      // earlier inline script in the document head.
      displayBoundingBoxes(imageUrl, boxes, captions);
  </script>
</body>
</html>

