<!DOCTYPE html>
<!-- lang declares the page language for screen readers and translation tools. -->
<html lang="en">
<head>
  <!-- Basic document metadata. -->
  <meta charset="utf-8">
  <meta name="description"
        content="Feed-Forward Bullet-Time Reconstruction of Dynamic Scenes from Monocular Videos.">
  <meta name="viewport" content="width=device-width, initial-scale=1">
  <title>Feed-Forward Bullet-Time Reconstruction of Dynamic Scenes from Monocular Videos (ID: papers_17189)</title>

  <!-- Global site tag (gtag.js) - Google Analytics -->
  <script async src="https://www.googletagmanager.com/gtag/js?id=G-PYVRSFMDRL"></script>
  <script>
    window.dataLayer = window.dataLayer || [];

    function gtag() {
      dataLayer.push(arguments);
    }

    gtag('js', new Date());

    gtag('config', 'G-PYVRSFMDRL');
  </script>

  <!-- Web fonts. The "|" family separator is percent-encoded (%7C) so the URL is valid. -->
  <link href="https://fonts.googleapis.com/css?family=Google+Sans%7CNoto+Sans%7CCastoro"
        rel="stylesheet">

  <!-- Stylesheets: Bulma and its carousel/slider add-ons, icon fonts, then page-specific rules. -->
  <link rel="stylesheet" href="./static/css/bulma.min.css">
  <link rel="stylesheet" href="./static/css/bulma-carousel.min.css">
  <link rel="stylesheet" href="./static/css/bulma-slider.min.css">
  <link rel="stylesheet" href="./static/css/fontawesome.all.min.css">
  <link rel="stylesheet"
        href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css">
  <link rel="stylesheet" href="./static/css/index.css">
  <link rel="icon" href="./static/images/favicon.svg">

  <!-- Scripts: jQuery from the Google CDN, Font Awesome (deferred), the Bulma add-ons, then the page script. -->
  <script src="https://ajax.googleapis.com/ajax/libs/jquery/3.5.1/jquery.min.js"></script>
  <script defer src="./static/js/fontawesome.all.min.js"></script>
  <script src="./static/js/bulma-carousel.min.js"></script>
  <script src="./static/js/bulma-slider.min.js"></script>
  <script src="./static/js/index.js"></script>
</head>
<body>


<!-- Title banner: paper title, anonymized author line, and submission ID. -->
<section class="hero">
  <div class="hero-body">
    <div class="container is-max-desktop">
      <div class="columns is-centered">
        <div class="column has-text-centered">

          <!-- The only h1 on the page. -->
          <h1 class="title is-1 publication-title">
            Feed-Forward Bullet-Time Reconstruction of Dynamic Scenes from Monocular Videos
          </h1>

          <!-- Author line (anonymized). -->
          <div class="is-size-5 publication-authors">
            <span class="author-block">Anonymous Author(s)</span>
          </div>

          <!-- Submission identifier. -->
          <div class="is-size-5 publication-authors">
            <span class="author-block">Submission ID: papers_17189</span>
          </div>

        </div>
      </div>
    </div>
  </div>
</section>

<!-- Teaser: overview image with a one-sentence summary of what BTimer does. -->
<section class="hero teaser">
  <div class="container is-max-desktop">
    <div class="hero-body is-centered has-text-centered">
      <h2 class="title is-3">What do we do?</h2>
      <!-- NOTE(review): this id used to be "framework", which is also used by the
           Method Framework image; ids must be unique. Update any selector in
           index.css / index.js that relied on the old id for this image. -->
      <img id="teaser" src="./figures/teaser.png"
           class="interpolation-image"
           alt="Teaser figure: BTimer reconstructs a 3D Gaussian Splatting scene at a chosen timestamp from a monocular video"
           style="max-width: 100%; height: auto;">
      <h2 class="subtitle">
        <span class="dnerf">BTimer:</span>
        Given a monocular video as input, our method reconstructs a 3D Gaussian Splatting (3DGS) representation at any desired timestamp in a feed-forward fashion.
      </h2>
    </div>
  </div>
</section>

<!-- Highlighted summary of the two main contributions, one paragraph each. -->
<section class="hero is-light" style="margin-top: 20px;">
  <div class="hero-body has-text-centered">
    <h2 class="title is-3">Technical Contributions</h2>
    <div class="subtitle">
      <p>
        We present the first feed-forward reconstruction model for dynamic scenes using a <strong>bullet-time</strong> formulation.
      </p>
      <p>
        BTimer reconstructs a bullet-time scene within 150ms while reaching state-of-the-art performance on both static and dynamic scene datasets, even compared with optimization-based approaches.
      </p>
    </div>
  </div>
</section>

<!-- Method overview: pipeline figure with a caption describing inputs and output. -->
<section class="hero teaser">
  <div class="container is-max-desktop">
    <div class="hero-body is-centered has-text-centered">
      <h2 class="title is-3">Method Framework</h2>
      <img id="framework" src="./figures/method.png"
           class="interpolation-image"
           alt="Method framework: context frames with Plücker and timestamp embeddings are mapped to a 3DGS representation at the bullet timestamp">
      <h2 class="subtitle">
        The model takes as input a sequence of context frames and their Plücker embeddings, along with the context timestamp and target (‘bullet’) timestamp embeddings. It then directly predicts the 3DGS representation at the bullet timestamp.
      </h2>
    </div>
  </div>
</section>



<section class="section">
    <div class="columns is-centered">
      <div class="column is-full-width has-text-centered">
        <!-- Results -->
        <div class="content">
        <h2 class="title is-3">Results</h2>
        <h3 class="title is-4">Qualitative Results</h3>
          
        <!-- Sora gallery: one main player plus a strip of thumbnails. Each thumbnail's
             data-video attribute names the clip it stands for (presumably loaded into
             #main-video by index.js on click; confirm against that script). -->
        <div class="video-body">
          <div class="video-container">
            <video id="main-video" autoplay controls muted loop playsinline>
                <source src="./sora_results/big-sur_vid.mp4" type="video/mp4">
                Your browser does not support the video tag.
            </video>
          </div>
          <!-- Alt text names the scene instead of an arbitrary "Video N" counter. -->
          <div class="thumbnail-container">
            <img src="thumbnail/big-sur_vid.jpg" alt="Big Sur scene" class="thumbnail" data-video="./sora_results/big-sur_vid.mp4">
            <img src="thumbnail/robot-video-game_vid.jpg" alt="Robot video game scene" class="thumbnail" data-video="./sora_results/robot-video-game_vid.mp4">
            <img src="thumbnail/amalfi-coast_vid.jpg" alt="Amalfi coast scene" class="thumbnail" data-video="./sora_results/amalfi-coast_vid.mp4">
            <img src="thumbnail/birds-over-river_vid.jpg" alt="Birds over river scene" class="thumbnail" data-video="./sora_results/birds-over-river_vid.mp4">
            <img src="thumbnail/closeup-man-in-glasses_vid.jpg" alt="Close-up of a man in glasses scene" class="thumbnail" data-video="./sora_results/closeup-man-in-glasses_vid.mp4">
            <img src="thumbnail/grandma-birthday_vid.jpg" alt="Grandma birthday scene" class="thumbnail" data-video="./sora_results/grandma-birthday_vid.mp4">
            <img src="thumbnail/cloud-man_vid.jpg" alt="Cloud man scene" class="thumbnail" data-video="./sora_results/cloud-man_vid.mp4">
            <img src="thumbnail/octopus-and-crab_vid.jpg" alt="Octopus and crab scene" class="thumbnail" data-video="./sora_results/octopus-and-crab_vid.mp4">
            <img src="thumbnail/tiny-construction_vid.jpg" alt="Tiny construction scene" class="thumbnail" data-video="./sora_results/tiny-construction_vid.mp4">
          </div>
            <!-- The span reproduces the look of the obsolete <big> element (font-size: larger). -->
            <span style="font-size: larger;"><em>Qualitative Results on SORA scenes.</em> We pause the video at a frame and move the camera to make a bullet-time effect.</span>
            <br>
        </div>

        <!-- DAVIS gallery: one main player plus a strip of thumbnails. Each thumbnail's
             data-video attribute names the clip it stands for (presumably loaded into
             #main-video-davis by index.js on click; confirm against that script). -->
        <div class="video-body">
          <div class="video-container-davis">
            <video id="main-video-davis" autoplay controls muted loop playsinline>
                <source src="./davis_results/tennis_demo.mp4" type="video/mp4">
                Your browser does not support the video tag.
            </video>
          </div>
          <!-- Alt text names the sequence instead of an arbitrary "Video N" counter. -->
          <div class="thumbnail-container">
            <img src="thumbnail/tennis_demo.jpg" alt="Tennis sequence" class="thumbnail-davis" data-video="./davis_results/tennis_demo.mp4">
            <img src="thumbnail/dance-twirl_demo.jpg" alt="Dance twirl sequence" class="thumbnail-davis" data-video="./davis_results/dance-twirl_demo.mp4">
            <img src="thumbnail/bear_demo.jpg" alt="Bear sequence" class="thumbnail-davis" data-video="./davis_results/bear_demo.mp4">
            <img src="thumbnail/hockey_demo.jpg" alt="Hockey sequence" class="thumbnail-davis" data-video="./davis_results/hockey_demo.mp4">
            <img src="thumbnail/horsejump-high_demo.jpg" alt="Horse jump (high) sequence" class="thumbnail-davis" data-video="./davis_results/horsejump-high_demo.mp4">
            <img src="thumbnail/train_demo.jpg" alt="Train sequence" class="thumbnail-davis" data-video="./davis_results/train_demo.mp4">
            <img src="thumbnail/drift-turn_demo.jpg" alt="Drift turn sequence" class="thumbnail-davis" data-video="./davis_results/drift-turn_demo.mp4">
            <img src="thumbnail/parkour_demo.jpg" alt="Parkour sequence" class="thumbnail-davis" data-video="./davis_results/parkour_demo.mp4">
            <img src="thumbnail/horsejump-low_demo.jpg" alt="Horse jump (low) sequence" class="thumbnail-davis" data-video="./davis_results/horsejump-low_demo.mp4">
            <img src="thumbnail/libby_demo.jpg" alt="Libby sequence" class="thumbnail-davis" data-video="./davis_results/libby_demo.mp4">
            <img src="thumbnail/lucia_demo.jpg" alt="Lucia sequence" class="thumbnail-davis" data-video="./davis_results/lucia_demo.mp4">
            <!-- Paths here previously contained a doubled slash. -->
            <img src="thumbnail/skate-park_demo.jpg" alt="Skate park sequence" class="thumbnail-davis" data-video="./davis_results/skate-park_demo.mp4">
            <img src="thumbnail/stunt_demo.jpg" alt="Stunt sequence" class="thumbnail-davis" data-video="./davis_results/stunt_demo.mp4">
            <img src="thumbnail/tractor-sand_demo.jpg" alt="Tractor on sand sequence" class="thumbnail-davis" data-video="./davis_results/tractor-sand_demo.mp4">
          </div>
            <!-- The span reproduces the look of the obsolete <big> element (font-size: larger). -->
            <span style="font-size: larger;"><em>Qualitative Results on DAVIS dataset.</em> Left is the input video, right is the video rendered from a novel camera trajectory.</span>
            <br>
        </div>
 
          <!-- DyCheck iPhone qualitative results: nine looping clips, each 30% wide.
               The players carry no id: every one previously reused id="gs", and ids
               must be unique. NOTE(review): confirm nothing in index.css / index.js
               targets #gs; if it does, switch that selector to a class. -->
          <figure>
            <video autoplay controls muted loop playsinline style="width: 30%;">
              <source src="./dynamic/iphone1.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 30%;">
              <source src="./dynamic/iphone2.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 30%;">
              <source src="./dynamic/iphone33.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 30%;">
              <source src="./dynamic/iphone4.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 30%;">
              <source src="./dynamic/iphone5.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 30%;">
              <source src="./dynamic/iphone9.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 30%;">
              <source src="./dynamic/iphone7.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 30%;">
              <source src="./dynamic/iphone8.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 30%;">
              <source src="./dynamic/iphone6.mp4" type="video/mp4">
            </video>
              <br>
              <!-- The span reproduces the look of the obsolete <big> element (font-size: larger). -->
              <span style="font-size: larger;"><em>Qualitative Results on DyCheck iPhone dataset. </em>Left is the input video, right two are the videos rendered from novel camera trajectories.</span>
              <br>
          </figure>

        <!-- Benchmark comparisons: a row with the LPIPS plot and two NVIDIA Dynamic Scene
             clips, followed by three DyCheck iPhone comparison clips.
             The players carry no id: every one previously reused id="gs", and ids
             must be unique. NOTE(review): confirm nothing in index.css / index.js
             targets #gs; if it does, switch that selector to a class. -->
        <h3 class="title is-4">Dynamic Novel View Synthesis Benchmark Results</h3>
          <figure style="display: flex; flex-direction: column; align-items: center; justify-content: center; gap: 20px; text-align: center;">
            <div style="display: flex; align-items: center; justify-content: center; gap: 10px;">
                <img id="egt-table" src="./nsff/lpips_blobs.png"
                     class="interpolation-image" style="width: 30%; height: auto;"
                     alt="Quantitative Comparison">
                <video autoplay controls muted loop playsinline style="width: 30%;">
                    <source src="./nsff/nsff1.mp4" type="video/mp4">
                </video>
                <video autoplay controls muted loop playsinline style="width: 30%;">
                    <source src="./nsff/nsff2.mp4" type="video/mp4">
                </video>
            </div>
            <figcaption>
                Baseline results on NVIDIA Dynamic Scene Dataset.
            </figcaption>
            <figure>
              <video autoplay controls muted loop playsinline style="width: 80%;">
                <source src="./dynamic/scene1.mp4" type="video/mp4">
              </video>
              <video autoplay controls muted loop playsinline style="width: 80%;">
                <source src="./dynamic/scene2.mp4" type="video/mp4">
              </video>
              <video autoplay controls muted loop playsinline style="width: 80%;">
                <source src="./dynamic/scene3.mp4" type="video/mp4">
              </video>
                <figcaption>
                  Baseline comparisons on DyCheck iPhone Scenes. We mask areas that are not co-visible.
                </figcaption>
            </figure>
        </figure>
            
        <!-- Static-scene results: a single looping clip, 90% wide.
             The player carries no id: it previously reused id="gs", shared with the
             other players on the page, and ids must be unique. NOTE(review): confirm
             nothing in index.css / index.js targets #gs. -->
        <h3 class="title is-4">Results on Static Scenes</h3>
          <figure>
            <video autoplay controls muted loop playsinline style="width: 90%;">
              <source src="./figures/static_video.mp4" type="video/mp4">
            </video>
              <figcaption>
                Results on the Tanks &amp; Temples static scenes benchmark.
              </figcaption>
          </figure>
        
        <!-- NTE module ablation: four looping clips, each 60% wide.
             The players carry no id: every one previously reused id="gs", and ids
             must be unique. NOTE(review): confirm nothing in index.css / index.js
             targets #gs. The empty figcaption was dropped; add one back once
             caption text exists. -->
        <h3 class="title is-4">Effect of the NTE Module</h3>
          <figure>
            <video autoplay controls muted loop playsinline style="width: 60%;">
              <source src="./nte/nte1.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 60%;">
              <source src="./nte/nte22.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 60%;">
              <source src="./nte/nte3.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 60%;">
              <source src="./nte/nte4.mp4" type="video/mp4">
            </video>
          </figure>


        <!-- Learned deformation: intro sentence plus four looping clips, each 60% wide.
             The players carry no id: every one previously reused id="gs", and ids
             must be unique. NOTE(review): confirm nothing in index.css / index.js
             targets #gs. The empty figcaption was dropped. -->
        <h3 class="title is-4">Visualization of learned deformation</h3>
        <p>
          We visualize the deformation learned by our model. With only 4 images as input, our model can reconstruct smooth 3D motions.
        </p>
          <figure>
            <video autoplay controls muted loop playsinline style="width: 60%;">
              <source src="./objects/0.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 60%;">
              <source src="./objects/1.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 60%;">
              <source src="./objects/2.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 60%;">
              <source src="./objects/3.mp4" type="video/mp4">
            </video>
          </figure>

          <!-- Learned scene flow: intro sentence plus four looping clips, each 60% wide.
               The players carry no id: every one previously reused id="gs", and ids
               must be unique. NOTE(review): confirm nothing in index.css / index.js
               targets #gs. The empty figcaption was dropped. -->
          <h3 class="title is-4">Visualization of learned scene flow</h3>
          <p>
            We visualize the scene flow learned by our model. We color the Gaussians by the pixel positions they associate with.
          </p>
          <figure>
            <video autoplay controls muted loop playsinline style="width: 60%;">
              <source src="./objects/flow_0.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 60%;">
              <source src="./objects/flow_1.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 60%;">
              <source src="./objects/flow_2.mp4" type="video/mp4">
            </video>
            <video autoplay controls muted loop playsinline style="width: 60%;">
              <source src="./objects/flow_3.mp4" type="video/mp4">
            </video>
          </figure>
        </div>
      </div>
      

    </div>
</section>

</body>
</html>
