<!DOCTYPE html>
<html lang="en">
<head>
  <meta charset="utf-8">
  <meta name="viewport" content="width=device-width, initial-scale=1">
  <title>Zero-shot Synthetic Video Realism Enhancement via Structure-aware Denoising</title>

  <!-- Google Analytics (gtag.js): the loader script is async; the inline
       snippet below creates the dataLayer array and pushes the first calls. -->
  <script async src="https://www.googletagmanager.com/gtag/js?id=G-PYVRSFMDRL"></script>
  <script>
    window.dataLayer = window.dataLayer || [];

    // Pushes the raw `arguments` object (not a copy) onto dataLayer.
    function gtag() {
      dataLayer.push(arguments);
    }

    gtag('js', new Date());

    gtag('config', 'G-PYVRSFMDRL');
  </script>

  <!-- Web fonts. The family separator is written as %7C because a literal
       vertical bar is not a valid character in a URL. -->
  <link href="https://fonts.googleapis.com/css?family=Google+Sans%7CNoto+Sans%7CCastoro"
        rel="stylesheet">

  <!-- Stylesheets: Bulma and its carousel/slider add-ons, icon fonts, then page styles. -->
  <link rel="stylesheet" href="./static/css/bulma.min.css">
  <link rel="stylesheet" href="./static/css/bulma-carousel.min.css">
  <link rel="stylesheet" href="./static/css/bulma-slider.min.css">
  <link rel="stylesheet" href="./static/css/fontawesome.all.min.css">
  <link rel="stylesheet"
        href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css">
  <link rel="stylesheet" href="./static/css/index.css">

  <!-- Scripts. Load order is kept as-is: jQuery first, page script last. -->
  <script src="https://ajax.googleapis.com/ajax/libs/jquery/3.5.1/jquery.min.js"></script>
  <script defer src="./static/js/fontawesome.all.min.js"></script>
  <script src="./static/js/bulma-carousel.min.js"></script>
  <script src="./static/js/bulma-slider.min.js"></script>
  <script src="./static/js/index.js"></script>
</head>
<body>


<!-- Page header: the paper title, centred, as the document's only h1. -->
<section class="hero">
  <div class="hero-body">
    <div class="container is-max-desktop">
      <div class="columns is-centered">
        <div class="column has-text-centered">
          <h1 class="title is-2 publication-title">Zero-shot Synthetic Video Realism Enhancement via Structure-aware Denoising</h1>
        </div>
      </div>
    </div>
  </div>
</section>

<section class="hero teaser">
  <div class="container is-max-desktop">
    
        <!-- <center><h2 class="title is-3">Abstract</h2></center> -->
    <!-- <div class="hero-body has-text-centered">
        <img src = "./images/teaser.png" height="80%"></img><br>

    </div> -->

    <p>
      We propose an approach to enhancing synthetic video realism, which can re-render synthetic videos from a simulator in a photorealistic fashion. Our realism enhancement approach is a zero-shot framework that focuses on preserving the multi-level structures from synthetic videos into the enhanced one in both spatial and temporal domains, built upon a diffusion video foundational model without further fine-tuning. Specifically, we incorporate an effective modification to have the generation/denoising process conditioned on estimated structure-aware information from the synthetic video, such as depth maps, semantic maps, and edge maps, by another model, rather than extracting the information from a simulator. This guidance ensures that the enhanced videos are consistent with the original synthetic video at both structural and semantic levels. Our approach is a simple yet general and powerful approach to enhancing synthetic video realism: we show that our approach outperforms alternative baselines in structural consistency with the original video while maintaining state-of-the-art photorealism quality in our experiments.
    </p>
    <br>
    
  </div>
</section>



<!-- Overview: the method figure. The image is wrapped in a link to the same
     file so it can be opened on its own. -->
<section class="section is-light is-small">
  <div class="container is-max-desktop">
    <!-- The heading stays the only child of its wrapper, as it was before. -->
    <div class="has-text-centered"><h2 class="title is-3">Overview</h2></div>
    <div class="hero-body">
      <a href="./images/model.png"><img src="./images/model.png" alt="Overview figure of the proposed method (opens the full-size image)"></a><br>
    </div>
  </div>
  <!--/ Overview. -->

</section>

<!-- NOTE(review): this section is opened and closed on the same line, so the
     results container below is its sibling, not its child. Confirm whether the
     results were meant to be wrapped by it before changing it, since doing so
     would alter the page spacing. -->
<section class="section"></section>
  <div class="container is-max-desktop">

    <div class="has-text-centered"><h2 class="title is-3">Qualitative Results</h2></div><br>
    <br>
    <!-- Two CARLA / ours pairs (clips F61 and F69). The first wrapper and the
         first video keep their ids because the inline script at the end of the
         page looks them up with getElementById; the other players have none,
         since an id must be unique in the document. -->
    <div class="columns is-centered">
      <div class="column">
        <div id="video-container">
          <div class="has-text-centered"><p><b> CARLA </b></p></div>
          <video id="video" muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/carla/F61-ori.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> Ours </b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/ours/F61-ours.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> CARLA</b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/carla/F69_ori.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> Ours</b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/ours/F69_ours.mp4" type="video/mp4">
          </video>
        </div>
      </div>
    </div>
    <br>
    <!-- Clip 418d: CARLA input next to WAN2.1 VACE, Cosmos-Transfer, and our result. -->
    <div class="columns is-centered">
      <div class="column">
        <div>
          <div class="has-text-centered"><p><b> CARLA </b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/carla/418d.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> WAN2.1 VACE</b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/vace/418d.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> Cosmos-Transfer</b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/base/418d.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> Ours</b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/ours/418d.mp4" type="video/mp4">
          </video>
        </div>
      </div>
    </div>
    <br>
    <!-- Clip 3161: CARLA input next to WAN2.1 VACE, Cosmos-Transfer, and our result. -->
    <div class="columns is-centered">
      <div class="column">
        <div>
          <div class="has-text-centered"><p><b> CARLA </b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/carla/3161.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> WAN2.1 VACE</b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/vace/3161.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> Cosmos-Transfer</b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/base/3161.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> Ours</b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/ours/3161.mp4" type="video/mp4">
          </video>
        </div>
      </div>
    </div>
    <!-- Clip 2032: CARLA input next to WAN2.1 VACE, Cosmos-Transfer, and our result. -->
    <div class="columns is-centered">
      <div class="column">
        <div>
          <div class="has-text-centered"><p><b> CARLA </b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/carla/2032.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> WAN2.1 VACE</b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/vace/2032.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> Cosmos-Transfer</b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/base/2032.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> Ours</b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/ours/2032.mp4" type="video/mp4">
          </video>
        </div>
      </div>
    </div>
    <br>
    <!-- Clip 180d: CARLA input next to WAN2.1 VACE, Cosmos-Transfer, and our result. -->
    <div class="columns is-centered">
      <div class="column">
        <div>
          <div class="has-text-centered"><p><b> CARLA </b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/carla/180d.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> WAN2.1 VACE</b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/vace/180d.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> Cosmos-Transfer</b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/base/180d.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> Ours </b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/ours/180d.mp4" type="video/mp4">
          </video>
        </div>
      </div>
    </div>
    <br>
    <!-- Clip 0fe7: CARLA input next to Cosmos-Transfer and our result (three columns). -->
    <div class="columns is-centered">
      <div class="column">
        <div>
          <div class="has-text-centered"><p><b> CARLA </b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/carla/0fe7.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> Cosmos-Transfer</b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/base/0fe7base.mp4" type="video/mp4">
          </video>
        </div>
      </div>
      <div class="column">
        <div class="content">
          <div class="has-text-centered"><p><b> Ours </b></p></div>
          <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
            <source src="./video/ours/0fe7ours.mp4" type="video/mp4">
          </video>
        </div>
      </div>
    </div>
    <br>
    <!-- More examples. Clip 1c4a: CARLA input next to WAN2.1 VACE,
         Cosmos-Transfer, and our result. -->
    <h3 class="title is-4"> More Examples </h3>
      <div class="columns is-centered">
        <div class="column">
          <div>
            <div class="has-text-centered"><p><b> CARLA </b></p></div>
            <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
              <source src="./video/carla/1c4a.mp4" type="video/mp4">
            </video>
          </div>
        </div>
        <div class="column">
          <div class="content">
            <div class="has-text-centered"><p><b> WAN2.1 VACE</b></p></div>
            <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
              <source src="./video/vace/1c4a.mp4" type="video/mp4">
            </video>
          </div>
        </div>
        <div class="column">
          <div class="content">
            <div class="has-text-centered"><p><b> Cosmos-Transfer</b></p></div>
            <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
              <source src="./video/base/1c4a.mp4" type="video/mp4">
            </video>
          </div>
        </div>
        <div class="column">
          <div class="content">
            <div class="has-text-centered"><p><b> Ours </b></p></div>
            <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
              <source src="./video/ours/1c4a.mp4" type="video/mp4">
            </video>
          </div>
        </div>
      </div>

    <br>
    <!-- GTA V results: three GTA / ours pairs, two pairs in the first row and
         one in the second. -->
    <h3 class="title is-4"> Qualitative Results on GTA V </h3>
      <div class="columns is-centered">
        <div class="column">
          <div>
            <div class="has-text-centered"><p><b> GTA </b></p></div>
            <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
              <source src="./video/gta/gta1.mp4" type="video/mp4">
            </video>
          </div>
        </div>
        <div class="column">
          <div class="content">
            <div class="has-text-centered"><p><b> Ours </b></p></div>
            <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
              <source src="./video/ours/gta1.mp4" type="video/mp4">
            </video>
          </div>
        </div>
        <div class="column">
          <div class="content">
            <div class="has-text-centered"><p><b> GTA</b></p></div>
            <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
              <source src="./video/gta/gta2.mp4" type="video/mp4">
            </video>
          </div>
        </div>
        <div class="column">
          <div class="content">
            <div class="has-text-centered"><p><b> Ours </b></p></div>
            <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
              <source src="./video/ours/gta2.mp4" type="video/mp4">
            </video>
          </div>
        </div>
      </div>
      <div class="columns is-centered">
        <div class="column">
          <div>
            <div class="has-text-centered"><p><b> GTA </b></p></div>
            <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
              <source src="./video/gta/gta3.mp4" type="video/mp4">
            </video>
          </div>
        </div>
        <div class="column">
          <div class="content">
            <div class="has-text-centered"><p><b> Ours </b></p></div>
            <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
              <source src="./video/ours/gta3.mp4" type="video/mp4">
            </video>
          </div>
        </div>
      </div>


    <br>
    <!-- FLUX comparison. Clip 79d0: CARLA input next to the frame-by-frame
         FLUX controlnet output and our result. -->
    <h3 class="title is-4"> Compared to FLUX </h3>
      <div class="columns is-centered">
        <div class="column">
          <div>
            <div class="has-text-centered"><p><b> CARLA </b></p></div>
            <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
              <source src="./video/carla/79d0.mp4" type="video/mp4">
            </video>
          </div>
        </div>
        <div class="column">
          <div class="content">
            <div class="has-text-centered"><p><b> FLUX controlnet frame by frame</b></p></div>
            <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
              <source src="./video/flux/79d0.mp4" type="video/mp4">
            </video>
          </div>
        </div>

        <div class="column">
          <div class="content">
            <div class="has-text-centered"><p><b> Ours </b></p></div>
            <video muted controls autoplay loop playsinline style="width: 100%; height: 150px; object-fit: cover;">
              <source src="./video/ours/79d0.mp4" type="video/mp4">
            </video>
          </div>
        </div>
      </div>
      <!-- Indoor scene: simulator render next to our result. Each player is
           70% wide and centred inside its column. -->
      <h3 class="title is-4"> Indoor Environment generated by Behavior Vision Suite </h3>
        <div class="columns is-centered">
          <div class="column">
            <div>
              <div class="has-text-centered"><p><b> Simulator </b></p></div>
              <div class="has-text-centered">
                <video muted controls autoplay loop playsinline style="width: 70%; height: 150px; object-fit: cover;">
                  <source src="./video/carla/indoor_simulator.mp4" type="video/mp4">
                </video>
              </div>
            </div>
          </div>
          <div class="column">
            <div class="content">
              <div class="has-text-centered"><p><b> Ours </b></p></div>
              <div class="has-text-centered">
                <video muted controls autoplay loop playsinline style="width: 70%; height: 150px; object-fit: cover;">
                  <source src="./video/ours/indoor_gen.mp4" type="video/mp4">
                </video>
              </div>
            </div>
          </div>
        </div>
  </div>
  <!-- /Qualitative results container (the "container is-max-desktop" div that
       holds every results row). -->

<script>
      // Plays the first results clip while its wrapper overlaps the viewport
      // and pauses it otherwise. Both elements are looked up by id, so only the
      // first matching wrapper and video in the document are driven.
      var videoContainer = document.getElementById('video-container');
      var video = document.getElementById('video');

      // Without both elements there is nothing to drive; skip the listener
      // instead of throwing on a null reference.
      if (videoContainer && video) {
        window.addEventListener('scroll', function () {
          // Read the wrapper's position at scroll time, in viewport
          // coordinates. A value cached at parse time goes stale once late
          // content shifts the layout, and offsetTop is measured from the
          // offsetParent rather than from the top of the document.
          var bounds = videoContainer.getBoundingClientRect();
          var viewportHeight = window.innerHeight || document.documentElement.clientHeight;
          var isVisible = bounds.bottom > 0 && bounds.top < viewportHeight;

          if (isVisible) {
            // play() returns a promise in current browsers; it rejects when
            // playback is refused or interrupted by a pause(). Swallow that
            // rejection so it does not surface as an unhandled error.
            var playback = video.play();
            if (playback && typeof playback.catch === 'function') {
              playback.catch(function () {});
            }
          } else {
            video.pause();
          }
        });
      }
</script>

</body>
</html>
