<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" lang="en">
<head>
<!-- The page language is declared on the root element so assistive technology
     and translation tools can pick the right pronunciation and dictionary. -->
<!-- NOTE(review): the XHTML 1.0 Transitional doctype is kept as is. Moving to the
     HTML5 doctype changes the rendering mode and may shift spacing around the
     inline videos; revisit together with the stylesheets. -->
<!-- NOTE(review): there is no viewport meta tag. Adding one changes how the page
     is laid out on phones; confirm style.css and index.css are responsive first. -->
<meta http-equiv="Content-Type" content="text/html; charset=UTF-8">
<title>From Silence to Sound: Towards Audio-Visual Subject Customization</title>

<!-- Stylesheets: page styles, web fonts, Bulma, then project overrides -->
<link href="style.css" rel="stylesheet" type="text/css">

<link href="https://fonts.googleapis.com/css?family=Google+Sans|Noto+Sans|Castoro"
      rel="stylesheet">
<link rel="stylesheet" href="./static/css/bulma.min.css">
<link rel="stylesheet" href="./static/css/index.css">


</head>

<body>
	<!-- Floating "Back to top" control. It is a plain link (styled with the Bulma
	     button class) because it navigates; a link nested inside a button element
	     is invalid and produced two tab stops, one of which did nothing on Enter.
	     The #top fragment scrolls to the start of the document even when no
	     element carries that id. -->
	<a class="button" href="#top" style="position: fixed;right: 15px;top:  50%;height: 100px;width: 140px; font-size: 20px;">Back to top</a> 
<div class="page-container">
  
  <!-- Hero banner: paper title, anonymous-submission byline, and same-page jump links -->
  <section class="hero" style="margin-top: 2em;">
    <div class="hero-body">
      <div class="container is-max-desktop">
        <div class="columns is-centered">
          <div class="column has-text-centered">

            <!-- Title -->
            <h1 class="title is-1 publication-title">From Silence to Sound:<br>Towards Audio-Visual Subject Customization</h1>
            <div class="column is-full_width">
            </div>

            <!-- Byline (anonymized for review) -->
            <div class="is-size-5 publication-authors">
              <span class="author-block">Paper ID: 972</span><br>
              <span class="author-block">Anonymous Authors</span>
            </div>

            <!-- Jump links: each href is a same-page fragment -->
            <div class="column has-text-centered">
              <div class="publication-links">

                <span class="link-block">
                  <a class="external-link button is-normal is-rounded" href="#our_results_container">
                    <span>Showcases</span>
                  </a>
                </span>

                <span class="link-block">
                  <a class="external-link button is-normal is-rounded" href="#comparison_with_baseline_container">
                    <span>Comparisons</span>
                  </a>
                </span>

                <span class="link-block">
                  <a class="external-link button is-normal is-rounded" href="#comparison_with_cfg_methods_container">
                    <span>Ablation Study</span>
                  </a>
                </span>

              </div>
            </div>

          </div>
        </div>
      </div>
    </div>
  </section>
	


    <!-- Divider between the hero banner and the result sections.
         The empty link to #top that used to sit here was removed: it had no text,
         so it was an invisible, unnamed keyboard tab stop, and the #top fragment
         needs no target element to scroll to the start of the document. -->
  <hr style="margin: 0.75em 0;">

  <!-- ===== BEGIN SECTION: Showcases ===== -->
  <!-- Heading targeted by the "Showcases" jump link; the empty inner anchor is a legacy named target -->
  <h2 id="our_results_container" align="left" style="margin-top: 0em; margin-bottom: 0.4em;"><a id="image-results" name="image-results"></a>Showcases</h2>

    <!-- Showcase: Kungfu_Panda_raccoon. Three reference clips, then four generated clips. -->
    <div class="result-container">

      <!-- Reference clips (ref0..ref2) -->
      <div class="reference-section">
        <h3 class="task-title">Reference Videos</h3>
        <div class="reference-videos-vertical">
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/Kungfu_Panda_raccoon/ref0.mp4" controls autoplay></video>
          </div>
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/Kungfu_Panda_raccoon/ref1.mp4" controls autoplay></video>
          </div>
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/Kungfu_Panda_raccoon/ref2.mp4" controls autoplay></video>
          </div>
        </div>
      </div>

      <!-- Generated clips (1..4) -->
      <div class="generated-videos-grid">
        <video class="generated-video" src="./results_demo/Kungfu_Panda_raccoon/1.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/Kungfu_Panda_raccoon/2.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/Kungfu_Panda_raccoon/3.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/Kungfu_Panda_raccoon/4.mp4" controls autoplay></video>
      </div>
    </div>

    <!-- Showcase: Wall-E Captain. Three reference clips, then four generated clips. -->
    <div class="result-container">

      <!-- Reference clips (ref0..ref2) -->
      <div class="reference-section">
        <h3 class="task-title">Reference Videos</h3>
        <div class="reference-videos-vertical">
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/016_Walle_Captain/ref0.mp4" controls autoplay></video>
          </div>
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/016_Walle_Captain/ref1.mp4" controls autoplay></video>
          </div>
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/016_Walle_Captain/ref2.mp4" controls autoplay></video>
          </div>
        </div>
      </div>

      <!-- Generated clips (1..4) -->
      <div class="generated-videos-grid">
        <video class="generated-video" src="./results_demo/016_Walle_Captain/1.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/016_Walle_Captain/2.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/016_Walle_Captain/3.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/016_Walle_Captain/4.mp4" controls autoplay></video>
      </div>
    </div>

    <!-- Showcase: Zootopia Judy. Three reference clips, then four generated clips. -->
    <div class="result-container">

      <!-- Reference clips (ref0..ref2) -->
      <div class="reference-section">
        <h3 class="task-title">Reference Videos</h3>
        <div class="reference-videos-vertical">
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/011_Zootopia_Judy/ref0.mp4" controls autoplay></video>
          </div>
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/011_Zootopia_Judy/ref1.mp4" controls autoplay></video>
          </div>
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/011_Zootopia_Judy/ref2.mp4" controls autoplay></video>
          </div>
        </div>
      </div>

      <!-- Generated clips (1..4) -->
      <div class="generated-videos-grid">
        <video class="generated-video" src="./results_demo/011_Zootopia_Judy/1.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/011_Zootopia_Judy/2.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/011_Zootopia_Judy/3.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/011_Zootopia_Judy/4.mp4" controls autoplay></video>
      </div>
    </div>

    <!-- Showcase: Arcane Viktor. Three reference clips, then four generated clips. -->
    <div class="result-container">

      <!-- Reference clips (ref0..ref2) -->
      <div class="reference-section">
        <h3 class="task-title">Reference Videos</h3>
        <div class="reference-videos-vertical">
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/arcane_viktor/ref0.mp4" controls autoplay></video>
          </div>
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/arcane_viktor/ref1.mp4" controls autoplay></video>
          </div>
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/arcane_viktor/ref2.mp4" controls autoplay></video>
          </div>
        </div>
      </div>

      <!-- Generated clips (1..4) -->
      <div class="generated-videos-grid">
        <video class="generated-video" src="./results_demo/arcane_viktor/1.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/arcane_viktor/2.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/arcane_viktor/3.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/arcane_viktor/4.mp4" controls autoplay></video>
      </div>
    </div>

    <!-- Showcase: Arcane Caitlyn. Three reference clips, then four generated clips. -->
    <div class="result-container">

      <!-- Reference clips (ref0..ref2) -->
      <div class="reference-section">
        <h3 class="task-title">Reference Videos</h3>
        <div class="reference-videos-vertical">
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/arcane_caitlyn/ref0.mp4" controls autoplay></video>
          </div>
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/arcane_caitlyn/ref1.mp4" controls autoplay></video>
          </div>
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/arcane_caitlyn/ref2.mp4" controls autoplay></video>
          </div>
        </div>
      </div>

      <!-- Generated clips (1..4) -->
      <div class="generated-videos-grid">
        <video class="generated-video" src="./results_demo/arcane_caitlyn/1.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/arcane_caitlyn/2.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/arcane_caitlyn/3.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/arcane_caitlyn/4.mp4" controls autoplay></video>
      </div>
    </div>

    <!-- Showcase: Interstellar Amelia. Three reference clips, then four generated clips. -->
    <div class="result-container">

      <!-- Reference clips (ref0..ref2) -->
      <div class="reference-section">
        <h3 class="task-title">Reference Videos</h3>
        <div class="reference-videos-vertical">
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/008_Interstellar_Amelia/ref0.mp4" controls autoplay></video>
          </div>
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/008_Interstellar_Amelia/ref1.mp4" controls autoplay></video>
          </div>
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/008_Interstellar_Amelia/ref2.mp4" controls autoplay></video>
          </div>
        </div>
      </div>

      <!-- Generated clips (1..4) -->
      <div class="generated-videos-grid">
        <video class="generated-video" src="./results_demo/008_Interstellar_Amelia/1.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/008_Interstellar_Amelia/2.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/008_Interstellar_Amelia/3.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/008_Interstellar_Amelia/4.mp4" controls autoplay></video>
      </div>
    </div>

    <!-- Showcase: Game of Thrones, Ned. Three reference clips, then four generated clips. -->
    <div class="result-container">

      <!-- Reference clips (ref0..ref2) -->
      <div class="reference-section">
        <h3 class="task-title">Reference Videos</h3>
        <div class="reference-videos-vertical">
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/Games_of_Thrones_S01_Ned/ref0.mp4" controls autoplay></video>
          </div>
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/Games_of_Thrones_S01_Ned/ref1.mp4" controls autoplay></video>
          </div>
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/Games_of_Thrones_S01_Ned/ref2.mp4" controls autoplay></video>
          </div>
        </div>
      </div>

      <!-- Generated clips (1..4) -->
      <div class="generated-videos-grid">
        <video class="generated-video" src="./results_demo/Games_of_Thrones_S01_Ned/1.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/Games_of_Thrones_S01_Ned/2.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/Games_of_Thrones_S01_Ned/3.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/Games_of_Thrones_S01_Ned/4.mp4" controls autoplay></video>
      </div>
    </div>

    <!-- Showcase: Game of Thrones, Sansa. Three reference clips, then four generated clips. -->
    <div class="result-container">

      <!-- Reference clips (ref0..ref2) -->
      <div class="reference-section">
        <h3 class="task-title">Reference Videos</h3>
        <div class="reference-videos-vertical">
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/Games_of_Thrones_S01_Sansa/ref0.mp4" controls autoplay></video>
          </div>
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/Games_of_Thrones_S01_Sansa/ref1.mp4" controls autoplay></video>
          </div>
          <div class="reference-video-wrapper">
            <video class="reference-video" src="./results_demo/Games_of_Thrones_S01_Sansa/ref2.mp4" controls autoplay></video>
          </div>
        </div>
      </div>

      <!-- Generated clips (1..4) -->
      <div class="generated-videos-grid">
        <video class="generated-video" src="./results_demo/Games_of_Thrones_S01_Sansa/1.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/Games_of_Thrones_S01_Sansa/2.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/Games_of_Thrones_S01_Sansa/3.mp4" controls autoplay></video>
        <video class="generated-video" src="./results_demo/Games_of_Thrones_S01_Sansa/4.mp4" controls autoplay></video>
      </div>
    </div>


    <!-- Comparison -->
    <!-- ---------------- BEGIN SECTION ---------------- -->
    <p>&nbsp;</p>
    <hr>

    <!-- Heading targeted by the "Comparisons" jump link. The inner anchor used to
         reuse id/name "image-results", which the Showcases heading anchor already
         carries; ids must be unique in a document, so this one has its own name. -->
    <h2 id="comparison_with_baseline_container" align="left"><a name="comparison-results" id="comparison-results"></a>Comparisons with previous methods</h2>
    
    <!-- Sample 09: prompt text with a show/hide toggle.
         type="button" states that the control never submits a form.
         aria-controls names the panel below; presumably that is the element
         togglePrompt('sample09') shows and hides (confirm against the script). -->
    <div class="sample-section">
      <button type="button" class="prompt-toggle-btn" aria-controls="sample09-prompt" onclick="togglePrompt('sample09')" style="background-color: hsl(204, 86%, 43%);">Hide prompt</button>
      <div id="sample09-prompt" class="prompt-display" style="display: block;">
        <p>The video depicts a scene set in what appears to be a historical or fantasy context, possibly during the Viking era. The character in focus has long hair and a beard, and is wearing a fur-lined garment, suggesting a cold environment. The background is dimly lit, with smoke or mist visible, adding to the atmosphere of an ancient or medieval setting. The character seems to be engaged in a serious conversation or interaction with another person who is partially visible on the right side of the frame. The overall mood of the scene is intense and dramatic.</p>
      </div>
    </div>
    <!-- Comparison for sample_09: three reference clips, then one generated clip per
         method. Every generated clip carries the sample prompt in data-tooltip. -->
    <div class="comparison-result-container">

      <!-- Reference clips (ref0..ref2) -->
      <div class="comparison-reference-section">
        <h3 class="comparison-task-title">Reference Videos</h3>
        <div class="comparison-reference-videos-vertical">
          <div class="comparison-reference-video-wrapper">
            <video class="comparison-reference-video" src="./comparison/sample_09/ref0.mp4" autoplay controls></video>
          </div>
          <div class="comparison-reference-video-wrapper">
            <video class="comparison-reference-video" src="./comparison/sample_09/ref1.mp4" autoplay controls></video>
          </div>
          <div class="comparison-reference-video-wrapper">
            <video class="comparison-reference-video" src="./comparison/sample_09/ref2.mp4" autoplay controls></video>
          </div>
        </div>
      </div>

      <!-- Generated clips, one per method -->
      <div class="comparison-generated-videos-grid">
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">SadTalker</h4>
          <video class="comparison-generated-video video-tooltip"
                 src="./comparison/sample_09/sadtalker.mp4"
                 autoplay controls
                 data-tooltip="The video depicts a scene set in what appears to be a historical or fantasy context, possibly during the Viking era. The character in focus has long hair and a beard, and is wearing a fur-lined garment, suggesting a cold environment. The background is dimly lit, with smoke or mist visible, adding to the atmosphere of an ancient or medieval setting. The character seems to be engaged in a serious conversation or interaction with another person who is partially visible on the right side of the frame. The overall mood of the scene is intense and dramatic."></video>
        </div>
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">Aniportrait</h4>
          <video class="comparison-generated-video video-tooltip"
                 src="./comparison/sample_09/aniportrait.mp4"
                 autoplay controls
                 data-tooltip="The video depicts a scene set in what appears to be a historical or fantasy context, possibly during the Viking era. The character in focus has long hair and a beard, and is wearing a fur-lined garment, suggesting a cold environment. The background is dimly lit, with smoke or mist visible, adding to the atmosphere of an ancient or medieval setting. The character seems to be engaged in a serious conversation or interaction with another person who is partially visible on the right side of the frame. The overall mood of the scene is intense and dramatic."></video>
        </div>
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">Hallo3</h4>
          <video class="comparison-generated-video video-tooltip"
                 src="./comparison/sample_09/hallo3.mp4"
                 autoplay controls
                 data-tooltip="The video depicts a scene set in what appears to be a historical or fantasy context, possibly during the Viking era. The character in focus has long hair and a beard, and is wearing a fur-lined garment, suggesting a cold environment. The background is dimly lit, with smoke or mist visible, adding to the atmosphere of an ancient or medieval setting. The character seems to be engaged in a serious conversation or interaction with another person who is partially visible on the right side of the frame. The overall mood of the scene is intense and dramatic."></video>
        </div>
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">Ours</h4>
          <video class="comparison-generated-video video-tooltip"
                 src="./comparison/sample_09/ours.mp4"
                 autoplay controls
                 data-tooltip="The video depicts a scene set in what appears to be a historical or fantasy context, possibly during the Viking era. The character in focus has long hair and a beard, and is wearing a fur-lined garment, suggesting a cold environment. The background is dimly lit, with smoke or mist visible, adding to the atmosphere of an ancient or medieval setting. The character seems to be engaged in a serious conversation or interaction with another person who is partially visible on the right side of the frame. The overall mood of the scene is intense and dramatic."></video>
        </div>
      </div>
    </div>


    <!-- Sample 94: prompt text with a show/hide toggle.
         type="button" states that the control never submits a form.
         aria-controls names the panel below; presumably that is the element
         togglePrompt('sample94') shows and hides (confirm against the script). -->
    <div class="sample-section">
      <button type="button" class="prompt-toggle-btn" aria-controls="sample94-prompt" onclick="togglePrompt('sample94')" style="background-color: hsl(204, 86%, 43%);">Hide prompt</button>
      <div id="sample94-prompt" class="prompt-display" style="display: block;">
        <p>The image depicts two characters in a dimly lit room, engaged in a conversation. The character on the right is wearing a dark, ornate tunic with intricate designs and a brooch at the collar. This character has short, light-colored hair and appears to be speaking or reacting to something. The character on the left, whose back is partially turned to the camera, has long, braided hair and is wearing a simple, light-colored garment. The setting suggests a medieval or fantasy context, possibly from a television show or movie. The lighting creates a dramatic atmosphere, highlighting the expressions and details of their attire.</p>
      </div>
    </div>
    <!-- Comparison for sample_94: three reference clips, then one generated clip per
         method. Every generated clip carries the sample prompt in data-tooltip. -->
    <div class="comparison-result-container">

      <!-- Reference clips (ref0..ref2) -->
      <div class="comparison-reference-section">
        <h3 class="comparison-task-title">Reference Videos</h3>
        <div class="comparison-reference-videos-vertical">
          <div class="comparison-reference-video-wrapper">
            <video class="comparison-reference-video" src="./comparison/sample_94/ref0.mp4" autoplay controls></video>
          </div>
          <div class="comparison-reference-video-wrapper">
            <video class="comparison-reference-video" src="./comparison/sample_94/ref1.mp4" autoplay controls></video>
          </div>
          <div class="comparison-reference-video-wrapper">
            <video class="comparison-reference-video" src="./comparison/sample_94/ref2.mp4" autoplay controls></video>
          </div>
        </div>
      </div>

      <!-- Generated clips, one per method -->
      <div class="comparison-generated-videos-grid">
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">SadTalker</h4>
          <video class="comparison-generated-video video-tooltip"
                 src="./comparison/sample_94/sadtalker.mp4"
                 autoplay controls
                 data-tooltip="The image depicts two characters in a dimly lit room, engaged in a conversation. The character on the right is wearing a dark, ornate tunic with intricate designs and a brooch at the collar. This character has short, light-colored hair and appears to be speaking or reacting to something. The character on the left, whose back is partially turned to the camera, has long, braided hair and is wearing a simple, light-colored garment. The setting suggests a medieval or fantasy context, possibly from a television show or movie. The lighting creates a dramatic atmosphere, highlighting the expressions and details of their attire."></video>
        </div>
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">Aniportrait</h4>
          <video class="comparison-generated-video video-tooltip"
                 src="./comparison/sample_94/aniportrait.mp4"
                 autoplay controls
                 data-tooltip="The image depicts two characters in a dimly lit room, engaged in a conversation. The character on the right is wearing a dark, ornate tunic with intricate designs and a brooch at the collar. This character has short, light-colored hair and appears to be speaking or reacting to something. The character on the left, whose back is partially turned to the camera, has long, braided hair and is wearing a simple, light-colored garment. The setting suggests a medieval or fantasy context, possibly from a television show or movie. The lighting creates a dramatic atmosphere, highlighting the expressions and details of their attire."></video>
        </div>
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">Hallo3</h4>
          <video class="comparison-generated-video video-tooltip"
                 src="./comparison/sample_94/hallo3.mp4"
                 autoplay controls
                 data-tooltip="The image depicts two characters in a dimly lit room, engaged in a conversation. The character on the right is wearing a dark, ornate tunic with intricate designs and a brooch at the collar. This character has short, light-colored hair and appears to be speaking or reacting to something. The character on the left, whose back is partially turned to the camera, has long, braided hair and is wearing a simple, light-colored garment. The setting suggests a medieval or fantasy context, possibly from a television show or movie. The lighting creates a dramatic atmosphere, highlighting the expressions and details of their attire."></video>
        </div>
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">Ours</h4>
          <video class="comparison-generated-video video-tooltip"
                 src="./comparison/sample_94/ours.mp4"
                 autoplay controls
                 data-tooltip="The image depicts two characters in a dimly lit room, engaged in a conversation. The character on the right is wearing a dark, ornate tunic with intricate designs and a brooch at the collar. This character has short, light-colored hair and appears to be speaking or reacting to something. The character on the left, whose back is partially turned to the camera, has long, braided hair and is wearing a simple, light-colored garment. The setting suggests a medieval or fantasy context, possibly from a television show or movie. The lighting creates a dramatic atmosphere, highlighting the expressions and details of their attire."></video>
        </div>
      </div>
    </div>


    <!-- Sample 12: prompt text with a show/hide toggle.
         type="button" states that the control never submits a form.
         aria-controls names the panel below; presumably that is the element
         togglePrompt('sample12') shows and hides (confirm against the script). -->
    <div class="sample-section">
      <button type="button" class="prompt-toggle-btn" aria-controls="sample12-prompt" onclick="togglePrompt('sample12')" style="background-color: hsl(204, 86%, 43%);">Hide prompt</button>
      <div id="sample12-prompt" class="prompt-display" style="display: block;">
        <p>In the video, a man in a suit and tie is walking down a street with a colorful mural on the wall behind him. He appears to be engaged in a conversation with another person who is partially visible on the left side of the frame. The man in the suit has a backpack over one shoulder and seems to be gesturing or explaining something as he walks. The setting suggests an urban environment with various signs and advertisements in the background. The interaction between the two individuals seems friendly and animated.</p>
      </div>
    </div>
    <!-- Comparison for sample_12: three reference clips, then one generated clip per
         method. Every generated clip carries the sample prompt in data-tooltip. -->
    <div class="comparison-result-container">

      <!-- Reference clips (ref0..ref2) -->
      <div class="comparison-reference-section">
        <h3 class="comparison-task-title">Reference Videos</h3>
        <div class="comparison-reference-videos-vertical">
          <div class="comparison-reference-video-wrapper">
            <video class="comparison-reference-video" src="./comparison/sample_12/ref0.mp4" autoplay controls></video>
          </div>
          <div class="comparison-reference-video-wrapper">
            <video class="comparison-reference-video" src="./comparison/sample_12/ref1.mp4" autoplay controls></video>
          </div>
          <div class="comparison-reference-video-wrapper">
            <video class="comparison-reference-video" src="./comparison/sample_12/ref2.mp4" autoplay controls></video>
          </div>
        </div>
      </div>

      <!-- Generated clips, one per method -->
      <div class="comparison-generated-videos-grid">
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">SadTalker</h4>
          <video class="comparison-generated-video video-tooltip"
                 src="./comparison/sample_12/sadtalker.mp4"
                 autoplay controls
                 data-tooltip="In the video, a man in a suit and tie is walking down a street with a colorful mural on the wall behind him. He appears to be engaged in a conversation with another person who is partially visible on the left side of the frame. The man in the suit has a backpack over one shoulder and seems to be gesturing or explaining something as he walks. The setting suggests an urban environment with various signs and advertisements in the background. The interaction between the two individuals seems friendly and animated."></video>
        </div>
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">Aniportrait</h4>
          <video class="comparison-generated-video video-tooltip"
                 src="./comparison/sample_12/aniportrait.mp4"
                 autoplay controls
                 data-tooltip="In the video, a man in a suit and tie is walking down a street with a colorful mural on the wall behind him. He appears to be engaged in a conversation with another person who is partially visible on the left side of the frame. The man in the suit has a backpack over one shoulder and seems to be gesturing or explaining something as he walks. The setting suggests an urban environment with various signs and advertisements in the background. The interaction between the two individuals seems friendly and animated."></video>
        </div>
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">Hallo3</h4>
          <video class="comparison-generated-video video-tooltip"
                 src="./comparison/sample_12/hallo3.mp4"
                 autoplay controls
                 data-tooltip="In the video, a man in a suit and tie is walking down a street with a colorful mural on the wall behind him. He appears to be engaged in a conversation with another person who is partially visible on the left side of the frame. The man in the suit has a backpack over one shoulder and seems to be gesturing or explaining something as he walks. The setting suggests an urban environment with various signs and advertisements in the background. The interaction between the two individuals seems friendly and animated."></video>
        </div>
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">Ours</h4>
          <video class="comparison-generated-video video-tooltip"
                 src="./comparison/sample_12/ours.mp4"
                 autoplay controls
                 data-tooltip="In the video, a man in a suit and tie is walking down a street with a colorful mural on the wall behind him. He appears to be engaged in a conversation with another person who is partially visible on the left side of the frame. The man in the suit has a backpack over one shoulder and seems to be gesturing or explaining something as he walks. The setting suggests an urban environment with various signs and advertisements in the background. The interaction between the two individuals seems friendly and animated."></video>
        </div>
      </div>
    </div>

    <!-- Sample 29: prompt text with a show/hide toggle.
         type="button" states that the control never submits a form.
         aria-controls names the panel below; presumably that is the element
         togglePrompt('sample29') shows and hides (confirm against the script). -->
    <div class="sample-section">
      <button type="button" class="prompt-toggle-btn" aria-controls="sample29-prompt" onclick="togglePrompt('sample29')" style="background-color: hsl(204, 86%, 43%);">Hide prompt</button>
      <div id="sample29-prompt" class="prompt-display" style="display: block;">
        <p>The video features two animated characters in a dimly lit, underwater-like environment with a greenish-blue hue. The character on the left is a young boy with black hair, wearing a red jacket over a white shirt and blue jeans. He appears to be speaking or reacting with an open mouth and expressive eyes. The character on the right is facing away from the camera, wearing a purple jacket and holding what looks like a piece of paper or a book. The background consists of rocky surfaces and water, suggesting they are in a cave or underground setting. The overall atmosphere is mysterious and slightly eerie.</p>
      </div>
    </div>
    <!-- Comparison for sample_29: three reference clips, then one generated clip per
         method. Every generated clip carries the sample prompt in data-tooltip. -->
    <div class="comparison-result-container">

      <!-- Reference clips (ref0..ref2) -->
      <div class="comparison-reference-section">
        <h3 class="comparison-task-title">Reference Videos</h3>
        <div class="comparison-reference-videos-vertical">
          <div class="comparison-reference-video-wrapper">
            <video class="comparison-reference-video" src="./comparison/sample_29/ref0.mp4" autoplay controls></video>
          </div>
          <div class="comparison-reference-video-wrapper">
            <video class="comparison-reference-video" src="./comparison/sample_29/ref1.mp4" autoplay controls></video>
          </div>
          <div class="comparison-reference-video-wrapper">
            <video class="comparison-reference-video" src="./comparison/sample_29/ref2.mp4" autoplay controls></video>
          </div>
        </div>
      </div>

      <!-- Generated clips, one per method -->
      <div class="comparison-generated-videos-grid">
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">SadTalker</h4>
          <video class="comparison-generated-video video-tooltip"
                 src="./comparison/sample_29/sadtalker.mp4"
                 autoplay controls
                 data-tooltip="The video features two animated characters in a dimly lit, underwater-like environment with a greenish-blue hue. The character on the left is a young boy with black hair, wearing a red jacket over a white shirt and blue jeans. He appears to be speaking or reacting with an open mouth and expressive eyes. The character on the right is facing away from the camera, wearing a purple jacket and holding what looks like a piece of paper or a book. The background consists of rocky surfaces and water, suggesting they are in a cave or underground setting. The overall atmosphere is mysterious and slightly eerie."></video>
        </div>
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">Aniportrait</h4>
          <video class="comparison-generated-video video-tooltip"
                 src="./comparison/sample_29/aniportrait.mp4"
                 autoplay controls
                 data-tooltip="The video features two animated characters in a dimly lit, underwater-like environment with a greenish-blue hue. The character on the left is a young boy with black hair, wearing a red jacket over a white shirt and blue jeans. He appears to be speaking or reacting with an open mouth and expressive eyes. The character on the right is facing away from the camera, wearing a purple jacket and holding what looks like a piece of paper or a book. The background consists of rocky surfaces and water, suggesting they are in a cave or underground setting. The overall atmosphere is mysterious and slightly eerie."></video>
        </div>
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">Hallo3</h4>
          <video class="comparison-generated-video video-tooltip"
                 src="./comparison/sample_29/hallo3.mp4"
                 autoplay controls
                 data-tooltip="The video features two animated characters in a dimly lit, underwater-like environment with a greenish-blue hue. The character on the left is a young boy with black hair, wearing a red jacket over a white shirt and blue jeans. He appears to be speaking or reacting with an open mouth and expressive eyes. The character on the right is facing away from the camera, wearing a purple jacket and holding what looks like a piece of paper or a book. The background consists of rocky surfaces and water, suggesting they are in a cave or underground setting. The overall atmosphere is mysterious and slightly eerie."></video>
        </div>
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">Ours</h4>
          <video class="comparison-generated-video video-tooltip"
                 src="./comparison/sample_29/ours.mp4"
                 autoplay controls
                 data-tooltip="The video features two animated characters in a dimly lit, underwater-like environment with a greenish-blue hue. The character on the left is a young boy with black hair, wearing a red jacket over a white shirt and blue jeans. He appears to be speaking or reacting with an open mouth and expressive eyes. The character on the right is facing away from the camera, wearing a purple jacket and holding what looks like a piece of paper or a book. The background consists of rocky surfaces and water, suggesting they are in a cave or underground setting. The overall atmosphere is mysterious and slightly eerie."></video>
        </div>
      </div>
    </div>

    <!-- Sample 98: collapsible prompt panel, followed by three reference clips and one generated clip per method. -->
    <div class="sample-section">
      <!-- The script looks this button up by its exact onclick text, and the panel by the id "sample98-prompt"; keep both in sync with the 'sample98' argument. -->
      <button class="prompt-toggle-btn" onclick="togglePrompt('sample98')" style="background-color: hsl(204, 86%, 43%);">Hide prompt</button>
      <!-- The panel starts visible (inline display: block), which is why the button above starts out labelled "Hide prompt". -->
      <div id="sample98-prompt" class="prompt-display" style="display: block;">
        <p>The video features a man in a suit, standing indoors. He is wearing a patterned blazer over a white shirt and tie. The man has a cigarette in his mouth and appears to be speaking or reacting to something. The background includes framed pictures on the wall and a candelabra on a table to the left. The setting suggests a formal or professional environment, possibly an office or a study. The lighting is soft, creating a calm and composed atmosphere.</p>
      </div>
    </div>
    <div class="comparison-result-container">
      <!-- Reference inputs for this sample: ref0, ref1 and ref2. -->
      <div class="comparison-reference-section">
        <h3 class="comparison-task-title">Reference Videos</h3>
        <div class="comparison-reference-videos-vertical">
          <div class="comparison-reference-video-wrapper">
            <video class="comparison-reference-video" src="./comparison/sample_98/ref0.mp4" autoplay  controls></video>
          </div>
          <div class="comparison-reference-video-wrapper">
            <video class="comparison-reference-video" src="./comparison/sample_98/ref1.mp4" autoplay  controls></video>
          </div>
          <div class="comparison-reference-video-wrapper">
            <video class="comparison-reference-video" src="./comparison/sample_98/ref2.mp4" autoplay  controls></video>
          </div>
        </div>
      </div>
      <!-- One item per method (SadTalker, Aniportrait, Hallo3, Ours). Each video repeats the prompt text from the panel above in its data-tooltip attribute. -->
      <div class="comparison-generated-videos-grid">
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">SadTalker</h4>
          <video class="comparison-generated-video video-tooltip" src="./comparison/sample_98/sadtalker.mp4" autoplay  controls data-tooltip="The video features a man in a suit, standing indoors. He is wearing a patterned blazer over a white shirt and tie. The man has a cigarette in his mouth and appears to be speaking or reacting to something. The background includes framed pictures on the wall and a candelabra on a table to the left. The setting suggests a formal or professional environment, possibly an office or a study. The lighting is soft, creating a calm and composed atmosphere."></video>
        </div>
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">Aniportrait</h4>
          <video class="comparison-generated-video video-tooltip" src="./comparison/sample_98/aniportrait.mp4" autoplay  controls data-tooltip="The video features a man in a suit, standing indoors. He is wearing a patterned blazer over a white shirt and tie. The man has a cigarette in his mouth and appears to be speaking or reacting to something. The background includes framed pictures on the wall and a candelabra on a table to the left. The setting suggests a formal or professional environment, possibly an office or a study. The lighting is soft, creating a calm and composed atmosphere."></video>
        </div>
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">Hallo3</h4>
          <video class="comparison-generated-video video-tooltip" src="./comparison/sample_98/hallo3.mp4" autoplay  controls data-tooltip="The video features a man in a suit, standing indoors. He is wearing a patterned blazer over a white shirt and tie. The man has a cigarette in his mouth and appears to be speaking or reacting to something. The background includes framed pictures on the wall and a candelabra on a table to the left. The setting suggests a formal or professional environment, possibly an office or a study. The lighting is soft, creating a calm and composed atmosphere."></video>
        </div>
        <div class="comparison-method-item">
          <h4 class="comparison-method-title">Ours</h4>
          <video class="comparison-generated-video video-tooltip" src="./comparison/sample_98/ours.mp4" autoplay  controls data-tooltip="The video features a man in a suit, standing indoors. He is wearing a patterned blazer over a white shirt and tie. The man has a cigarette in his mouth and appears to be speaking or reacting to something. The background includes framed pictures on the wall and a candelabra on a table to the left. The setting suggests a formal or professional environment, possibly an office or a study. The lighting is soft, creating a calm and composed atmosphere."></video>
        </div>
      </div>
    </div>

    <!-- ================ BEGIN SECTION: ablations ================ -->
    <!-- Ablation on region-selective audio CFG. The table is a 2x2 grid of clips: each label row names the clips in the row directly below it. -->
    <p>&nbsp;</p>
    <hr>

    <h2 id="comparison_with_cfg_methods_container" align="left"><a name="cfg-results" id="cfg-results"></a>Ablations on Region-Selective Audio CFG</h2>
    <table width="1024" align="center">
      <tbody>
        <tr>
          <th style="font-size: 16px; width: 50%;">w/o CFG</th>
          <th style="font-size: 16px; width: 50%;">Global CFG</th>
        </tr>
        <tr>
          <!-- NOTE(review): ".MP4" is upper-case unlike every sibling file; confirm it matches the file name on disk, because case-sensitive hosts will not serve a mismatched name. -->
          <!-- video is not a void element: each one needs an explicit end tag rather than relying on the parser closing it at the end of the cell. -->
          <th><video class="comparison-video" src="./ablations/ablate_cfg/no.MP4" autoplay controls></video></th>
          <th><video class="comparison-video" src="./ablations/ablate_cfg/cfg.mp4" autoplay controls></video></th>
        </tr>
        <tr>
          <th style="font-size: 16px">Local CFG (Ours)</th>
          <th style="font-size: 16px">Attention Map</th>
        </tr>
        <tr>
          <th><video class="comparison-video" src="./ablations/ablate_cfg/final.mp4" autoplay controls></video></th>
          <th><video class="comparison-video" src="./ablations/ablate_cfg/attn.mp4" autoplay controls></video></th>
        </tr>
        <!-- Spacer row that adds vertical room below the grid. -->
        <tr> <td><br /></td> </tr> 
      </tbody>
    </table>

    
    <!-- Ablation on decoupled audio-visual learning: two ablated variants in the first clip row, the full method in the second. -->
    <!-- This heading used to reuse the id/name of the CFG ablation heading. ids must be unique, and a fragment link resolves to the first match only, so this section gets its own anchors. -->
    <h2 id="comparison_with_decouple_methods_container" align="left"><a name="decouple-results" id="decouple-results"></a>Ablations on Decoupled Audio-Visual Learning</h2>
    <table width="1024" align="center">
      <tbody>
        <tr>
          <th style="font-size: 16px; width: 50%;">w/o audio pt.</th>
          <th style="font-size: 16px; width: 50%;">w/o decoupling</th>
        </tr>
        <tr>
          <!-- video is not a void element: each one needs an explicit end tag rather than relying on the parser closing it at the end of the cell. -->
          <th><video class="comparison-video" src="./ablations/ablate_decouple/wo_pt.mp4" autoplay controls></video></th>
          <th><video class="comparison-video" src="./ablations/ablate_decouple/wo_decouple.mp4" autoplay controls></video></th>
        </tr>
        <tr>
          <th style="font-size: 16px">Ours</th>
        </tr>
        <tr>
          <th><video class="comparison-video" src="./ablations/ablate_decouple/ours.mp4" autoplay controls></video></th>
        </tr>
        <!-- Spacer row that adds vertical room below the grid. -->
        <tr> <td><br /></td> </tr> 
      </tbody>
    </table>

</div>


<script>
// Show or hide one sample's prompt panel and restyle its toggle button to match.
//
// sampleId: prefix of the panel's element id ("<sampleId>-prompt"). The button is
// located through the literal text of its inline onclick attribute, so that
// attribute must read exactly togglePrompt('<sampleId>').
// Does nothing when either the panel or the button cannot be found.
function togglePrompt(sampleId) {
    const panel = document.getElementById(sampleId + '-prompt');
    const toggle = document.querySelector(`button[onclick="togglePrompt('${sampleId}')"]`);
    if (!(panel && toggle)) {
        return;
    }

    // The two visual states the panel/button pair can be switched into.
    const expanded = { display: 'block', label: 'Hide prompt', color: 'hsl(204, 86%, 43%)' };
    const collapsed = { display: 'none', label: 'Click to view prompt', color: 'hsl(204, 86%, 53%)' };

    // An empty inline display value is treated the same as 'none'.
    const isCollapsed = ['none', ''].includes(panel.style.display);
    const next = isCollapsed ? expanded : collapsed;

    panel.style.display = next.display;
    toggle.textContent = next.label;
    toggle.style.backgroundColor = next.color;
}

// Once the DOM is parsed, make every <video> on the page rewind to its start
// and stay paused whenever its playback reaches the end.
document.addEventListener('DOMContentLoaded', () => {
    // event.currentTarget is the video the listener was registered on.
    const rewindAndPause = (event) => {
        const player = event.currentTarget;
        player.currentTime = 0;
        player.pause();
    };

    for (const player of document.querySelectorAll('video')) {
        player.addEventListener('ended', rewindAndPause);
    }
});
</script>


<!-- Page footer: currently a placeholder whose single column has no content. -->
<footer class="footer">
  <div class="container" style="text-align: left;">
    <div class="columns is-centered">
      <div class="column is-8">
      </div>
    </div>
  </div>
</footer>
</body>
</html>
