fudan-generative-vision
diff --git a/‎src/assets/img/best_visual_results.png
2.62 MB b/‎src/assets/img/best_visual_results.png
2.62 MB
diff --git a/‎src/assets/video/ablation/exp_1.mp4
7.1 MB b/‎src/assets/video/ablation/exp_1.mp4
7.1 MB
diff --git a/‎src/assets/video/ablation/exp_2.mp4
5.54 MB b/‎src/assets/video/ablation/exp_2.mp4
5.54 MB
diff --git a/‎src/assets/video/ablation/lip_1.mp4
9.27 MB b/‎src/assets/video/ablation/lip_1.mp4
9.27 MB
diff --git a/‎src/assets/video/ablation/lip_2.mp4
9.61 MB b/‎src/assets/video/ablation/lip_2.mp4
9.61 MB
diff --git a/‎src/assets/video/ablation/pose_1.mp4
4.88 MB b/‎src/assets/video/ablation/pose_1.mp4
4.88 MB
diff --git a/‎src/assets/video/ablation/pose_2.mp4
4.18 MB b/‎src/assets/video/ablation/pose_2.mp4
4.18 MB
diff --git a/‎src/components/AbstractSection.vue
Lines changed: 9 additions & 0 deletions b/‎src/components/AbstractSection.vue
Lines changed: 9 additions & 0 deletions
diff --git a/‎src/components/TitleSection.vue
Lines changed: 2 additions & 2 deletions b/‎src/components/TitleSection.vue
Lines changed: 2 additions & 2 deletions
diff --git a/‎src/components/VideoComparision.vue
Lines changed: 8 additions & 1 deletion b/‎src/components/VideoComparision.vue
Lines changed: 8 additions & 1 deletion
diff --git a/‎src/index.json
Lines changed: 35 additions & 4 deletions b/‎src/index.json
Lines changed: 35 additions & 4 deletions
@@ -2,6 +2,9 @@
     <section class="abstract">
         <div>
             <h3>Abstract</h3>
+            <div v-if="figure" class="figure">
+                <img :src="figure" alt="Figure accompanying the abstract"> <!-- alt text keeps the image accessible to screen readers -->
+            </div>
             <p>{{ props.content }}</p>
         </div>
     </section>
@@ -10,8 +13,10 @@
 <script setup lang="ts">
 interface Props {
     content?: string
+    figure?: string // optional image path; it is resolved as `../<figure>` against this module's URL below
 }
 const { props } = defineProps<{ props: Props }>()
+const figure = props.figure ? new URL(`../${props.figure}`, import.meta.url).href : "" // resolved figure URL, or "" when no figure is given (the template's v-if then hides the image)
 
 </script>
 
@@ -31,6 +36,10 @@ const { props } = defineProps<{ props: Props }>()
     }
 }
 
+.figure { /* wrapper around the optional abstract image */
+    margin: 1rem 0; /* vertical spacing only; no horizontal margin */
+}
+
 p {
     white-space: pre-line;
 }
 
@@ -11,7 +11,7 @@
                         }}</a>
                     <span class="author-name" v-else>{{ author.name }}</span>
                     <sup v-if="author.suffix">{{ author.suffix }}</sup>
-                    <span v-if="i < authorsItem.length - 1">, </span>
+                    <span v-if="i < authorsItem.length - 1">&nbsp;&nbsp;&nbsp;&nbsp;</span>
                 </span>
             </div>
         </div>
@@ -37,7 +37,7 @@
             </a>
         </div>
 
-        <video v-lazy :src="mainVideo" muted loop controls></video>
+        <video v-if="mainVideo" v-lazy :src="mainVideo" muted loop controls></video>
     </section>
 </template>
 
 
@@ -1,6 +1,7 @@
 <template>
     <section>
-        <h3>{{ title }}</h3>
+        <h3 v-if="title">{{ title }}</h3>
+        <h4 v-if="subtitle">{{ subtitle }}</h4>
         <div class="panel">
             <div ref="carouselElement" :id="id" class="relative" data-twe-carousel-init data-twe-carousel-slide
                 data-twe-ride="carousel" data-twe-interval="9999999">
@@ -60,10 +61,12 @@
 interface Props {
     id?: string
     title?: string
+    subtitle?: string // optional secondary heading, rendered in an <h4> when non-empty
     items?: string[][]
 }
 const { props } = defineProps<{ props: Props }>()
 const title = props.title || ''
+const subtitle = props.subtitle || ''
 const items = (props.items || []).map(v => v.map(sub => new URL(`../${sub}`, import.meta.url).href))
-const id = props.id || title.replaceAll(" ", "")
+const id = props.id || (title || subtitle).replaceAll(" ", "") // fall back to the subtitle so sections with an empty title still get a non-empty, distinct carousel id
 
@@ -122,6 +125,10 @@ section {
     }
 }
 
+h4 { /* styles the optional subtitle heading */
+    @apply text-lg mb-3
+}
+
 .video-group {
     video {
         width: 49%;
 
@@ -88,12 +88,13 @@
                 "github": "https://github.com/fudan-generative-vision/hallo",
                 "huggingface": "https://huggingface.co/fudan-generative-ai/hallo"
             },
-            "mainVideo": "assets/video/main_video.mp4"
+            "mainVideo": ""
         }
     },
     {
         "template": "abstract",
         "props": {
+            "figure": "assets/img/best_visual_results.png",
             "content": "The field of portrait image animation, driven by speech audio input, has experienced significant advancements in the generation of realistic and dynamic portraits. This research delves into the complexities of synchronizing facial movements and creating visually appealing, temporally consistent animations within the framework of diffusion-based methodologies. Moving away from traditional paradigms that rely on parametric models for intermediate facial representations, our innovative approach embraces the end-to-end diffusion paradigm and introduces a hierarchical audio-driven visual synthesis module to enhance the precision of alignment between audio inputs and visual outputs, encompassing lip, expression, and pose motion. Our proposed network architecture seamlessly integrates diffusion-based generative models, a UNet-based denoiser, temporal alignment techniques, and a reference network. The proposed hierarchical audio-driven visual synthesis offers adaptive control over expression and pose diversity, enabling more effective personalization tailored to different identities. Through a comprehensive evaluation that incorporates both qualitative and quantitative analyses, our approach demonstrates obvious enhancements in image and video quality, lip synchronization precision, and motion diversity."
         }
     },
@@ -105,11 +106,41 @@
         }
     },
     {
-        "template": "single-video",
+        "template": "video-comparision",
         "props": {
-            "title": "Cross-ID Showcase",
+            "title": "Ablation Study-Motion Scale Control",
+            "subtitle": "Lip Control",
             "items": [
-                "assets/video/singing/1.mp4"
+                [
+                    "assets/video/ablation/lip_1.mp4",
+                    "assets/video/ablation/lip_2.mp4"
+                ]
+            ]
+        }
+    },
+    {
+        "template": "video-comparision",
+        "props": {
+            "title": "",
+            "subtitle": "Expression Control",
+            "items": [
+                [
+                    "assets/video/ablation/exp_1.mp4",
+                    "assets/video/ablation/exp_2.mp4"
+                ]
+            ]
+        }
+    },
+    {
+        "template": "video-comparision",
+        "props": {
+            "title": "",
+            "subtitle": "Pose Control",
+            "items": [
+                [
+                    "assets/video/ablation/pose_1.mp4",
+                    "assets/video/ablation/pose_2.mp4"
+                ]
             ]
         }
     },