Skip to content

Commit 2b6076b

Browse files
committed
update
1 parent 614c905 commit 2b6076b

File tree

11 files changed

+54
-7
lines changed

11 files changed

+54
-7
lines changed
2.62 MB
Loading

src/assets/video/ablation/exp_1.mp4

7.1 MB
Binary file not shown.

src/assets/video/ablation/exp_2.mp4

5.54 MB
Binary file not shown.

src/assets/video/ablation/lip_1.mp4

9.27 MB
Binary file not shown.

src/assets/video/ablation/lip_2.mp4

9.61 MB
Binary file not shown.

src/assets/video/ablation/pose_1.mp4

4.88 MB
Binary file not shown.

src/assets/video/ablation/pose_2.mp4

4.18 MB
Binary file not shown.

src/components/AbstractSection.vue

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,9 @@
22
<section class="abstract">
33
<div>
44
<h3>Abstract</h3>
5+
<div v-if="figure" class="figure">
6+
<img :src="figure">
7+
</div>
58
<p>{{ props.content }}</p>
69
</div>
710
</section>
@@ -10,8 +13,10 @@
1013
<script setup lang="ts">
1114
interface Props {
1215
content?: string
16+
figure?: string
1317
}
1418
const { props } = defineProps<{ props: Props }>()
19+
const figure = props.figure ? new URL(`../${props.figure}`, import.meta.url).href : ""
1520
1621
</script>
1722

@@ -31,6 +36,10 @@ const { props } = defineProps<{ props: Props }>()
3136
}
3237
}
3338
39+
.figure {
40+
margin: 1rem 0;
41+
}
42+
3443
p {
3544
white-space: pre-line;
3645
}

src/components/TitleSection.vue

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@
1111
}}</a>
1212
<span class="author-name" v-else>{{ author.name }}</span>
1313
<sup v-if="author.suffix">{{ author.suffix }}</sup>
14-
<span v-if="i < authorsItem.length - 1">, </span>
14+
<span v-if="i < authorsItem.length - 1">&nbsp;&nbsp;&nbsp;&nbsp;</span>
1515
</span>
1616
</div>
1717
</div>
@@ -37,7 +37,7 @@
3737
</a>
3838
</div>
3939

40-
<video v-lazy :src="mainVideo" muted loop controls></video>
40+
<video v-if="mainVideo" v-lazy :src="mainVideo" muted loop controls></video>
4141
</section>
4242
</template>
4343

src/components/VideoComparision.vue

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,7 @@
11
<template>
22
<section>
3-
<h3>{{ title }}</h3>
3+
<h3 v-if="title">{{ title }}</h3>
4+
<h4 v-if="subtitle">{{ subtitle }}</h4>
45
<div class="panel">
56
<div ref="carouselElement" :id="id" class="relative" data-twe-carousel-init data-twe-carousel-slide
67
data-twe-ride="carousel" data-twe-interval="9999999">
@@ -60,10 +61,12 @@
6061
interface Props {
6162
id?: string
6263
title?: string
64+
subtitle?: string
6365
items?: string[][]
6466
}
6567
const { props } = defineProps<{ props: Props }>()
6668
const title = props.title || ''
69+
const subtitle = props.subtitle || ''
6770
const items = (props.items || []).map(v => v.map(sub => new URL(`../${sub}`, import.meta.url).href))
6871
const id = props.id || title.replaceAll(" ", "")
6972
@@ -122,6 +125,10 @@ section {
122125
}
123126
}
124127
128+
h4 {
129+
@apply text-lg mb-3
130+
}
131+
125132
.video-group {
126133
video {
127134
width: 49%;

src/index.json

Lines changed: 35 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -88,12 +88,13 @@
8888
"github": "https://github.com/fudan-generative-vision/hallo",
8989
"huggingface": "https://huggingface.co/fudan-generative-ai/hallo"
9090
},
91-
"mainVideo": "assets/video/main_video.mp4"
91+
"mainVideo": ""
9292
}
9393
},
9494
{
9595
"template": "abstract",
9696
"props": {
97+
"figure": "assets/img/best_visual_results.png",
9798
"content": "The field of portrait image animation, driven by speech audio input, has experienced significant advancements in the generation of realistic and dynamic portraits. This research delves into the complexities of synchronizing facial movements and creating visually appealing, temporally consistent animations within the framework of diffusion-based methodologies. Moving away from traditional paradigms that rely on parametric models for intermediate facial representations, our innovative approach embraces the end-to-end diffusion paradigm and introduces a hierarchical audio-driven visual synthesis module to enhance the precision of alignment between audio inputs and visual outputs, encompassing lip, expression, and pose motion. Our proposed network architecture seamlessly integrates diffusion-based generative models, a UNet-based denoiser, temporal alignment techniques, and a reference network. The proposed hierarchical audio-driven visual synthesis offers adaptive control over expression and pose diversity, enabling more effective personalization tailored to different identities. Through a comprehensive evaluation that incorporates both qualitative and quantitative analyses, our approach demonstrates obvious enhancements in image and video quality, lip synchronization precision, and motion diversity."
9899
}
99100
},
@@ -105,11 +106,41 @@
105106
}
106107
},
107108
{
108-
"template": "single-video",
109+
"template": "video-comparision",
109110
"props": {
110-
"title": "Cross-ID Showcase",
111+
"title": "Ablation Study-Motion Scale Control",
112+
"subtitle": "Lip Control",
111113
"items": [
112-
"assets/video/singing/1.mp4"
114+
[
115+
"assets/video/ablation/lip_1.mp4",
116+
"assets/video/ablation/lip_2.mp4"
117+
]
118+
]
119+
}
120+
},
121+
{
122+
"template": "video-comparision",
123+
"props": {
124+
"title": "",
125+
"subtitle": "Expression Control",
126+
"items": [
127+
[
128+
"assets/video/ablation/exp_1.mp4",
129+
"assets/video/ablation/exp_2.mp4"
130+
]
131+
]
132+
}
133+
},
134+
{
135+
"template": "video-comparision",
136+
"props": {
137+
"title": "",
138+
"subtitle": "Pose Control",
139+
"items": [
140+
[
141+
"assets/video/ablation/pose_1.mp4",
142+
"assets/video/ablation/pose_2.mp4"
143+
]
113144
]
114145
}
115146
},

0 commit comments

Comments
 (0)