Skip to content

Commit f9ffeb8

Browse files
committed
Use latest version of F5-TTS
1 parent 39bb860 commit f9ffeb8

File tree

3 files changed, with 27 additions and 7 deletions.

3 files changed

+27
-7
lines changed

F5TTS.py

Lines changed: 25 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -139,7 +139,14 @@ def get_vocab_file(self):
139139

140140
def load_e2_model(self, vocoder):
141141
model_cls = UNetT
142-
model_cfg = dict(dim=1024, depth=24, heads=16, ff_mult=4)
142+
model_cfg = dict(
143+
dim=1024,
144+
depth=24,
145+
heads=16,
146+
ff_mult=4,
147+
text_mask_padding=False,
148+
pe_attn_head=1,
149+
)
143150
repo_name = "E2-TTS"
144151
exp_name = "E2TTS_Base"
145152
ckpt_step = 1200000
@@ -219,8 +226,15 @@ def cached_path(self, url):
219226

220227
def load_f5_model_hi(self, vocoder):
221228
model_cfg = dict(
222-
dim=768, depth=18, heads=12,
223-
ff_mult=2, text_dim=512, conv_layers=4
229+
dim=768,
230+
depth=18,
231+
heads=12,
232+
ff_mult=2,
233+
text_dim=512,
234+
text_mask_padding=False,
235+
conv_layers=4,
236+
pe_attn_head=1,
237+
checkpoint_activations=False,
224238
)
225239
return self.load_f5_model_url(
226240
"hf://SPRINGLab/F5-Hindi-24KHz/model_2500000.safetensors",
@@ -236,8 +250,14 @@ def load_f5_model_url(
236250
model_cls = DiT
237251
if model_cfg is None:
238252
model_cfg = dict(
239-
dim=1024, depth=22, heads=16,
240-
ff_mult=2, text_dim=512, conv_layers=4
253+
dim=1024,
254+
depth=22,
255+
heads=16,
256+
ff_mult=2,
257+
text_dim=512,
258+
text_mask_padding=False,
259+
conv_layers=4,
260+
pe_attn_head=1,
241261
)
242262

243263
ckpt_file = str(self.cached_path(url)) # noqa E501

pyproject.toml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
[project]
22
name = "comfyui-f5-tts"
33
description = "Text to speech with F5-TTS"
4-
version = "1.0.18"
4+
version = "1.0.19"
55
license = {text = "MIT License"}
66

77
[project.urls]

0 commit comments

Comments (0)