From 58966a66989fc4a4949eaf85641bc525b03a5025 Mon Sep 17 00:00:00 2001
From: Eric Lam
Date: Mon, 22 Jan 2024 17:47:46 +0000
Subject: [PATCH 1/2] change default win_duration to 5.0

---
 dac/model/base.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/dac/model/base.py b/dac/model/base.py
index 546b3cb..1fa4d95 100644
--- a/dac/model/base.py
+++ b/dac/model/base.py
@@ -126,7 +126,7 @@ def get_output_length(self, input_length):
     def compress(
         self,
         audio_path_or_signal: Union[str, Path, AudioSignal],
-        win_duration: float = 1.0,
+        win_duration: float = 5.0,
         verbose: bool = False,
         normalize_db: float = -16,
         n_quantizers: int = None,
From 1beee4412b0b0fd3bf74219d58083d5bde64601b Mon Sep 17 00:00:00 2001
From: Eric Lam
Date: Tue, 23 Jan 2024 10:19:40 +0000
Subject: [PATCH 2/2] merge fix DecoderBlock bug

---
Review notes (ignored by git am):

The transposed convolution in this hunk uses kernel_size=2 * stride and
padding=ceil(stride / 2). With dilation 1 its output length is

    (L_in - 1) * stride - 2 * padding + (kernel_size - 1) + output_padding + 1

which reduces to L_in * stride + output_padding for an even stride and to
L_in * stride - 1 + output_padding for an odd stride. Only odd strides are
one sample short, so output_padding is derived from the stride parity
instead of being hard-coded to 1 (a constant 1 would add a spurious sample
for every even stride).

The leading whitespace of the context lines below was reconstructed by
hand; verify it against dac/model/base.py and dac/model/dac.py before
applying. The post-image blob hash on the index line predates this edit.

 dac/model/dac.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/dac/model/dac.py b/dac/model/dac.py
index eb754b2..5aabbda 100644
--- a/dac/model/dac.py
+++ b/dac/model/dac.py
@@ -102,6 +102,7 @@ def __init__(self, input_dim: int = 16, output_dim: int = 8, stride: int = 1):
                 kernel_size=2 * stride,
                 stride=stride,
                 padding=math.ceil(stride / 2),
+                output_padding=stride % 2,  # https://github.com/descriptinc/descript-audio-codec/pull/44/files
             ),
             ResidualUnit(output_dim, dilation=1),
             ResidualUnit(output_dim, dilation=3),