diff --git a/parakeet/modules/audio.py b/parakeet/modules/audio.py index cfa215f..fb55e3a 100644 --- a/parakeet/modules/audio.py +++ b/parakeet/modules/audio.py @@ -71,6 +71,8 @@ def dequantize(quantized, n_bands, dtype=None): value = (paddle.cast(quantized, dtype) + 0.5) * (2.0 / n_bands) - 1.0 return value +import librosa +librosa.stft( class STFT(nn.Layer): """A module for computing stft transformation in a differentiable way. @@ -117,7 +119,11 @@ class STFT(nn.Layer): """ def __init__(self, n_fft, hop_length=None, win_length=None, window="hanning", center=True, pad_mode="reflect"): +<<<<<<< HEAD super().__init__() +======= + super(STFT, self).__init__() +>>>>>>> 6749ce40eab7c5de0ca11fe5d2fd57120b10415c # By default, use the entire frame if win_length is None: win_length = n_fft