add demo and tutorials
This commit is contained in:
parent
c321fcd098
commit
4fde5c7e64
|
@ -1,2 +1,143 @@
|
||||||
Audio Sample
|
Audio Sample
|
||||||
==================
|
==================
|
||||||
|
|
||||||
|
TTS audio samples
|
||||||
|
-------------------
|
||||||
|
|
||||||
|
Audio samples generated by a TTS system. Text is first transformed into a spectrogram
|
||||||
|
by a text-to-spectrogram model, then the spectrogram is converted into raw audio by
|
||||||
|
a vocoder.
|
||||||
|
|
||||||
|
.. raw:: html
|
||||||
|
|
||||||
|
<embed>
|
||||||
|
<table>
|
||||||
|
<tr>
|
||||||
|
<th align="left"> TransformerTTS + WaveFlow</th>
|
||||||
|
<th align="left"> Tacotron2 + WaveFlow </th>
|
||||||
|
</tr>
|
||||||
|
<tr>
|
||||||
|
<td>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_1.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_2.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_3.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_4.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_5.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_6.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_7.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_8.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_9.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
</td>
|
||||||
|
<td>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_1.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_2.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_3.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_4.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_5.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_6.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_7.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_8.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
<audio controls="controls">
|
||||||
|
<source
|
||||||
|
src="https://paddlespeech.bj.bcebos.com/Parakeet/tacotron2_ljspeech_waveflow_samples_0.2/sentence_9.wav"
|
||||||
|
type="audio/wav">
|
||||||
|
Your browser does not support the <code>audio</code> element.
|
||||||
|
</audio>
|
||||||
|
</td>
|
||||||
|
</tr>
|
||||||
|
</table>
|
||||||
|
</embed>
|
||||||
|
|
||||||
|
|
||||||
|
Vocoder audio samples
|
||||||
|
--------------------------
|
||||||
|
|
||||||
|
Audio samples generated from ground-truth spectrograms with a vocoder.
|
||||||
|
|
||||||
|
|
||||||
|
|
|
@ -25,7 +25,7 @@ The code below show how to use a transformer_tts model. After loading the pretra
|
||||||
>>> from parakeet.models import TransformerTTS
|
>>> from parakeet.models import TransformerTTS
|
||||||
>>> from pathlib import Path
|
>>> from pathlib import Path
|
||||||
>>> import yacs
|
>>> import yacs
|
||||||
|
>>>
|
||||||
>>> # load the pretrained model
|
>>> # load the pretrained model
|
||||||
>>> frontend = English()
|
>>> frontend = English()
|
||||||
>>> checkpoint_dir = Path("transformer_tts_pretrained")
|
>>> checkpoint_dir = Path("transformer_tts_pretrained")
|
||||||
|
@ -61,12 +61,7 @@ Like the example above, after loading the pretrained ConditionalWaveFlow model,
|
||||||
|
|
||||||
For more details on how to use the model, please refer to the documentation.
|
For more details on how to use the model, please refer to the documentation.
|
||||||
|
|
||||||
.. raw:: html
|
|
||||||
|
|
||||||
<audio controls="controls">
|
|
||||||
<source src="https://paddlespeech.bj.bcebos.com/Parakeet/transformer_tts_ljspeech_griffin-lim_samples_1.0/step_120000_sentence_0.wav" type="audio/wav">
|
|
||||||
Your browser does not support the <code>audio</code> element.
|
|
||||||
</audio>
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue